| 123456789101112131415161718192021222324252627282930313233343536373839404142 |
- module Docs
- class C < FileScraper
- self.type = 'c'
- self.base_url = 'http://en.cppreference.com/w/c/'
- self.root_path = 'header.html'
- html_filters.insert_before 'clean_html', 'c/fix_code'
- html_filters.push 'c/entries', 'c/clean_html', 'title'
- text_filters.push 'c/fix_urls'
- options[:decode_and_clean_paths] = true
- options[:container] = '#content'
- options[:title] = false
- options[:root_title] = 'C Programming Language'
- options[:skip] = %w(language/history.html)
- options[:skip_patterns] = [/experimental/]
- options[:fix_urls] = ->(url) do
- url.sub! %r{\A.+/http%3A/}, 'http://'
- url.sub! 'http://en.cppreference.com/upload.cppreference.com', 'http://upload.cppreference.com'
- url
- end
- options[:attribution] = <<-HTML
- © cppreference.com<br>
- Licensed under the Creative Commons Attribution-ShareAlike Unported License v3.0.
- HTML
- def get_latest_version(opts)
- doc = fetch_doc('https://en.cppreference.com/w/Cppreference:Archives', opts)
- link = doc.at_css('a[title^="File:"]')
- date = link.content.scan(/(\d+)\./)[0][0]
- DateTime.strptime(date, '%Y%m%d').to_time.to_i
- end
- private
- def file_path_for(*)
- URI.unescape(super)
- end
- end
- end
|