openjdk.rb 4.0 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152
  1. module Docs
  2. class Openjdk < FileScraper
  3. self.name = 'OpenJDK'
  4. self.type = 'openjdk'
  5. self.root_path = 'overview-summary.html'
  6. self.links = {
  7. home: 'https://openjdk.java.net/',
  8. code: 'https://github.com/openjdk/jdk'
  9. }
  10. html_filters.insert_after 'internal_urls', 'openjdk/clean_urls'
  11. options[:skip_patterns] = [
  12. /compact[123]-/,
  13. /package-frame\.html/,
  14. /package-tree\.html/,
  15. /package-use\.html/,
  16. /class-use\//,
  17. /doc-files\//,
  18. /\.svg/,
  19. /\.png/
  20. ]
  21. options[:only_patterns] = [
  22. /\Ajava\./,
  23. /\Ajdk\./
  24. ]
  25. options[:attribution] = <<-HTML
  26. &copy; 1993, 2022, Oracle and/or its affiliates. All rights reserved.<br>
  27. Documentation extracted from Debian's OpenJDK Development Kit package.<br>
  28. Licensed under the GNU General Public License, version 2, with the Classpath Exception.<br>
  29. Various third party code in OpenJDK is licensed under different licenses (see Debian package).<br>
  30. Java and OpenJDK are trademarks or registered trademarks of Oracle and/or its affiliates.
  31. HTML
  32. NEWFILTERS = ['openjdk/entries_new', 'openjdk/clean_html_new']
  33. version '18' do
  34. self.release = '18'
  35. self.root_path = 'index.html'
  36. self.base_url = 'https://docs.oracle.com/en/java/javase/18/docs/api/'
  37. html_filters.push NEWFILTERS
  38. options[:container] = 'main'
  39. end
  40. version '17' do
  41. self.release = '17'
  42. self.root_path = 'index.html'
  43. self.base_url = 'https://docs.oracle.com/en/java/javase/17/docs/api/'
  44. html_filters.push NEWFILTERS
  45. options[:container] = 'main'
  46. end
  47. OLDFILTERS = ['openjdk/entries', 'openjdk/clean_html']
  48. version '11' do
  49. self.release = '11.0.11'
  50. self.root_path = 'index.html'
  51. self.base_url = 'https://docs.oracle.com/en/java/javase/11/docs/api/'
  52. html_filters.push OLDFILTERS
  53. end
  54. version '8' do
  55. self.release = '8'
  56. self.base_url = 'https://docs.oracle.com/javase/8/docs/api/'
  57. html_filters.push OLDFILTERS
  58. options[:only_patterns] = [
  59. /\Ajava\/beans\//,
  60. /\Ajava\/io\//,
  61. /\Ajava\/lang\//,
  62. /\Ajava\/math\//,
  63. /\Ajava\/net\//,
  64. /\Ajava\/nio\//,
  65. /\Ajava\/security\//,
  66. /\Ajava\/text\//,
  67. /\Ajava\/time\//,
  68. /\Ajava\/util\//,
  69. /\Ajavax\/annotation\//,
  70. /\Ajavax\/crypto\//,
  71. /\Ajavax\/imageio\//,
  72. /\Ajavax\/lang\//,
  73. /\Ajavax\/management\//,
  74. /\Ajavax\/naming\//,
  75. /\Ajavax\/net\//,
  76. /\Ajavax\/print\//,
  77. /\Ajavax\/script\//,
  78. /\Ajavax\/security\//,
  79. /\Ajavax\/sound\//,
  80. /\Ajavax\/tools\//
  81. ]
  82. end
  83. version '8 GUI' do
  84. self.release = '8'
  85. self.base_url = 'https://docs.oracle.com/javase/8/docs/api/'
  86. html_filters.push OLDFILTERS
  87. options[:only_patterns] = [
  88. /\Ajava\/awt\//,
  89. /\Ajavax\/swing\//
  90. ]
  91. end
  92. version '8 Web' do
  93. self.release = '8'
  94. self.base_url = 'https://docs.oracle.com/javase/8/docs/api/'
  95. html_filters.push OLDFILTERS
  96. options[:only_patterns] = [
  97. /\Ajava\/applet\//,
  98. /\Ajava\/rmi\//,
  99. /\Ajava\/sql\//,
  100. /\Ajavax\/accessibility\//,
  101. /\Ajavax\/activation\//,
  102. /\Ajavax\/activity\//,
  103. /\Ajavax\/jws\//,
  104. /\Ajavax\/rmi\//,
  105. /\Ajavax\/sql\//,
  106. /\Ajavax\/transaction\//,
  107. /\Ajavax\/xml\//,
  108. /\Aorg\/ietf\//,
  109. /\Aorg\/omg\//,
  110. /\Aorg\/w3c\//,
  111. /\Aorg\/xml\//]
  112. end
  113. # Monkey patch to properly read HTML files encoded in ISO-8859-1
  114. def read_file(path)
  115. File.read(path).force_encoding('iso-8859-1').encode('utf-8') rescue nil
  116. end
  117. def get_latest_version(opts)
  118. doc = fetch_doc("https://jdk.java.net/archive/", opts)
  119. version = doc.at_css('#downloads > table > tr > th').content
  120. version.gsub!(/\(.*\)/, '')
  121. version.gsub!(/[a-zA-z]/, '')
  122. version
  123. end
  124. end
  125. end