devdocs/lib/docs/scrapers/mdn/html.rb
2024-08-20 20:25:09 +02:00

32 lines
1 KiB
Ruby

module Docs
  # Scraper configuration for the HTML section of MDN
  # (https://developer.mozilla.org/en-US/docs/Web/HTML).
  class Html < Mdn
    prepend FixInternalUrlsBehavior

    # release = '2024-08-20'
    self.name = 'HTML'
    self.base_url = 'https://developer.mozilla.org/en-US/docs/Web/HTML'
    self.links = {
      home: 'https://developer.mozilla.org/en-US/docs/Web/HTML',
      code: 'https://github.com/mdn/content/tree/main/files/en-us/web/html'
    }

    html_filters.push('html/clean_html', 'html/entries')

    options[:root_title] = 'HTML'

    # Path replacement table: every heading element path (h1 through h6) maps
    # to the single Heading_Elements path, and the percent-encoded "data-%2A"
    # attribute path maps to its literal "data-*" form.
    # NOTE(review): how the table is applied is decided by the code that reads
    # options[:replace_paths], which is not visible here.
    path_replacements = (1..6).each_with_object({}) do |level, table|
      table["/Element/h#{level}"] = '/Element/Heading_Elements'
    end
    path_replacements['/Global_attributes/data-%2A'] = '/Global_attributes/data-*'
    options[:replace_paths] = path_replacements

    # URL fixer: swaps the first occurrence of the ".../docs/HTML/" prefix for
    # "<base_url>/" unless the URL mentions Content_categories. The given
    # string is modified in place (sub!) and then returned.
    legacy_prefix = 'https://developer.mozilla.org/en-US/docs/HTML/'
    options[:fix_urls] = lambda do |url|
      unless url.include?('Content_categories')
        url.sub!(legacy_prefix, "#{Html.base_url}/")
      end
      url
    end
  end
end