185 lines
7.5 KiB
Ruby
185 lines
7.5 KiB
Ruby
# frozen_string_literal: true
|
|
|
|
URL = "https://outline-rocks.github.io/wcag/translations/WCAG21-de/"
|
|
WCAG_22_EN_URL ="https://www.w3.org/TR/WCAG22/"
|
|
WCAG_22_EN_QREF_URL = "https://www.w3.org/WAI/WCAG22/quickref/"
|
|
|
|
def translate(input)
|
|
DeepL.translate(input, "EN", "DE")
|
|
end
|
|
|
|
def import_wcag22en
|
|
doc = Nokogiri::HTML5(URI.open(WCAG_22_EN_URL))
|
|
qrefdoc = Nokogiri::HTML5(URI.open(WCAG_22_EN_QREF_URL))
|
|
quick_criteria = qrefdoc.css(".guidelines section:has(h4)").each_with_object({}) do |node, h|
|
|
h[node.css("h4 strong").first.content] = {
|
|
quick_criterion_en: node.css(".sc-content .sc-text p").first.content,
|
|
link_url: node.css(".understanding a").first.attribute("href").value,
|
|
perm_url: "#{WCAG_22_EN_QREF_URL}##{node.css("article").first.attribute("id").value}"
|
|
}
|
|
rescue
|
|
debugger
|
|
end
|
|
link_category = LinkCategory.find_by(name: "Verstehen")
|
|
qr_category = LinkCategory.find_by(name: "WCAG Quick Reference")
|
|
# debugger
|
|
# raise ActiveRecord::Rollback
|
|
|
|
standards = [ Standard.find_by(name_de: "WCAG 2.2"), Standard.find_by(name_de: "EN 301 549") ]
|
|
doc.css("section.principle").each do |principle_node|
|
|
_principle_id = principle_node.attributes["id"].value
|
|
principle_title = principle_node.css("h2").first.content.scan(/([a-zA-Z]+)/)
|
|
principle = Principle.find_or_create_by!(name_en: principle_title)
|
|
|
|
principle_node.css("section.guideline").each do |guideline_node|
|
|
next unless guideline_node.css("h3").first
|
|
|
|
puts guideline_node.css("h3").first&.content
|
|
puts guideline_node.css_path
|
|
|
|
g_title = guideline_node.css("h3")
|
|
.first
|
|
.content
|
|
.scan(/Guideline \d+\.\d+ (.*)/)
|
|
.first
|
|
.first
|
|
g_number = guideline_node.css("h3 bdi")
|
|
.first
|
|
.content
|
|
.scan(/\d+\.(\d+)/)
|
|
.first
|
|
.first
|
|
g_text = guideline_node.css("> p").first.content
|
|
|
|
guideline = Guideline.find_or_create_by(principle: principle, number: g_number, name_en: g_title)
|
|
guideline.update(description_en: g_text, description_de: translate(g_text), name_de: translate(g_title)) if guideline.description_de.blank?
|
|
|
|
guideline_node.css("section.guideline").each do |sc|
|
|
puts sc.css_path
|
|
puts sc.css("h4 bdi")
|
|
sc_number, sc_title = sc.css("h4")
|
|
.first
|
|
.content
|
|
.scan(/Success Criterion \d+\.\d+\.(\d+) (.*)/)
|
|
.first
|
|
sc_level = sc.css("p.conformance-level").first&.content&.scan(/\(Level (A+)\)/)&.first&.last
|
|
sc_url = sc.css("a.self-link").first.attr("href")
|
|
sc_conformity_notice = sc.css("div.note p").to_a.map(&:to_s).join("\n")
|
|
full_text = sc.children
|
|
.select { _1.class == Nokogiri::XML::Element }
|
|
.select { _1.attr("class").nil? || _1.attr("class") == "note" }
|
|
.reduce("") { |str, node| str + node.to_s }
|
|
|
|
check = Check.find_or_initialize_by(guideline_id: guideline.id, number: sc_number)
|
|
new_standards = Set.new(check.standards)
|
|
new_standards += standards
|
|
check.name_de = translate sc_title if check.name_de.blank?
|
|
check.name_en = sc_title
|
|
check.standards = new_standards
|
|
check.applicable_to_app = check.applicable_to_web = true
|
|
check.external_url = "#{WCAG_22_EN_URL}#{sc_url}"
|
|
check.conformity_level = sc_level&.to_sym
|
|
check.conformity_notice_de = translate sc_conformity_notice
|
|
check.criterion_de = "<div>#{translate full_text}</div>".gsub('href="#', %(href="#{WCAG_22_EN_URL}#)) if check.criterion_de.blank?
|
|
qref_attrs = quick_criteria["#{principle.id}.#{guideline.number}.#{sc_number}"]
|
|
check.quick_criterion_en = qref_attrs&.dig :quick_criterion_en
|
|
check.quick_criterion_de = qref_attrs&.dig :quick_criterion_en
|
|
|
|
if qref_attrs&.dig(:link_url)
|
|
link = Link.find_or_create_by(link_category:, url: qref_attrs[:link_url])
|
|
link.update(text: "#{check.full_number} Verstehen")
|
|
check.links << link
|
|
end
|
|
|
|
if qref_attrs&.dig(:perm_url)
|
|
link = Link.find_or_create_by(link_category: qr_category, url: qref_attrs[:perm_url])
|
|
link.update(text: "#{check.full_number} Quick Reference")
|
|
check.links << link
|
|
end
|
|
# check.criterion_details_en = qref_attrs&.dig :criterion_details_en
|
|
# check.criterion_details_de = qref_attrs&.dig :criterion_details_en
|
|
check.save!
|
|
end
|
|
end
|
|
end
|
|
@output
|
|
end
|
|
|
|
def import_wcag21de
|
|
doc = Nokogiri::HTML5(URI.open(URL))
|
|
|
|
standard = Standard.find_by(name_de: "WCAG 2.1")
|
|
|
|
doc.css("section.principle").each do |principle_node|
|
|
_principle_id = principle_node.attributes["id"].value
|
|
principle_title = principle_node.css("h2").first.content.scan(/[\d\.]+ ([a-zA-ZöäüÖÄÜ]+)/)
|
|
principle = Principle.find_by!(name_de: principle_title)
|
|
|
|
principle_node.css("section.guideline").each do |guideline_node|
|
|
# puts guideline_node.attr("id")
|
|
# puts guideline_node.css("h3").size
|
|
# next unless guideline_node.css("h3").first
|
|
|
|
guideline_title = guideline_node.css("h3").first.content
|
|
guideline_text = guideline_node.css("p").first
|
|
|
|
guideline_number = guideline_title.scan(/Richtlinie \d+\.(\d+).*/).first.last
|
|
# guideline = principle.guidelines.find_or_create_by(number: guideline_number)
|
|
# guideline.title = guideline_title.scan(/Richtlinie \d+\.\d+(.*)/).first.last
|
|
# guideline.text = guideline_text
|
|
|
|
# guideline.save!
|
|
|
|
guideline_node.css("section.sc").each do |sc|
|
|
sc_title = sc.css("h4").first.content.scan(/Erfolgskriterium \d+\.\d+\.\d+ (.*)/).first.last
|
|
sc_number = sc.css("h4").first.content.scan(/Erfolgskriterium (\d+\.\d+\.\d+).*/).first.last
|
|
sc_level = sc.css("p").first.content.scan(/\(Stufe (A+)\)/).first.last
|
|
sc_url = sc.css("h4 a.self-link").first.attr("href")
|
|
sc_conformity_notice = sc.css("div.note p").first&.content
|
|
text = "<div>#{guideline_text}<br>#{sc.css('p')[1]}"
|
|
text += "<p>#{sc.css('dl').first&.to_s}</p>" if sc.css("dl").first
|
|
|
|
|
|
# _sc_number = sc_title.scan(/Erfolgskriterium \d+\.\d+\.(\d+).*/).first.last
|
|
|
|
check = Check.find_or_initialize_by(external_number: sc_number)
|
|
check.name_de = sc_title
|
|
check.principle = principle
|
|
check.standards << standard unless check.standards.include?(standard)
|
|
check.applicable_to_app = check.applicable_to_web = true
|
|
check.external_number = sc_number
|
|
check.external_url = "#{URL}#{sc_url}"
|
|
check.conformity_level = sc_level.to_sym
|
|
check.conformity_notice_de = sc_conformity_notice
|
|
check.criterion_de = "#{text}</div>".gsub('href="#', %(href="#{URL}#))
|
|
check.save!
|
|
end
|
|
end
|
|
end
|
|
@output
|
|
end
|
|
|
|
namespace :import do
|
|
desc "Import WCAG2.1 in german"
|
|
task wcag21de: :environment do
|
|
Check.transaction do
|
|
import_wcag21de
|
|
# raise ActiveRecord::Rollback
|
|
end
|
|
end
|
|
|
|
desc "Import WCAG2.2 in english"
|
|
task wcag22en: :environment do
|
|
Check.transaction do
|
|
import_wcag22en
|
|
# raise ActiveRecord::Rollback
|
|
end
|
|
end
|
|
|
|
desc "Import EN 301 549"
|
|
task en301549de: :environment do
|
|
Check.transaction do
|
|
import_en301549de
|
|
end
|
|
end
|
|
end
|