website-risg/laws/euv.toml
philipp 02cc438704
All checks were successful
CI/CD Pipeline / deploy-main (push) Successful in 3m36s
cleaner config
2024-05-26 17:14:08 +02:00

61 lines
1.3 KiB
TOML

# Identification of the law and the heading levels used to structure it.
[law]
id = 10008048
name = "EUV"
# Marker string for paragraph headings in this law.
# NOTE(review): how the consumer matches this marker is not visible here — confirm.
par_sign = "ARTIKEL"
# Heading levels, listed as Titel, Kapitel, Abschnitt; only "Titel" is flagged as root.
classifiers = [
    { name = "Titel", is_root = true, match_function = "contains" },
    { name = "Kapitel", is_root = false, match_function = "contains" },
    { name = "Abschnitt", is_root = false, match_function = "contains" },
]
# Settings for the parser.
[parser]
# Markup fragments listed for removal, one per line in their original order.
# NOTE(review): presumably stripped from the raw text before parsing — confirm in the consumer.
remove_strings = [
    "<tab />",
    "<b>",
    "</b>",
    "<i>",
    "</i>",
    "<n>",
    "</n>",
    "<super>",
    "</super>",
    '<abstand ct="text" halign="l" />',
]
move_para_headers_into_content = true
# Find/replace pairs, kept in their original order.
# NOTE(review): the patterns contain unescaped "(" and "+", so they look like
# literal strings rather than regular expressions — confirm in the consumer.

# Swap the <gdash /> tag for a plain hyphen.
[[parser.replace_rules]]
find = "<gdash />"
replace_with = "-"

# Upper-case "Artikel" for articles 7, 38 and 42.
# NOTE(review): presumably so these headings match par_sign = "ARTIKEL" — confirm.
[[parser.replace_rules]]
find = "Artikel 7"
replace_with = "ARTIKEL 7"

[[parser.replace_rules]]
find = "Artikel 38"
replace_with = "ARTIKEL 38"

[[parser.replace_rules]]
find = "Artikel 42"
replace_with = "ARTIKEL 42"

# Drop the "+" that precedes "ARTIKEL 48".
[[parser.replace_rules]]
find = "+ARTIKEL 48"
replace_with = "ARTIKEL 48"

# Retag 'erltext' paragraphs as 'abs' where the paragraph text opens with "("
# (the 'erltext's which have subsections) ...
[[parser.replace_rules]]
find = '<absatz typ="erltext" ct="text" halign="j">('
replace_with = '<absatz typ="abs" ct="text" halign="j">('

# ... and retag those that directly follow a closing ueberschrift tag
# (the 'erltext's which have only one section).
[[parser.replace_rules]]
find = '/ueberschrift><absatz typ="erltext" ct="text" halign="j">'
replace_with = '/ueberschrift><absatz typ="abs" ct="text" halign="j">'