diff options
author | Martin Fischer <martin@push-f.com> | 2021-03-03 16:38:37 +0100 |
---|---|---|
committer | Martin Fischer <martin@push-f.com> | 2021-03-03 16:41:28 +0100 |
commit | 30099b5d9b616b820341b70582f26685597cebe5 (patch) | |
tree | a86d86629b7bf260bf056e6e9c8c3e024aab0d04 /scrapers/at.py | |
parent | 294ec05490f639c08d69d010f769b8d60aa3650d (diff) |
differentiate between abbreviations and redirects
Diffstat (limited to 'scrapers/at.py')
-rwxr-xr-x | scrapers/at.py | 10 |
1 files changed, 10 insertions, 0 deletions
```diff
diff --git a/scrapers/at.py b/scrapers/at.py
index bc4d874..1af9894 100755
--- a/scrapers/at.py
+++ b/scrapers/at.py
@@ -50,6 +50,16 @@ for page in pages:
     )
     if 'Abkuerzung' in info:
         data['abbr'] = info['Abkuerzung'].strip()
+        data['redir'] = data['abbr'].lower()\
+            .replace(')', '')\
+            .replace('(', '')\
+            .replace(' – ', '-')\
+            .replace(' ', '-')\
+            .replace('\xa0', '-')\
+            .replace('ä', 'ae')\
+            .replace('ü', 'ue')\
+            .replace('ö', 'oe')\
+            .replace('ß', 'ss')
     normen[info['Gesetzesnummer']] = data
 
 with open('laws/at.json', 'w') as f:
```