Skip to content

Instantly share code, notes, and snippets.

@hasechris
Created February 2, 2025 18:44
Show Gist options
  • Save hasechris/fc0e36f424840cf6a152e55d601ae352 to your computer and use it in GitHub Desktop.
Save hasechris/fc0e36f424840cf6a152e55d601ae352 to your computer and use it in GitHub Desktop.
ruleset file for Alman Document scanning
---
# Applies to every document (match is unconditionally true) and rebuilds the
# title as <created date>_<document type>_<correspondent>, with spaces in the
# correspondent replaced by underscores.
set_title:
  match: true
  metadata_postprocessing:
    title: "{{created_year}}-{{created_month}}-{{created_day}}_{{document_type}}_{{correspondent|replace(' ', '_')}}"
...
---
# Card-terminal receipts: fires for 'Einzelrechnung' documents whose content
# contains 'Terminal-ID', 'Pos-Info' and 'Genehmigungs-Nr.', and stores the
# receipt date in the 'bezahlt' custom field.
custom_field_bezahlt_pos_terminal_form1:
  # Plain boolean conjunction: renders 'True' only when all four tests hold.
  match: "{{ document_type == 'Einzelrechnung' and 'Terminal-ID' in content and 'Pos-Info' in content and 'Genehmigungs-Nr.' in content }}"
  # Captures DD, MM and YYYY after 'Datum:' and requires 'Uhrzeit:' and
  # 'Beleg-Nr' somewhere later in the text.
  # NOTE(review): the final '.' in 'Beleg-Nr.' is unescaped, so it matches any
  # character - confirm whether that leniency is intended.
  metadata_regex: '(?i)(Datum:)[ ]?(?P<receipt_day>\d{2})[ ]?(\.|,)[ ]?(?P<receipt_month>\d{2})[ ]?(\.|,)[ ]?(?P<receipt_year>\d{4})[\s\S]*(Uhrzeit:)[\s\S]*(Beleg-Nr.)'
  metadata_postprocessing:
    custom_fields:
      # Assembled as YYYY-MM-DD from the captured groups.
      # NOTE(review): unlike the stamp rules in this file there is no
      # 'is defined' guard - confirm what happens when the regex fails.
      bezahlt: "{{ receipt_year + '-' + receipt_month + '-' + receipt_day }}"
...
---
# Fires for non-'Lohnabrechnung' documents whose content contains both
# 'EINGANG' and 'JAN'; stores the stamped day/year as a January date.
custom_field_eingang_jan:
  match: "{{ document_type != 'Lohnabrechnung' and 'EINGANG' in content and 'JAN' in content }}"
  # Keyword letters may be separated by single spaces; the month token is
  # captured but unused because the month number is hard-coded below.
  metadata_regex: '(?i)(E[ ]?I[ ]?N[ ]?G[ ]?A[ ]?N[ ]?G)[ ]?(?P<received_day>\d{2})[ ]?(\.|,|)[ ]?(?P<received_month>\w{3})[ ]?(\.|,|)[ ]?(?P<received_year>\d{4})'
  metadata_postprocessing:
    custom_fields:
      # Placeholder date (same YYYY-MM-DD order) when year or day is undefined.
      eingang: "{{ received_year + '-01-' + received_day if received_year is defined and received_day is defined else '1950-01-01' }}"
...
---
# Fires for non-'Lohnabrechnung' documents whose content contains both
# 'EINGANG' and 'FEB'; stores the stamped day/year as a February date.
custom_field_eingang_feb:
  match: "{{ document_type != 'Lohnabrechnung' and 'EINGANG' in content and 'FEB' in content }}"
  # Keyword letters may be separated by single spaces; the month token is
  # captured but unused because the month number is hard-coded below.
  metadata_regex: '(?i)(E[ ]?I[ ]?N[ ]?G[ ]?A[ ]?N[ ]?G)[ ]?(?P<received_day>\d{2})[ ]?(\.|,|)[ ]?(?P<received_month>\w{3})[ ]?(\.|,|)[ ]?(?P<received_year>\d{4})'
  metadata_postprocessing:
    custom_fields:
      # Placeholder date (same YYYY-MM-DD order) when year or day is undefined.
      eingang: "{{ received_year + '-02-' + received_day if received_year is defined and received_day is defined else '1950-01-01' }}"
...
---
# Fires for non-'Lohnabrechnung' documents whose content contains both
# 'EINGANG' and 'MRZ'; stores the stamped day/year as a March date.
custom_field_eingang_mrz:
  match: "{{ document_type != 'Lohnabrechnung' and 'EINGANG' in content and 'MRZ' in content }}"
  # Keyword letters may be separated by single spaces; the month token is
  # captured but unused because the month number is hard-coded below.
  metadata_regex: '(?i)(E[ ]?I[ ]?N[ ]?G[ ]?A[ ]?N[ ]?G)[ ]?(?P<received_day>\d{2})[ ]?(\.|,|)[ ]?(?P<received_month>\w{3})[ ]?(\.|,|)[ ]?(?P<received_year>\d{4})'
  metadata_postprocessing:
    custom_fields:
      # Placeholder date (same YYYY-MM-DD order) when year or day is undefined.
      eingang: "{{ received_year + '-03-' + received_day if received_year is defined and received_day is defined else '1950-01-01' }}"
...
---
# Fires for non-'Lohnabrechnung' documents whose content contains both
# 'EINGANG' and 'APR'; stores the stamped day/year as an April date.
custom_field_eingang_apr:
  match: "{{ document_type != 'Lohnabrechnung' and 'EINGANG' in content and 'APR' in content }}"
  # Keyword letters may be separated by single spaces; the month token is
  # captured but unused because the month number is hard-coded below.
  metadata_regex: '(?i)(E[ ]?I[ ]?N[ ]?G[ ]?A[ ]?N[ ]?G)[ ]?(?P<received_day>\d{2})[ ]?(\.|,|)[ ]?(?P<received_month>\w{3})[ ]?(\.|,|)[ ]?(?P<received_year>\d{4})'
  metadata_postprocessing:
    custom_fields:
      # Placeholder date (same YYYY-MM-DD order) when year or day is undefined.
      eingang: "{{ received_year + '-04-' + received_day if received_year is defined and received_day is defined else '1950-01-01' }}"
...
---
# Fires for non-'Lohnabrechnung' documents whose content contains both
# 'EINGANG' and 'MAI'; stores the stamped day/year as a May date.
custom_field_eingang_mai:
  match: "{{ document_type != 'Lohnabrechnung' and 'EINGANG' in content and 'MAI' in content }}"
  # Keyword letters may be separated by single spaces; the month token is
  # captured but unused because the month number is hard-coded below.
  metadata_regex: '(?i)(E[ ]?I[ ]?N[ ]?G[ ]?A[ ]?N[ ]?G)[ ]?(?P<received_day>\d{2})[ ]?(\.|,|)[ ]?(?P<received_month>\w{3})[ ]?(\.|,|)[ ]?(?P<received_year>\d{4})'
  metadata_postprocessing:
    custom_fields:
      # Placeholder date (same YYYY-MM-DD order) when year or day is undefined.
      eingang: "{{ received_year + '-05-' + received_day if received_year is defined and received_day is defined else '1950-01-01' }}"
...
---
# Fires for non-'Lohnabrechnung' documents whose content contains both
# 'EINGANG' and 'JUNI'; stores the stamped day/year as a June date.
custom_field_eingang_juni:
  match: "{{ document_type != 'Lohnabrechnung' and 'EINGANG' in content and 'JUNI' in content }}"
  # Keyword letters may be separated by single spaces. The month token accepts
  # 3-4 word characters so the four-letter 'JUNI' fits between day and year;
  # it is captured but unused because the month number is hard-coded below.
  metadata_regex: '(?i)(E[ ]?I[ ]?N[ ]?G[ ]?A[ ]?N[ ]?G)[ ]?(?P<received_day>\d{2})[ ]?(\.|,|)[ ]?(?P<received_month>\w{3,4})[ ]?(\.|,|)[ ]?(?P<received_year>\d{4})'
  metadata_postprocessing:
    custom_fields:
      # Placeholder date (same YYYY-MM-DD order) when year or day is undefined.
      eingang: "{{ received_year + '-06-' + received_day if received_year is defined and received_day is defined else '1950-01-01' }}"
...
---
# Fires for non-'Lohnabrechnung' documents whose content contains both
# 'EINGANG' and 'JULI'; stores the stamped day/year as a July date.
custom_field_eingang_juli:
  match: "{{ document_type != 'Lohnabrechnung' and 'EINGANG' in content and 'JULI' in content }}"
  # Keyword letters may be separated by single spaces. The month token accepts
  # 3-4 word characters so the four-letter 'JULI' fits between day and year;
  # it is captured but unused because the month number is hard-coded below.
  metadata_regex: '(?i)(E[ ]?I[ ]?N[ ]?G[ ]?A[ ]?N[ ]?G)[ ]?(?P<received_day>\d{2})[ ]?(\.|,|)[ ]?(?P<received_month>\w{3,4})[ ]?(\.|,|)[ ]?(?P<received_year>\d{4})'
  metadata_postprocessing:
    custom_fields:
      # Placeholder date (same YYYY-MM-DD order) when year or day is undefined.
      eingang: "{{ received_year + '-07-' + received_day if received_year is defined and received_day is defined else '1950-01-01' }}"
...
---
# Fires for non-'Lohnabrechnung' documents whose content contains both
# 'EINGANG' and 'AUG'; stores the stamped day/year as an August date.
custom_field_eingang_aug:
  match: "{{ document_type != 'Lohnabrechnung' and 'EINGANG' in content and 'AUG' in content }}"
  # Keyword letters may be separated by single spaces; the month token is
  # captured but unused because the month number is hard-coded below.
  metadata_regex: '(?i)(E[ ]?I[ ]?N[ ]?G[ ]?A[ ]?N[ ]?G)[ ]?(?P<received_day>\d{2})[ ]?(\.|,|)[ ]?(?P<received_month>\w{3})[ ]?(\.|,|)[ ]?(?P<received_year>\d{4})'
  metadata_postprocessing:
    custom_fields:
      # Placeholder date (same YYYY-MM-DD order) when year or day is undefined.
      eingang: "{{ received_year + '-08-' + received_day if received_year is defined and received_day is defined else '1950-01-01' }}"
...
---
# Fires for non-'Lohnabrechnung' documents whose content contains both
# 'EINGANG' and 'SEP'; stores the stamped day/year as a September date.
custom_field_eingang_sep:
  match: "{{ document_type != 'Lohnabrechnung' and 'EINGANG' in content and 'SEP' in content }}"
  # Keyword letters may be separated by single spaces; the month token is
  # captured but unused because the month number is hard-coded below.
  metadata_regex: '(?i)(E[ ]?I[ ]?N[ ]?G[ ]?A[ ]?N[ ]?G)[ ]?(?P<received_day>\d{2})[ ]?(\.|,|)[ ]?(?P<received_month>\w{3})[ ]?(\.|,|)[ ]?(?P<received_year>\d{4})'
  metadata_postprocessing:
    custom_fields:
      # Placeholder date (same YYYY-MM-DD order) when year or day is undefined.
      eingang: "{{ received_year + '-09-' + received_day if received_year is defined and received_day is defined else '1950-01-01' }}"
...
---
# Fires for non-'Lohnabrechnung' documents whose content contains both
# 'EINGANG' and 'OKT'; stores the stamped day/year as an October date.
custom_field_eingang_okt:
  match: "{{ document_type != 'Lohnabrechnung' and 'EINGANG' in content and 'OKT' in content }}"
  # Keyword letters may be separated by single spaces; the month token is
  # captured but unused because the month number is hard-coded below.
  metadata_regex: '(?i)(E[ ]?I[ ]?N[ ]?G[ ]?A[ ]?N[ ]?G)[ ]?(?P<received_day>\d{2})[ ]?(\.|,|)[ ]?(?P<received_month>\w{3})[ ]?(\.|,|)[ ]?(?P<received_year>\d{4})'
  metadata_postprocessing:
    custom_fields:
      # Placeholder date (same YYYY-MM-DD order) when year or day is undefined.
      eingang: "{{ received_year + '-10-' + received_day if received_year is defined and received_day is defined else '1950-01-01' }}"
...
---
# Fires for non-'Lohnabrechnung' documents whose content contains both
# 'EINGANG' and 'NOV'; stores the stamped day/year as a November date.
custom_field_eingang_nov:
  match: "{{ document_type != 'Lohnabrechnung' and 'EINGANG' in content and 'NOV' in content }}"
  # Keyword letters may be separated by single spaces; the month token is
  # captured but unused because the month number is hard-coded below.
  metadata_regex: '(?i)(E[ ]?I[ ]?N[ ]?G[ ]?A[ ]?N[ ]?G)[ ]?(?P<received_day>\d{2})[ ]?(\.|,|)[ ]?(?P<received_month>\w{3})[ ]?(\.|,|)[ ]?(?P<received_year>\d{4})'
  metadata_postprocessing:
    custom_fields:
      # Placeholder date (same YYYY-MM-DD order) when year or day is undefined.
      eingang: "{{ received_year + '-11-' + received_day if received_year is defined and received_day is defined else '1950-01-01' }}"
...
---
# Fires for non-'Lohnabrechnung' documents whose content contains both
# 'EINGANG' and 'DEZ'; stores the stamped day/year as a December date.
custom_field_eingang_dez:
  match: "{{ document_type != 'Lohnabrechnung' and 'EINGANG' in content and 'DEZ' in content }}"
  # Keyword letters may be separated by single spaces; the month token is
  # captured but unused because the month number is hard-coded below.
  metadata_regex: '(?i)(E[ ]?I[ ]?N[ ]?G[ ]?A[ ]?N[ ]?G)[ ]?(?P<received_day>\d{2})[ ]?(\.|,|)[ ]?(?P<received_month>\w{3})[ ]?(\.|,|)[ ]?(?P<received_year>\d{4})'
  metadata_postprocessing:
    custom_fields:
      # Placeholder date (same YYYY-MM-DD order) when year or day is undefined.
      eingang: "{{ received_year + '-12-' + received_day if received_year is defined and received_day is defined else '1950-01-01' }}"
...
---
# Fires for non-'Lohnabrechnung' documents whose content contains both
# 'BEZAHLT' and 'JAN'; stores the stamped day/year as a January date.
custom_field_bezahlt_jan:
  match: "{{ document_type != 'Lohnabrechnung' and 'BEZAHLT' in content and 'JAN' in content }}"
  # Keyword letters may be separated by single spaces; the month token is
  # captured but unused because the month number is hard-coded below.
  metadata_regex: '(?i)(B[ ]?E[ ]?Z[ ]?A[ ]?H[ ]?L[ ]?T)[ ]?(?P<bezahlt_day>\d{2})[ ]?(\.|,|)[ ]?(?P<bezahlt_month>\w{3})[ ]?(\.|,|)[ ]?(?P<bezahlt_year>\d{4})'
  metadata_postprocessing:
    custom_fields:
      # Placeholder date (same YYYY-MM-DD order) when year or day is undefined.
      bezahlt: "{{ bezahlt_year + '-01-' + bezahlt_day if bezahlt_year is defined and bezahlt_day is defined else '1950-01-01' }}"
...
---
# Fires for non-'Lohnabrechnung' documents whose content contains both
# 'BEZAHLT' and 'FEB'; stores the stamped day/year as a February date.
custom_field_bezahlt_feb:
  match: "{{ document_type != 'Lohnabrechnung' and 'BEZAHLT' in content and 'FEB' in content }}"
  # Keyword letters may be separated by single spaces; the month token is
  # captured but unused because the month number is hard-coded below.
  metadata_regex: '(?i)(B[ ]?E[ ]?Z[ ]?A[ ]?H[ ]?L[ ]?T)[ ]?(?P<bezahlt_day>\d{2})[ ]?(\.|,|)[ ]?(?P<bezahlt_month>\w{3})[ ]?(\.|,|)[ ]?(?P<bezahlt_year>\d{4})'
  metadata_postprocessing:
    custom_fields:
      # Placeholder date (same YYYY-MM-DD order) when year or day is undefined.
      bezahlt: "{{ bezahlt_year + '-02-' + bezahlt_day if bezahlt_year is defined and bezahlt_day is defined else '1950-01-01' }}"
...
---
# Fires for non-'Lohnabrechnung' documents whose content contains both
# 'BEZAHLT' and 'MRZ'; stores the stamped day/year as a March date.
custom_field_bezahlt_mrz:
  match: "{{ document_type != 'Lohnabrechnung' and 'BEZAHLT' in content and 'MRZ' in content }}"
  # Keyword letters may be separated by single spaces; the month token is
  # captured but unused because the month number is hard-coded below.
  metadata_regex: '(?i)(B[ ]?E[ ]?Z[ ]?A[ ]?H[ ]?L[ ]?T)[ ]?(?P<bezahlt_day>\d{2})[ ]?(\.|,|)[ ]?(?P<bezahlt_month>\w{3})[ ]?(\.|,|)[ ]?(?P<bezahlt_year>\d{4})'
  metadata_postprocessing:
    custom_fields:
      # Placeholder date (same YYYY-MM-DD order) when year or day is undefined.
      bezahlt: "{{ bezahlt_year + '-03-' + bezahlt_day if bezahlt_year is defined and bezahlt_day is defined else '1950-01-01' }}"
...
---
# Fires for non-'Lohnabrechnung' documents whose content contains both
# 'BEZAHLT' and 'APR'; stores the stamped day/year as an April date.
custom_field_bezahlt_apr:
  match: "{{ document_type != 'Lohnabrechnung' and 'BEZAHLT' in content and 'APR' in content }}"
  # Keyword letters may be separated by single spaces; the month token is
  # captured but unused because the month number is hard-coded below.
  metadata_regex: '(?i)(B[ ]?E[ ]?Z[ ]?A[ ]?H[ ]?L[ ]?T)[ ]?(?P<bezahlt_day>\d{2})[ ]?(\.|,|)[ ]?(?P<bezahlt_month>\w{3})[ ]?(\.|,|)[ ]?(?P<bezahlt_year>\d{4})'
  metadata_postprocessing:
    custom_fields:
      # Placeholder date (same YYYY-MM-DD order) when year or day is undefined.
      bezahlt: "{{ bezahlt_year + '-04-' + bezahlt_day if bezahlt_year is defined and bezahlt_day is defined else '1950-01-01' }}"
...
---
# Fires for non-'Lohnabrechnung' documents whose content contains both
# 'BEZAHLT' and 'MAI'; stores the stamped day/year as a May date.
custom_field_bezahlt_mai:
  match: "{{ document_type != 'Lohnabrechnung' and 'BEZAHLT' in content and 'MAI' in content }}"
  # Keyword letters may be separated by single spaces; the month token is
  # captured but unused because the month number is hard-coded below.
  metadata_regex: '(?i)(B[ ]?E[ ]?Z[ ]?A[ ]?H[ ]?L[ ]?T)[ ]?(?P<bezahlt_day>\d{2})[ ]?(\.|,|)[ ]?(?P<bezahlt_month>\w{3})[ ]?(\.|,|)[ ]?(?P<bezahlt_year>\d{4})'
  metadata_postprocessing:
    custom_fields:
      # Placeholder date (same YYYY-MM-DD order) when year or day is undefined.
      bezahlt: "{{ bezahlt_year + '-05-' + bezahlt_day if bezahlt_year is defined and bezahlt_day is defined else '1950-01-01' }}"
...
---
# Fires for non-'Lohnabrechnung' documents whose content contains both
# 'BEZAHLT' and 'JUNI'; stores the stamped day/year as a June date.
custom_field_bezahlt_juni:
  match: "{{ document_type != 'Lohnabrechnung' and 'BEZAHLT' in content and 'JUNI' in content }}"
  # Keyword letters may be separated by single spaces. The month token accepts
  # 3-4 word characters so the four-letter 'JUNI' fits between day and year;
  # it is captured but unused because the month number is hard-coded below.
  metadata_regex: '(?i)(B[ ]?E[ ]?Z[ ]?A[ ]?H[ ]?L[ ]?T)[ ]?(?P<bezahlt_day>\d{2})[ ]?(\.|,|)[ ]?(?P<bezahlt_month>\w{3,4})[ ]?(\.|,|)[ ]?(?P<bezahlt_year>\d{4})'
  metadata_postprocessing:
    custom_fields:
      # Placeholder date (same YYYY-MM-DD order) when year or day is undefined.
      bezahlt: "{{ bezahlt_year + '-06-' + bezahlt_day if bezahlt_year is defined and bezahlt_day is defined else '1950-01-01' }}"
...
---
# Fires for non-'Lohnabrechnung' documents whose content contains both
# 'BEZAHLT' and 'JULI'; stores the stamped day/year as a July date.
custom_field_bezahlt_juli:
  match: "{{ document_type != 'Lohnabrechnung' and 'BEZAHLT' in content and 'JULI' in content }}"
  # Keyword letters may be separated by single spaces. The month token accepts
  # 3-4 word characters so the four-letter 'JULI' fits between day and year;
  # it is captured but unused because the month number is hard-coded below.
  metadata_regex: '(?i)(B[ ]?E[ ]?Z[ ]?A[ ]?H[ ]?L[ ]?T)[ ]?(?P<bezahlt_day>\d{2})[ ]?(\.|,|)[ ]?(?P<bezahlt_month>\w{3,4})[ ]?(\.|,|)[ ]?(?P<bezahlt_year>\d{4})'
  metadata_postprocessing:
    custom_fields:
      # Placeholder date (same YYYY-MM-DD order) when year or day is undefined.
      bezahlt: "{{ bezahlt_year + '-07-' + bezahlt_day if bezahlt_year is defined and bezahlt_day is defined else '1950-01-01' }}"
...
---
# Fires for non-'Lohnabrechnung' documents whose content contains both
# 'BEZAHLT' and 'AUG'; stores the stamped day/year as an August date.
custom_field_bezahlt_aug:
  match: "{{ document_type != 'Lohnabrechnung' and 'BEZAHLT' in content and 'AUG' in content }}"
  # Keyword letters may be separated by single spaces; the month token is
  # captured but unused because the month number is hard-coded below.
  metadata_regex: '(?i)(B[ ]?E[ ]?Z[ ]?A[ ]?H[ ]?L[ ]?T)[ ]?(?P<bezahlt_day>\d{2})[ ]?(\.|,|)[ ]?(?P<bezahlt_month>\w{3})[ ]?(\.|,|)[ ]?(?P<bezahlt_year>\d{4})'
  metadata_postprocessing:
    custom_fields:
      # Placeholder date (same YYYY-MM-DD order) when year or day is undefined.
      bezahlt: "{{ bezahlt_year + '-08-' + bezahlt_day if bezahlt_year is defined and bezahlt_day is defined else '1950-01-01' }}"
...
---
# Fires for non-'Lohnabrechnung' documents whose content contains both
# 'BEZAHLT' and 'SEP'; stores the stamped day/year as a September date.
custom_field_bezahlt_sep:
  match: "{{ document_type != 'Lohnabrechnung' and 'BEZAHLT' in content and 'SEP' in content }}"
  # Keyword letters may be separated by single spaces; the month token is
  # captured but unused because the month number is hard-coded below.
  metadata_regex: '(?i)(B[ ]?E[ ]?Z[ ]?A[ ]?H[ ]?L[ ]?T)[ ]?(?P<bezahlt_day>\d{2})[ ]?(\.|,|)[ ]?(?P<bezahlt_month>\w{3})[ ]?(\.|,|)[ ]?(?P<bezahlt_year>\d{4})'
  metadata_postprocessing:
    custom_fields:
      # Placeholder date (same YYYY-MM-DD order) when year or day is undefined.
      bezahlt: "{{ bezahlt_year + '-09-' + bezahlt_day if bezahlt_year is defined and bezahlt_day is defined else '1950-01-01' }}"
...
---
# Fires for non-'Lohnabrechnung' documents whose content contains both
# 'BEZAHLT' and 'OKT'; stores the stamped day/year as an October date.
custom_field_bezahlt_okt:
  match: "{{ document_type != 'Lohnabrechnung' and 'BEZAHLT' in content and 'OKT' in content }}"
  # Keyword letters may be separated by single spaces; the month token is
  # captured but unused because the month number is hard-coded below.
  metadata_regex: '(?i)(B[ ]?E[ ]?Z[ ]?A[ ]?H[ ]?L[ ]?T)[ ]?(?P<bezahlt_day>\d{2})[ ]?(\.|,|)[ ]?(?P<bezahlt_month>\w{3})[ ]?(\.|,|)[ ]?(?P<bezahlt_year>\d{4})'
  metadata_postprocessing:
    custom_fields:
      # Placeholder date (same YYYY-MM-DD order) when year or day is undefined.
      bezahlt: "{{ bezahlt_year + '-10-' + bezahlt_day if bezahlt_year is defined and bezahlt_day is defined else '1950-01-01' }}"
...
---
# Fires for non-'Lohnabrechnung' documents whose content contains both
# 'BEZAHLT' and 'NOV'; stores the stamped day/year as a November date.
custom_field_bezahlt_nov:
  match: "{{ document_type != 'Lohnabrechnung' and 'BEZAHLT' in content and 'NOV' in content }}"
  # Keyword letters may be separated by single spaces; the month token is
  # captured but unused because the month number is hard-coded below.
  metadata_regex: '(?i)(B[ ]?E[ ]?Z[ ]?A[ ]?H[ ]?L[ ]?T)[ ]?(?P<bezahlt_day>\d{2})[ ]?(\.|,|)[ ]?(?P<bezahlt_month>\w{3})[ ]?(\.|,|)[ ]?(?P<bezahlt_year>\d{4})'
  metadata_postprocessing:
    custom_fields:
      # Placeholder date (same YYYY-MM-DD order) when year or day is undefined.
      bezahlt: "{{ bezahlt_year + '-11-' + bezahlt_day if bezahlt_year is defined and bezahlt_day is defined else '1950-01-01' }}"
...
---
# Fires for non-'Lohnabrechnung' documents whose content contains both
# 'BEZAHLT' and 'DEZ'; stores the stamped day/year as a December date.
custom_field_bezahlt_dez:
  match: "{{ document_type != 'Lohnabrechnung' and 'BEZAHLT' in content and 'DEZ' in content }}"
  # Keyword letters may be separated by single spaces; the month token is
  # captured but unused because the month number is hard-coded below.
  metadata_regex: '(?i)(B[ ]?E[ ]?Z[ ]?A[ ]?H[ ]?L[ ]?T)[ ]?(?P<bezahlt_day>\d{2})[ ]?(\.|,|)[ ]?(?P<bezahlt_month>\w{3})[ ]?(\.|,|)[ ]?(?P<bezahlt_year>\d{4})'
  metadata_postprocessing:
    custom_fields:
      # Placeholder date (same YYYY-MM-DD order) when year or day is undefined.
      bezahlt: "{{ bezahlt_year + '-12-' + bezahlt_day if bezahlt_year is defined and bezahlt_day is defined else '1950-01-01' }}"
...
---
# Fires for non-'Lohnabrechnung' documents whose content contains both
# 'ERLEDIGT' and 'JAN'; stores the stamped day/year as a January date.
custom_field_erledigt_jan:
  match: "{{ document_type != 'Lohnabrechnung' and 'ERLEDIGT' in content and 'JAN' in content }}"
  # Keyword letters may be separated by single spaces; the month token is
  # captured but unused because the month number is hard-coded below.
  metadata_regex: '(?i)(E[ ]?R[ ]?L[ ]?E[ ]?D[ ]?I[ ]?G[ ]?T)[ ]?(?P<erledigt_day>\d{2})[ ]?(\.|,|)[ ]?(?P<erledigt_month>\w{3})[ ]?(\.|,|)[ ]?(?P<erledigt_year>\d{4})'
  metadata_postprocessing:
    custom_fields:
      # Placeholder date (same YYYY-MM-DD order) when year or day is undefined.
      erledigt: "{{ erledigt_year + '-01-' + erledigt_day if erledigt_year is defined and erledigt_day is defined else '1950-01-01' }}"
...
---
# Fires for non-'Lohnabrechnung' documents whose content contains both
# 'ERLEDIGT' and 'FEB'; stores the stamped day/year as a February date.
custom_field_erledigt_feb:
  match: "{{ document_type != 'Lohnabrechnung' and 'ERLEDIGT' in content and 'FEB' in content }}"
  # Keyword letters may be separated by single spaces; the month token is
  # captured but unused because the month number is hard-coded below.
  metadata_regex: '(?i)(E[ ]?R[ ]?L[ ]?E[ ]?D[ ]?I[ ]?G[ ]?T)[ ]?(?P<erledigt_day>\d{2})[ ]?(\.|,|)[ ]?(?P<erledigt_month>\w{3})[ ]?(\.|,|)[ ]?(?P<erledigt_year>\d{4})'
  metadata_postprocessing:
    custom_fields:
      # Placeholder date (same YYYY-MM-DD order) when year or day is undefined.
      erledigt: "{{ erledigt_year + '-02-' + erledigt_day if erledigt_year is defined and erledigt_day is defined else '1950-01-01' }}"
...
---
# Fires for non-'Lohnabrechnung' documents whose content contains both
# 'ERLEDIGT' and 'MRZ'; stores the stamped day/year as a March date.
custom_field_erledigt_mrz:
  match: "{{ document_type != 'Lohnabrechnung' and 'ERLEDIGT' in content and 'MRZ' in content }}"
  # Keyword letters may be separated by single spaces; the month token is
  # captured but unused because the month number is hard-coded below.
  metadata_regex: '(?i)(E[ ]?R[ ]?L[ ]?E[ ]?D[ ]?I[ ]?G[ ]?T)[ ]?(?P<erledigt_day>\d{2})[ ]?(\.|,|)[ ]?(?P<erledigt_month>\w{3})[ ]?(\.|,|)[ ]?(?P<erledigt_year>\d{4})'
  metadata_postprocessing:
    custom_fields:
      # Placeholder date (same YYYY-MM-DD order) when year or day is undefined.
      erledigt: "{{ erledigt_year + '-03-' + erledigt_day if erledigt_year is defined and erledigt_day is defined else '1950-01-01' }}"
...
---
# Fires for non-'Lohnabrechnung' documents whose content contains both
# 'ERLEDIGT' and 'APR'; stores the stamped day/year as an April date.
custom_field_erledigt_apr:
  match: "{{ document_type != 'Lohnabrechnung' and 'ERLEDIGT' in content and 'APR' in content }}"
  # Keyword letters may be separated by single spaces; the month token is
  # captured but unused because the month number is hard-coded below.
  metadata_regex: '(?i)(E[ ]?R[ ]?L[ ]?E[ ]?D[ ]?I[ ]?G[ ]?T)[ ]?(?P<erledigt_day>\d{2})[ ]?(\.|,|)[ ]?(?P<erledigt_month>\w{3})[ ]?(\.|,|)[ ]?(?P<erledigt_year>\d{4})'
  metadata_postprocessing:
    custom_fields:
      # Placeholder date (same YYYY-MM-DD order) when year or day is undefined.
      erledigt: "{{ erledigt_year + '-04-' + erledigt_day if erledigt_year is defined and erledigt_day is defined else '1950-01-01' }}"
...
---
# Fires for non-'Lohnabrechnung' documents whose content contains both
# 'ERLEDIGT' and 'MAI'; stores the stamped day/year as a May date.
custom_field_erledigt_mai:
  match: "{{ document_type != 'Lohnabrechnung' and 'ERLEDIGT' in content and 'MAI' in content }}"
  # Keyword letters may be separated by single spaces; the month token is
  # captured but unused because the month number is hard-coded below.
  metadata_regex: '(?i)(E[ ]?R[ ]?L[ ]?E[ ]?D[ ]?I[ ]?G[ ]?T)[ ]?(?P<erledigt_day>\d{2})[ ]?(\.|,|)[ ]?(?P<erledigt_month>\w{3})[ ]?(\.|,|)[ ]?(?P<erledigt_year>\d{4})'
  metadata_postprocessing:
    custom_fields:
      # Placeholder date (same YYYY-MM-DD order) when year or day is undefined.
      erledigt: "{{ erledigt_year + '-05-' + erledigt_day if erledigt_year is defined and erledigt_day is defined else '1950-01-01' }}"
...
---
# Fires for non-'Lohnabrechnung' documents whose content contains both
# 'ERLEDIGT' and 'JUNI'; stores the stamped day/year as a June date.
custom_field_erledigt_juni:
  match: "{{ document_type != 'Lohnabrechnung' and 'ERLEDIGT' in content and 'JUNI' in content }}"
  # Keyword letters may be separated by single spaces. The month token accepts
  # 3-4 word characters so the four-letter 'JUNI' fits between day and year;
  # it is captured but unused because the month number is hard-coded below.
  metadata_regex: '(?i)(E[ ]?R[ ]?L[ ]?E[ ]?D[ ]?I[ ]?G[ ]?T)[ ]?(?P<erledigt_day>\d{2})[ ]?(\.|,|)[ ]?(?P<erledigt_month>\w{3,4})[ ]?(\.|,|)[ ]?(?P<erledigt_year>\d{4})'
  metadata_postprocessing:
    custom_fields:
      # Placeholder date (same YYYY-MM-DD order) when year or day is undefined.
      erledigt: "{{ erledigt_year + '-06-' + erledigt_day if erledigt_year is defined and erledigt_day is defined else '1950-01-01' }}"
...
---
# Fires for non-'Lohnabrechnung' documents whose content contains both
# 'ERLEDIGT' and 'JULI'; stores the stamped day/year as a July date.
custom_field_erledigt_juli:
  match: "{{ document_type != 'Lohnabrechnung' and 'ERLEDIGT' in content and 'JULI' in content }}"
  # Keyword letters may be separated by single spaces. The month token accepts
  # 3-4 word characters so the four-letter 'JULI' fits between day and year;
  # it is captured but unused because the month number is hard-coded below.
  metadata_regex: '(?i)(E[ ]?R[ ]?L[ ]?E[ ]?D[ ]?I[ ]?G[ ]?T)[ ]?(?P<erledigt_day>\d{2})[ ]?(\.|,|)[ ]?(?P<erledigt_month>\w{3,4})[ ]?(\.|,|)[ ]?(?P<erledigt_year>\d{4})'
  metadata_postprocessing:
    custom_fields:
      # Placeholder date (same YYYY-MM-DD order) when year or day is undefined.
      erledigt: "{{ erledigt_year + '-07-' + erledigt_day if erledigt_year is defined and erledigt_day is defined else '1950-01-01' }}"
...
---
# Fires for non-'Lohnabrechnung' documents whose content contains both
# 'ERLEDIGT' and 'AUG'; stores the stamped day/year as an August date.
custom_field_erledigt_aug:
  match: "{{ document_type != 'Lohnabrechnung' and 'ERLEDIGT' in content and 'AUG' in content }}"
  # Keyword letters may be separated by single spaces; the month token is
  # captured but unused because the month number is hard-coded below.
  metadata_regex: '(?i)(E[ ]?R[ ]?L[ ]?E[ ]?D[ ]?I[ ]?G[ ]?T)[ ]?(?P<erledigt_day>\d{2})[ ]?(\.|,|)[ ]?(?P<erledigt_month>\w{3})[ ]?(\.|,|)[ ]?(?P<erledigt_year>\d{4})'
  metadata_postprocessing:
    custom_fields:
      # Placeholder date (same YYYY-MM-DD order) when year or day is undefined.
      erledigt: "{{ erledigt_year + '-08-' + erledigt_day if erledigt_year is defined and erledigt_day is defined else '1950-01-01' }}"
...
---
# Fires for non-'Lohnabrechnung' documents whose content contains both
# 'ERLEDIGT' and 'SEP'; stores the stamped day/year as a September date.
custom_field_erledigt_sep:
  match: "{{ document_type != 'Lohnabrechnung' and 'ERLEDIGT' in content and 'SEP' in content }}"
  # Keyword letters may be separated by single spaces; the month token is
  # captured but unused because the month number is hard-coded below.
  metadata_regex: '(?i)(E[ ]?R[ ]?L[ ]?E[ ]?D[ ]?I[ ]?G[ ]?T)[ ]?(?P<erledigt_day>\d{2})[ ]?(\.|,|)[ ]?(?P<erledigt_month>\w{3})[ ]?(\.|,|)[ ]?(?P<erledigt_year>\d{4})'
  metadata_postprocessing:
    custom_fields:
      # Placeholder date (same YYYY-MM-DD order) when year or day is undefined.
      erledigt: "{{ erledigt_year + '-09-' + erledigt_day if erledigt_year is defined and erledigt_day is defined else '1950-01-01' }}"
...
---
# Fires for non-'Lohnabrechnung' documents whose content contains both
# 'ERLEDIGT' and 'OKT'; stores the stamped day/year as an October date.
custom_field_erledigt_okt:
  match: "{{ document_type != 'Lohnabrechnung' and 'ERLEDIGT' in content and 'OKT' in content }}"
  # Keyword letters may be separated by single spaces; the month token is
  # captured but unused because the month number is hard-coded below.
  metadata_regex: '(?i)(E[ ]?R[ ]?L[ ]?E[ ]?D[ ]?I[ ]?G[ ]?T)[ ]?(?P<erledigt_day>\d{2})[ ]?(\.|,|)[ ]?(?P<erledigt_month>\w{3})[ ]?(\.|,|)[ ]?(?P<erledigt_year>\d{4})'
  metadata_postprocessing:
    custom_fields:
      # Placeholder date (same YYYY-MM-DD order) when year or day is undefined.
      erledigt: "{{ erledigt_year + '-10-' + erledigt_day if erledigt_year is defined and erledigt_day is defined else '1950-01-01' }}"
...
---
# Fires for non-'Lohnabrechnung' documents whose content contains both
# 'ERLEDIGT' and 'NOV'; stores the stamped day/year as a November date.
custom_field_erledigt_nov:
  match: "{{ document_type != 'Lohnabrechnung' and 'ERLEDIGT' in content and 'NOV' in content }}"
  # Keyword letters may be separated by single spaces; the month token is
  # captured but unused because the month number is hard-coded below.
  metadata_regex: '(?i)(E[ ]?R[ ]?L[ ]?E[ ]?D[ ]?I[ ]?G[ ]?T)[ ]?(?P<erledigt_day>\d{2})[ ]?(\.|,|)[ ]?(?P<erledigt_month>\w{3})[ ]?(\.|,|)[ ]?(?P<erledigt_year>\d{4})'
  metadata_postprocessing:
    custom_fields:
      # Placeholder date (same YYYY-MM-DD order) when year or day is undefined.
      erledigt: "{{ erledigt_year + '-11-' + erledigt_day if erledigt_year is defined and erledigt_day is defined else '1950-01-01' }}"
...
---
# Fires for non-'Lohnabrechnung' documents whose content contains both
# 'ERLEDIGT' and 'DEZ'; stores the stamped day/year as a December date.
custom_field_erledigt_dez:
  match: "{{ document_type != 'Lohnabrechnung' and 'ERLEDIGT' in content and 'DEZ' in content }}"
  # Keyword letters may be separated by single spaces; the month token is
  # captured but unused because the month number is hard-coded below.
  metadata_regex: '(?i)(E[ ]?R[ ]?L[ ]?E[ ]?D[ ]?I[ ]?G[ ]?T)[ ]?(?P<erledigt_day>\d{2})[ ]?(\.|,|)[ ]?(?P<erledigt_month>\w{3})[ ]?(\.|,|)[ ]?(?P<erledigt_year>\d{4})'
  metadata_postprocessing:
    custom_fields:
      # Placeholder date (same YYYY-MM-DD order) when year or day is undefined.
      erledigt: "{{ erledigt_year + '-12-' + erledigt_day if erledigt_year is defined and erledigt_day is defined else '1950-01-01' }}"
...
@hasechris
Copy link
Author

Bildschirmfoto vom 2025-02-02 19-50-10

Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment