# pylokid/test_pdf_parsing.py
import re
import logging
from pprint import pprint
from pathlib import Path
from library.pdf_extract import PDFHandling
# Manual parsing check: run PDFHandling.extract_einsatzausdruck() on every PDF
# found below PATH and pretty-print whatever it returns.

# Root directory that is searched recursively for '*.pdf' files.
PATH = '/tmp/pylokid'

logging.basicConfig(
    level=logging.INFO,
    format='%(asctime)s - %(name)s - %(levelname)s - %(message)s'
)

PDF = PDFHandling()

# Captures an 'F' followed by eight digits that is directly followed by an
# underscore, anywhere in the path string (presumably the operation id encoded
# in the file name -- confirm against the naming scheme of the PDFs).
# Compiled once here instead of on every loop iteration.
F_ID_PATTERN = re.compile(r'.*(F[0-9]{8})_.*')

for path in Path(PATH).glob('**/*.pdf'):
    file = str(path)
    print(file)

    match = F_ID_PATTERN.search(file)
    if match is None:
        # Without this guard a single PDF whose path lacks the F-id token
        # aborted the whole run with AttributeError on None.group().
        logging.warning('No F-id found in %s, skipping', file)
        continue

    f_id = match.group(1)
    print(f_id)
    pprint(PDF.extract_einsatzausdruck(file, f_id))