Code: Alles auswählen
#!/usr/bin/env python2.7
# encoding: utf-8
import codecs
import os
import glob
from collections import defaultdict
import json
import csv
# Directory whose direct children are scanned for report files.
REPORTS_PATH = "./reports/"

# Single-line fields: output key -> exact prefix a report line must start
# with. The value stored is the remainder of that same line, stripped.
TAGS = {
    "charge": u"Schmelzen-Nr./ Heat No. / No.de coule :",
    "actual": u"Ist / Actual / Actuel",
    "selon": u"Die Lieferung wurde US-geprüft nach / Delivery US-checked acc.to / Livraison contrôlé par ultrasons selon : ",
    "doformation": u"Umformgrad/ Hot forming ratio / Ratio de déformation :",
    "largeur": u"Durchm./Breite/ Diameter/width / Diamètre/largeur :",
}

# Two-line fields: output key -> exact prefix of a header line. The value
# stored is the whole line FOLLOWING the header, stripped.
TAGS_TWO_LINES = {
    "Eprouvette": u"Proben-Nr./Specimen-No./ No.d’eprouvette 1. Prfl. / Spec. / Eprouvette 2. Prfl. / Spec. / Eprouvette 3. Prfl. / Spec. / Eprouvette",
    "Probe": u"Rpo.2[MPa (N/mm²)] Rm[MPa (N/mm²)] A5[%] Z[%]",
}


def extract_report_data(report_lines):
    """Collect the tagged values found in one report.

    Args:
        report_lines: iterable of unicode text lines (an open text file or
            any other iterable of strings).

    Returns:
        A ``defaultdict(list)`` mapping each key of ``TAGS`` /
        ``TAGS_TWO_LINES`` that occurred at least once to the list of
        stripped values, in order of appearance. Keys that never matched
        are absent.
    """
    # A single shared iterator is required: two-line tags pull the value
    # line with next(), and the outer loop must then continue after it.
    line_iter = iter(report_lines)
    data = defaultdict(list)
    for line in line_iter:
        # .items() instead of .iteritems(): works on Python 2 and 3.
        for tag, identifier in TAGS.items():
            if line.startswith(identifier):
                data[tag].append(line[len(identifier):].strip())
        for tag, identifier in TAGS_TWO_LINES.items():
            if line.startswith(identifier):
                # Default of u"" keeps a header on the very last line from
                # raising StopIteration; an empty value is recorded instead.
                data[tag].append(next(line_iter, u"").strip())
    return data


# One entry (dict of extracted values) per processed report file.
lines = []
for report_filename in glob.iglob(os.path.join(REPORTS_PATH, '*')):
    # The '*' pattern also matches sub-directories, which cannot be opened
    # as text files; skip everything that is not a regular file.
    if not os.path.isfile(report_filename):
        continue
    print("\n----- FILE -----")
    print(report_filename + "\n")
    # errors='ignore' silently drops bytes that are not valid UTF-8.
    # The with-block guarantees the file handle is closed after parsing.
    with codecs.open(report_filename, mode='r', errors='ignore',
                     encoding='utf-8') as file_content:
        lines.append(extract_report_data(file_content))

print("\n\n----- JSON DATA -----\n")
print(json.dumps(lines))
print("\n")