s2_a3
parent
070d773d51
commit
ea7143df3f
|
@ -0,0 +1,63 @@
|
||||||
|
import re
|
||||||
|
import json
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
person_list = []
|
||||||
|
|
||||||
|
with open("Studienleistung2/Personen.txt") as input:
|
||||||
|
for lines in input:
|
||||||
|
current_line = lines.split(",")
|
||||||
|
|
||||||
|
titel = re.findall(r"([A-Z][a-z]+\.)", current_line[0])
|
||||||
|
|
||||||
|
name = re.findall(r"([A-Z][a-z]+[^\.]*$)", current_line[0])
|
||||||
|
name = re.split("\s", name[0])
|
||||||
|
|
||||||
|
# getting the fragments building the whole name
|
||||||
|
first_name = name[0]
|
||||||
|
|
||||||
|
# if there are more than one second names
|
||||||
|
second_name = ""
|
||||||
|
counter = 1
|
||||||
|
while counter<len(name)-1:
|
||||||
|
second_name = second_name + name[counter] + " "
|
||||||
|
counter += 1
|
||||||
|
|
||||||
|
# -1 to get the last elem of the list name
|
||||||
|
last_name = name[-1]
|
||||||
|
|
||||||
|
|
||||||
|
address = re.findall(r"(.+)([1-9]+).([\d]{5})(.+)", current_line[1])
|
||||||
|
address = address[0]
|
||||||
|
|
||||||
|
street_name = address[0]
|
||||||
|
house_number = address[1]
|
||||||
|
plz = address[2]
|
||||||
|
city = address[3]
|
||||||
|
|
||||||
|
geb_date = re.findall("([0-9][0-9]\.[0-9][0-9]\.[0-9][0-9][0-9][0-9])", current_line[2])
|
||||||
|
tel = re.findall("(\d{12,15})", current_line[3])
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
person = {
|
||||||
|
"titel": titel[0],
|
||||||
|
"Vorname": first_name,
|
||||||
|
"Zweitname": second_name,
|
||||||
|
"Nachname": last_name,
|
||||||
|
"Straße": street_name,
|
||||||
|
"Hausnummer": house_number,
|
||||||
|
"PLZ": plz,
|
||||||
|
"Stadt": city,
|
||||||
|
"Geb.Datum": geb_date[0],
|
||||||
|
"Tel.": tel[0],
|
||||||
|
}
|
||||||
|
|
||||||
|
person_list.append(person)
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
with open("Studienleistung2/Person_Neu.json", "w") as outfile:
|
||||||
|
json.dump(person_list, outfile, indent=2, ensure_ascii=False)
|
Loading…
Reference in New Issue