"""Print place and archive names found in an XML document."""

from bs4 import BeautifulSoup


def make_soup(file):
    """Parse the XML document at ``file`` and return the parsed tree.

    Args:
        file: Path of the XML file; it is opened as UTF-8 text.

    Returns:
        The ``BeautifulSoup`` object built with the ``xml`` parser.
    """
    with open(file, 'r', encoding="utf-8") as handle:
        return BeautifulSoup(handle, 'xml')


def get_places(file):
    """Print the ``n`` attribute and production places of each identified div.

    Only ``div`` elements that carry an ``xml:id`` attribute are visited. For
    each one, the value of its ``n`` attribute is printed, followed by the
    text of every nested ``placeName`` whose ``type`` is ``production_place``.

    Args:
        file: Path of the XML file to read.

    Raises:
        KeyError: If a matched ``div`` has no ``n`` attribute.
    """
    soup = make_soup(file)
    for div in soup.find_all('div', {'xml:id': True}):
        print(div['n'])
        for place in div.find_all('placeName', {'type': 'production_place'}):
            print(place.text)


def get_archives(file):
    """Print the text of every ``orgName`` element whose ``type`` is ``main``.

    Args:
        file: Path of the XML file to read.
    """
    soup = make_soup(file)
    for org in soup.find_all('orgName', {'type': 'main'}):
        print(org.text)


if __name__ == "__main__":
    # Guarded so that importing this module does not parse a file through a
    # working-directory-relative path and print as a side effect; running the
    # file as a script behaves as before.
    get_archives("../bourbon-latex/charles-actes-latex.xml")