initial commit
parent
7dc7034c0c
commit
d7dee3a5b7
@ -0,0 +1,23 @@
|
||||
from bs4 import BeautifulSoup
|
||||
|
||||
def make_soup(file):
    """Parse the XML file at ``file`` and return the resulting soup.

    The file is opened as UTF-8 text and handed to BeautifulSoup with the
    'xml' parser feature.

    Args:
        file: Path of the XML document to read.

    Returns:
        The BeautifulSoup object built from the file's contents.
    """
    with open(file, mode='r', encoding="utf-8") as handle:
        # BeautifulSoup consumes the handle in its constructor, so the tree
        # is fully built before the file is closed.
        return BeautifulSoup(handle, features='xml')
|
||||
|
||||
def get_places(file):
    """Print each identified div's ``n`` value and its production places.

    Every ``div`` element carrying an ``xml:id`` attribute is visited. Its
    ``n`` attribute is printed first, followed by the text of each
    ``placeName`` descendant whose ``type`` is ``production_place``.

    Args:
        file: Path of the XML document to read.

    Raises:
        KeyError: If a matched ``div`` has no ``n`` attribute.
    """
    document = make_soup(file)
    identified_divs = document.find_all('div', attrs={'xml:id': True})
    for section in identified_divs:
        print(section['n'])
        production_places = section.find_all(
            'placeName', attrs={'type': 'production_place'}
        )
        for place_tag in production_places:
            print(place_tag.get_text())
|
||||
|
||||
|
||||
def get_archives(file):
    """Print the text of every ``orgName`` element whose type is ``main``.

    Args:
        file: Path of the XML document to read.
    """
    document = make_soup(file)
    main_org_names = document.find_all('orgName', attrs={'type': 'main'})
    for org_tag in main_org_names:
        print(org_tag.get_text())
|
||||
|
||||
|
||||
|
||||
# Module-level run: print the main orgName entries of the XML file below.
_INPUT_XML = "../bourbon-latex/charles-actes-latex.xml"
get_archives(_INPUT_XML)
|
||||
Loading…
Reference in New Issue