From 444f62256f9f7101b8f5c9f8a1459ba04b6b9052 Mon Sep 17 00:00:00 2001 From: jgenero Date: Thu, 28 Sep 2023 18:57:31 +0200 Subject: [PATCH] fix bug with transcribers XPath in src/actesdataset.py --- actes-princiers/src/actesdataset.py | 13 ++++++++----- 1 file changed, 8 insertions(+), 5 deletions(-) diff --git a/actes-princiers/src/actesdataset.py b/actes-princiers/src/actesdataset.py index e399347..5fb9f6d 100644 --- a/actes-princiers/src/actesdataset.py +++ b/actes-princiers/src/actesdataset.py @@ -86,14 +86,17 @@ class BsXMLDataSet(XMLDataSet): def find_transcribers(self): "find transcriber xml bs4 helper" - transcribers = self.soup.find_all('respStmt') + transcribers = self.soup.find_all('teiHeader') trs = [] - for pers in transcribers: - trs_name = pers.find('name') - if trs_name: - trs.append(trs_name.get_text()) + for header in transcribers: + respStmt = header.find('fileDesc').find('titleStmt').find('respStmt') + if respStmt: + trs_name = respStmt.find('name') + if trs_name: + trs.append(trs_name.get_text()) return trs + def find_prince_name(self): """find prince_name xml bs4 helper