develop
gwen 3 years ago
parent 91beaf2772
commit c47620101c

@ -1,5 +1,4 @@
# ________________________________________________________________________ # ________________________________________________________________________
# reading raw bourbon dataset # reading raw bourbon dataset
bourbon: bourbon:
type: actesdataset.XMLDataSetCollection type: actesdataset.XMLDataSetCollection
@ -11,23 +10,6 @@ bourbon_content:
type: actesdataset.XMLDataSetCollection type: actesdataset.XMLDataSetCollection
housename: bourbon housename: bourbon
folderpath: data/02_intermediate/houses/bourbon folderpath: data/02_intermediate/houses/bourbon
# ________________________________________________________________________
actors:
type: pandas.CSVDataSet
filepath: data/01_raw/csv/actors.csv
load_args:
sep: ";"
corpus-agnes-bourgogne:
type: pandas.CSVDataSet
filepath: data/01_raw/csv/corpus-agnes-bourgogne.csv
load_args:
sep: ";"
corpus-charles-i:
type: pandas.CSVDataSet
filepath: data/01_raw/csv/corpus-charles-i.csv
load_args:
sep: ";"

@ -19,8 +19,6 @@ def parse_xml_collection(datasets, param):
# FIXME set signature # FIXME set signature
# datasets -> dict # datasets -> dict
# param -> str # param -> str
# logger.info("~~~~~~~~~~~~~~~~~~~~~~~~~~~~~")
# logger.info(str(bourbon))
output_datasets = dict() output_datasets = dict()
# datasets = bourbon.get_datasets() # datasets = bourbon.get_datasets()
for dataset_filenamestem, dataset in datasets.items(): for dataset_filenamestem, dataset in datasets.items():

@ -10,11 +10,6 @@ from kedro.io import AbstractDataSet, DataSetError
from kedro.framework.session import KedroSession from kedro.framework.session import KedroSession
logger = logging.getLogger(__name__) logger = logging.getLogger(__name__)
# FIXME : ça n'est plus utile
# we need the context here to have access to the config
with KedroSession.create() as session:
context = session.load_context()
class XMLDataSet: class XMLDataSet:
"lxml.etree._ElementTree loader" "lxml.etree._ElementTree loader"
@ -83,8 +78,6 @@ class XMLDataSetCollection(AbstractDataSet):
folderpath: str): folderpath: str):
self._housename = housename self._housename = housename
self._folderpath = Path(folderpath) self._folderpath = Path(folderpath)
# self.house_path = Path(context.get_houses()[self._housename]['path'])
# print(self.house_path)
def get_datasets(self): def get_datasets(self):
if hasattr(self, 'datasets'): if hasattr(self, 'datasets'):

Loading…
Cancel
Save