diff --git a/actes-princiers/src/actes_princiers/pipelines/xml_processing/nodes.py b/actes-princiers/src/actes_princiers/pipelines/xml_processing/nodes.py index 0736d03..a2fa204 100755 --- a/actes-princiers/src/actes_princiers/pipelines/xml_processing/nodes.py +++ b/actes-princiers/src/actes_princiers/pipelines/xml_processing/nodes.py @@ -8,17 +8,17 @@ from actesdataset import EtreeXMLDataSet, XMLDataSetCollection logger = logging.getLogger(__name__) -#with KedroSession.create() as session: -# context = session.load_context() -# catalog = context.get_catalog() +with KedroSession.create() as session: + context = session.load_context() + catalog = context.get_catalog() def parse_xml_collection(datasetcol: XMLDataSetCollection) -> Dict[str, EtreeXMLDataSet]: "node function entry point, performs batch processing" datasets = datasetcol.datasets housename = datasetcol._housename - outputfolderpath = f"data/02_intermediate/houses/{housename}/xml" -# output_catalog = catalog[housename + '_xmlcontent'] -# outputfolderpath = output_catalog['folderpath'] +# outputfolderpath = f"data/02_intermediate/houses/{housename}/xml" + output_catalog = catalog[housename + '_xmlcontent'] + outputfolderpath = output_catalog['folderpath'] output_datasets = dict() for dataset_filenamestem, dataset in datasets.items(): # a manual load is required here, because diff --git a/actes-princiers/src/actes_princiers/pipelines/xml_processing/pipeline.py b/actes-princiers/src/actes_princiers/pipelines/xml_processing/pipeline.py index a5b8313..03827c5 100755 --- a/actes-princiers/src/actes_princiers/pipelines/xml_processing/pipeline.py +++ b/actes-princiers/src/actes_princiers/pipelines/xml_processing/pipeline.py @@ -10,10 +10,16 @@ def create_pipeline(**kwargs) -> Pipeline: node( func=parse_xml_collection, inputs="bourbon", - outputs=None, #"bourbon_xmlcontent", + outputs="bourbon_xmlcontent", name="bourbon_ds_collection", ), # node( +# func=parse_json_collection, +# inputs="bourbon", +# outputs="bourbon_json", +# name="bourbon_json_ds_collection", +# ), +# node( # func=parse_xml_collection, # inputs="berry", # outputs=None, #"berry_xmlcontent",