|
|
|
|
@ -7,7 +7,7 @@ from actesdataset import EtreeXMLDataSet
|
|
|
|
|
logger = logging.getLogger(__name__)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
def parse_xml_collection(datasets: Dict[str, EtreeXMLDataSet], param: str) -> Dict[str, EtreeXMLDataSet]:
|
|
|
|
|
def parse_xml_collection(datasets: Dict[str, EtreeXMLDataSet]) -> Dict[str, EtreeXMLDataSet]:
|
|
|
|
|
"node function entry point, performs batch processing"
|
|
|
|
|
output_datasets = dict()
|
|
|
|
|
for dataset_filenamestem, dataset in datasets.items():
|
|
|
|
|
@ -18,6 +18,7 @@ def parse_xml_collection(datasets: Dict[str, EtreeXMLDataSet], param: str) -> Di
|
|
|
|
|
logger.info(f"dataset {descr} loaded")
|
|
|
|
|
output_source_doc = dataset.transform()
|
|
|
|
|
# set dataset's output filepath
|
|
|
|
|
# output_filepath = _outputfolderpath
|
|
|
|
|
output_filepath = dataset.filepath.replace("01_raw", "02_intermediate")
|
|
|
|
|
output_xmldataset = EtreeXMLDataSet(output_filepath)
|
|
|
|
|
# let's create subfolders now, if they don't exist
|
|
|
|
|
|