# _________________________________________________________________________
# Raw CSV inputs. Each file is semicolon-delimited, hence `sep: ";"` on load.
actors:
  type: pandas.CSVDataSet
  filepath: data/01_raw/csv/actors.csv
  load_args:
    sep: ";"

corpus-agnes-bourgogne:
  type: pandas.CSVDataSet
  filepath: data/01_raw/csv/corpus-agnes-bourgogne.csv
  load_args:
    sep: ";"

corpus-charles-i:
  type: pandas.CSVDataSet
  filepath: data/01_raw/csv/corpus-charles-i.csv
  load_args:
    sep: ";"

# _________________________________________________________________________
# Custom CSV dataset test sample (project-defined `myowndataset.MyOwnDataSet`).
# `dataset_test` reads the same raw file as the `actors` entry.
dataset_test:
  type: myowndataset.MyOwnDataSet
  filepath: data/01_raw/csv/actors.csv
  load_args:
    sep: ";"

# NOTE(review): only `save_args` is declared here. If this entry is ever
# loaded back, confirm whether MyOwnDataSet needs a matching
# `load_args: sep: ";"` to read the semicolon-delimited output.
preprocessed_dataset_test:
  type: myowndataset.MyOwnDataSet
  filepath: data/02_intermediate/csv/preprocessed_test_dataset.csv
  save_args:
    sep: ";"

# _________________________________________________________________________
# Custom XML dataset sample (project-defined `actesdataset.XMLDataSet`).
load_xml:
  type: actesdataset.XMLDataSet
  filepath: data/01_raw/xml/Anjou/anj_is_i_1441_08_05a.xml

# NOTE(review): the target path ends in `.html` while the dataset type is
# XMLDataSet — presumably the transformed output of `load_xml`; confirm that
# XMLDataSet is the intended writer for HTML.
preprocess_html:
  type: actesdataset.XMLDataSet
  filepath: data/02_intermediate/xml/Anjou/anj_is_i_1441_08_05a.html

# _________________________________________________________________________
# Intermediate output for the preprocessed actors table.
preprocessed_actors:
  type: pandas.CSVDataSet
  filepath: data/02_intermediate/csv/preprocessed_actors.csv
  # Mirror the save delimiter on load so the file can be read back with the
  # same separator it was written with (the reader's default is a comma).
  load_args:
    sep: ";"
  save_args:
    sep: ";"