You cannot select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

80 lines
1.9 KiB
YAML

# _________________________________________________________________________
# loading some data catalogs
# Actors table read from data/01_raw, parsed as a semicolon-separated CSV.
actors:
  type: pandas.CSVDataSet
  filepath: data/01_raw/csv/actors.csv
  load_args:
    # Passed through to the pandas CSV reader: fields are split on ';'.
    sep: ";"
# "corpus-agnes-bourgogne" CSV from data/01_raw, semicolon-separated.
corpus-agnes-bourgogne:
  type: pandas.CSVDataSet
  filepath: data/01_raw/csv/corpus-agnes-bourgogne.csv
  load_args:
    # Fields are split on ';' rather than the default ','.
    sep: ";"
# "corpus-charles-i" CSV from data/01_raw, semicolon-separated.
corpus-charles-i:
  type: pandas.CSVDataSet
  filepath: data/01_raw/csv/corpus-charles-i.csv
  load_args:
    # Fields are split on ';' rather than the default ','.
    sep: ";"
# _________________________________________________________________________
# custom csv dataset test sample
# Test entry for the project's custom dataset class
# (myowndataset.MyOwnDataSet); it points at the same actors.csv file
# as the `actors` entry.
dataset_test:
  type: myowndataset.MyOwnDataSet
  filepath: data/01_raw/csv/actors.csv
  load_args:
    # NOTE(review): presumably forwarded by MyOwnDataSet to its CSV
    # reader - confirm against the class implementation.
    sep: ";"
# Output location (data/02_intermediate) for the custom-dataset test,
# handled by myowndataset.MyOwnDataSet.
preprocessed_dataset_test:
  type: myowndataset.MyOwnDataSet
  filepath: data/02_intermediate/csv/preprocessed_test_dataset.csv
  save_args:
    # Write with ';' as the field separator.
    # NOTE(review): no matching load_args is declared, so reading this
    # entry back relies on MyOwnDataSet's default separator - confirm.
    sep: ";"
# _________________________________________________________________________
# custom xml dataset sample
# Single XML file under data/01_raw, handled by the project's custom
# actesdataset.XMLDataSet class.
load_xml:
  type: actesdataset.XMLDataSet
  filepath: data/01_raw/xml/anjou/anj_is_i_1441_08_05a.xml
# HTML file under data/02_intermediate with the same base name as the
# XML file used by `load_xml`; it is also handled by
# actesdataset.XMLDataSet even though the target has an .html extension.
preprocess_html:
  type: actesdataset.XMLDataSet
  filepath: data/02_intermediate/xml/anjou/anj_is_i_1441_08_05a.html
# _________________________________________________________________________
# same test with kedro.io.PartitionedDataSet
# warning:
# this kind of YAML entry is generated programmatically
# in the generic data loader
# load_full_xml_catalog:
#   type: PartitionedDataSet
#   path: data/01_raw/xml/anjou/
#   dataset:
#     type: actesdataset.XMLDataSet
#   filename_suffix: '.xml'
# preprocess_full_catalog_html:
#   type: PartitionedDataSet
#   path: data/02_intermediate/xml/anjou/
#   dataset:
#     type: actesdataset.XMLDataSet
#   filename_suffix: '.html'
# _________________________________________________________________________
# Actors table written to data/02_intermediate as a semicolon-separated CSV.
preprocessed_actors:
  type: pandas.CSVDataSet
  filepath: data/02_intermediate/csv/preprocessed_actors.csv
  save_args:
    # Passed through to the pandas CSV writer: fields are joined with ';'.
    sep: ";"