get catalog

develop
gwen 3 years ago
parent 1991698e5c
commit 55b6990228

@ -22,6 +22,12 @@ class ProjectContext(KedroContext):
houses = self.config_loader.get("houses*") houses = self.config_loader.get("houses*")
return houses['raw_datapath'] return houses['raw_datapath']
def get_catalog(self):
    """Catalog loader entry point.

    Asks ``self.config_loader`` for the configuration matching the
    ``catalog*`` pattern (the YAML-defined catalogs) and returns whatever
    the loader hands back, unchanged.
    """
    return self.config_loader.get('catalog*')
# def _get_catalog(self, *args, **kwargs): # def _get_catalog(self, *args, **kwargs):
# "catalog loader entry point" # "catalog loader entry point"
# # loading yaml defined catalogs # # loading yaml defined catalogs

@ -18,7 +18,7 @@ def parse_xml_collection(datasetcollection: XMLDataSetCollection) -> Dict[str, E
# the dataset **is not** registered in kedro's catalog # the dataset **is not** registered in kedro's catalog
dataset._load() dataset._load()
descr = dataset._describe() descr = dataset._describe()
logger.info(f"dataset {descr} loaded") # logger.info(f"dataset {descr} loaded")
output_source_doc = dataset.transform() output_source_doc = dataset.transform()
# set dataset's output filepath # set dataset's output filepath
# output_filepath = dataset.filepath.replace("01_raw", "02_intermediate") # output_filepath = dataset.filepath.replace("01_raw", "02_intermediate")

@ -1,7 +1,19 @@
import logging
from kedro.pipeline import Pipeline, node, pipeline from kedro.pipeline import Pipeline, node, pipeline
from .nodes import parse_xml_collection from .nodes import parse_xml_collection
from kedro.framework.session import KedroSession
logger = logging.getLogger(__name__)
# NOTE(review): these statements appear to sit at module top level, so simply
# importing this module would create a Kedro session and load the project
# context as a side effect -- confirm this is intended and not leftover
# debugging code.
with KedroSession.create() as session:
    context = session.load_context()
    # The loaded context is expected to expose get_catalog(); the result is
    # indexed by catalog entry name below.
    catalog = context.get_catalog()
    bourbon = catalog['bourbon_xmlcontent']
    # Pass the value as a logging argument instead of concatenating strings:
    # the rendered message is the same for a str, formatting is deferred
    # until the record is actually emitted, and a non-str 'folderpath' no
    # longer raises TypeError at import time.
    logger.info("+++++++++++++++++++%s", bourbon['folderpath'])
def create_pipeline(**kwargs) -> Pipeline: def create_pipeline(**kwargs) -> Pipeline:
return pipeline( return pipeline(

Loading…
Cancel
Save