From 7c7ad6d20fe61c97c642ea2862ea860e673e7071 Mon Sep 17 00:00:00 2001 From: Fabian Wachsmann <k204210@l40052.lvt.dkrz.de> Date: Wed, 18 Oct 2023 11:42:17 +0200 Subject: [PATCH] Added cloud eerie --- esm-collections/cloud-access/dkrz_eerie.yaml | 26 +++++++++++++ esm-collections/disk-access/dkrz_catalog.yaml | 37 +++++++++++-------- esm-collections/disk-access/dkrz_eerie.yaml | 26 +++++++++++++ 3 files changed, 74 insertions(+), 15 deletions(-) create mode 100644 esm-collections/cloud-access/dkrz_eerie.yaml create mode 100644 esm-collections/disk-access/dkrz_eerie.yaml diff --git a/esm-collections/cloud-access/dkrz_eerie.yaml b/esm-collections/cloud-access/dkrz_eerie.yaml new file mode 100644 index 0000000..c005e9b --- /dev/null +++ b/esm-collections/cloud-access/dkrz_eerie.yaml @@ -0,0 +1,26 @@ +sources: + dkrz_eerie_kerchunk: + args: + path: "{{CATALOG_DIR}}/dkrz_eerie_kerchunk.yaml" + description: This catalog contains datasets for all raw data in /work/bm1344 and accesses the data via kerchunks in /work/bm1344/DKRZ/kerchunks + driver: yaml_file_cat + dkrz_eerie_archive: + args: + path: "{{CATALOG_DIR}}/dkrz_eerie_archive.yaml" + description: This catalog contains datasets for archived data in /arch/bm1344 + driver: yaml_file_cat + dkrz_eerie_xpublish: + args: + path: "{{CATALOG_DIR}}/dkrz_eerie_xpublish.yaml" + description: This catalog contains the same datasets as *dkrz_eerie_kerchunk* but data access is via the xpublish server *eerie.cloud.dkrz.de* + driver: yaml_file_cat + dkrz_eerie_evaluation: + args: + path: "{{CATALOG_DIR}}/dkrz_eerie_evaluation.yaml" + description: This catalog contains additional EERIE evaluation data from /work/bm1344/DKRZ + driver: yaml_file_cat + dkrz_catalog: + args: + path: "https://gitlab.dkrz.de/data-infrastructure-services/intake-esm/-/raw/master/esm-collections/cloud-access/dkrz_catalog.yaml" + description: DKRZ master catalog for all /pool/data catalogs available + driver: yaml_file_cat diff --git a/esm-collections/disk-access/dkrz_catalog.yaml b/esm-collections/disk-access/dkrz_catalog.yaml index 1a7fafe..874e118 100755 --- a/esm-collections/disk-access/dkrz_catalog.yaml +++ b/esm-collections/disk-access/dkrz_catalog.yaml @@ -4,16 +4,17 @@ metadata: additional_cmip6_disk_columns: default: - units - - path - opendap_url + - path - long_name type: list[str] additional_era5_disk_columns: default: + - step - path - - units - - long_name - short_name + - long_name + - units type: list[str] cataloonie_columns: default: @@ -41,6 +42,7 @@ plugins: sources: dkrz_cmip5_archive: args: + obj: '{{CATALOG_DIR}}/dkrz_cmip5_archive.json' read_csv_kwargs: usecols: - project @@ -58,13 +60,13 @@ sources: - uri - format - jblob_file - obj: '{{CATALOG_DIR}}/dkrz_cmip5_archive.json' description: This is an ESM collection for CMIP5 data accessible on the DKRZ's cera archive driver: - intake.open_esm_datastore dkrz_cmip5_disk: args: + obj: '{{CATALOG_DIR}}/dkrz_cmip5_disk.json' read_csv_kwargs: usecols: - project @@ -81,13 +83,13 @@ sources: - temporal_subset - uri - format - obj: '{{CATALOG_DIR}}/dkrz_cmip5_disk.json' description: This is an ESM collection for CMIP5 data accessible on the DKRZ's Lustre disk storage system in /work/kd0956/CMIP5/data/cmip5/ driver: - intake.open_esm_datastore dkrz_cmip6_cloud: args: + obj: '{{CATALOG_DIR}}/dkrz_cmip6_cloud.json' read_csv_kwargs: usecols: - project @@ -102,12 +104,13 @@ sources: - version - uri - format - obj: '{{CATALOG_DIR}}/dkrz_cmip6_cloud.json' description: This is an ESM collection for CMIP6 data accessible on DKRZ's swift cloud store - driver: intake_esm.esm_datastore + driver: + - intake.open_esm_datastore dkrz_cmip6_disk: args: + obj: '{{CATALOG_DIR}}/dkrz_cmip6_disk.json' read_csv_kwargs: usecols: - project @@ -124,12 +127,12 @@ sources: - time_range - uri - format - obj: '{{CATALOG_DIR}}/dkrz_cmip6_disk.json' description: This is a ESM-collection for CMIP6 data on DKRZ's disk storage system driver: - intake.open_esm_datastore dkrz_cordex_disk: args: + obj: '{{CATALOG_DIR}}/dkrz_cordex_disk.json' read_csv_kwargs: usecols: - project @@ -147,13 +150,13 @@ sources: - time_range - uri - format - obj: '{{CATALOG_DIR}}/dkrz_cordex_disk.json' - description: This is an ESM collection for CORDEX data accessible on the DKRZ's + description: 'This is an ESM collection for CORDEX data accessible on the DKRZ''s disk storage system ' driver: - intake.open_esm_datastore dkrz_dyamond-winter_disk: args: + obj: '{{CATALOG_DIR}}/dkrz_dyamond-winter_disk.json' read_csv_kwargs: usecols: &id001 - project @@ -173,12 +176,17 @@ sources: - format - uri - variable_id - obj: '{{CATALOG_DIR}}/dkrz_dyamond-winter_disk.json' description: Default catalog for ICON-ESM experiments by MPIMet driver: - intake.open_esm_datastore + dkrz_eerie: + args: + path: '{{CATALOG_DIR}}/dkrz_eerie.yaml' + description: EERIE Data at DKRZ + driver: yaml_file_cat dkrz_era5_disk: args: + obj: '{{CATALOG_DIR}}/dkrz_era5_disk.json' read_csv_kwargs: usecols: - project @@ -193,7 +201,6 @@ sources: - initialization_date - uri - format - obj: '{{CATALOG_DIR}}/dkrz_era5_disk.json' description: This is an ESM collection for ERA5 data accessible on the DKRZ's disk storage system in /work/bk1099/data/ driver: @@ -205,6 +212,7 @@ sources: driver: yaml_file_cat dkrz_mpige_disk: args: + obj: '{{CATALOG_DIR}}/dkrz_mpige_disk.json' read_csv_kwargs: usecols: - product_id @@ -220,7 +228,6 @@ sources: - version - uri - format - obj: '{{CATALOG_DIR}}/dkrz_mpige_disk.json' description: This is an ESM collection for the Max Planck Institute Grand Ensemble (Maher et al. 2019 https://doi.org/10/gf3kgt) cmorized by CMIP5-standards accessible on the DKRZ's Levante disk storage system in /work/mh1007/CMOR/MPI-GE @@ -228,14 +235,15 @@ sources: - intake.open_esm_datastore dkrz_nextgems_disk: args: + obj: '{{CATALOG_DIR}}/dkrz_nextgems_disk.json' read_csv_kwargs: usecols: *id001 - obj: '{{CATALOG_DIR}}/dkrz_nextgems_disk.json' description: Default catalog for ICON-ESM experiments by MPIMet driver: - intake.open_esm_datastore dkrz_palmod2_disk: args: + obj: '{{CATALOG_DIR}}/dkrz_palmod2_disk.json' read_csv_kwargs: usecols: - project @@ -250,7 +258,6 @@ sources: - format - time_range - uri - obj: '{{CATALOG_DIR}}/dkrz_palmod2_disk.json' description: This is a ESM-collection for Palmod2 data on DKRZ's disk storage system driver: diff --git a/esm-collections/disk-access/dkrz_eerie.yaml b/esm-collections/disk-access/dkrz_eerie.yaml new file mode 100644 index 0000000..c005e9b --- /dev/null +++ b/esm-collections/disk-access/dkrz_eerie.yaml @@ -0,0 +1,26 @@ +sources: + dkrz_eerie_kerchunk: + args: + path: "{{CATALOG_DIR}}/dkrz_eerie_kerchunk.yaml" + description: This catalog contains datasets for all raw data in /work/bm1344 and accesses the data via kerchunks in /work/bm1344/DKRZ/kerchunks + driver: yaml_file_cat + dkrz_eerie_archive: + args: + path: "{{CATALOG_DIR}}/dkrz_eerie_archive.yaml" + description: This catalog contains datasets for archived data in /arch/bm1344 + driver: yaml_file_cat + dkrz_eerie_xpublish: + args: + path: "{{CATALOG_DIR}}/dkrz_eerie_xpublish.yaml" + description: This catalog contains the same datasets as *dkrz_eerie_kerchunk* but data access is via the xpublish server *eerie.cloud.dkrz.de* + driver: yaml_file_cat + dkrz_eerie_evaluation: + args: + path: "{{CATALOG_DIR}}/dkrz_eerie_evaluation.yaml" + description: This catalog contains additional EERIE evaluation data from /work/bm1344/DKRZ + driver: yaml_file_cat + dkrz_catalog: + args: + path: "https://gitlab.dkrz.de/data-infrastructure-services/intake-esm/-/raw/master/esm-collections/cloud-access/dkrz_catalog.yaml" + description: DKRZ master catalog for all /pool/data catalogs available + driver: yaml_file_cat -- GitLab