diff --git a/src/param.py b/src/param.py index d7bea6a..0c76e1c 100644 --- a/src/param.py +++ b/src/param.py @@ -41,9 +41,12 @@ class Params(BaseModel): # optional parameter to configure output keep_data_files: bool = True - database_name: str = 'dataset.db' + # optional parameter to provide result output + precision: str = 'day' + resolution: int = 5000 + # stuff that we do not change in the tool base_path: str = '/out' netcdf_backend: NetCDFBackends = NetCDFBackends.XARRAY diff --git a/src/tool.yml b/src/tool.yml index 2bcf39f..0340dfe 100644 --- a/src/tool.yml +++ b/src/tool.yml @@ -27,9 +27,30 @@ tools: type: datetime description: | The end date of the datasetm, if a time dimension applies to the dataset. - # integrate dataset - # mode of operation - # keep intermediate files + integration: + type: enum + values: + - none + - all + - sptatial + - temporal + description: | + The mode of operation for the integration of each all data files associated to each data source + into a common DuckDB-based dataset. This dataset includes data for a unified spatial and temporal + extent and includes macros for aggregation. By setting `integration` the default integrations are + selected. The resulting database can still be used to query different aggregation levels. + - `none`: No integration will be performed and the DuckDB database will **NOT** be created. + - `all`: Temporal and spatial scale aggregations will be integrated, if the scale is defined in the dataset metadata. + - `spatial`: Only results for spatial aggregations will be provided. + - `temporal`: Only results for temporal aggregations will be provided. + optional: true + keep_data_files: + type: boolean + optional: true + description: | + If set to `false`, the data files clipped to the spatial and temporal scale as defined in the + data-source metadata will not be kept. This saves a lot of disk space for the output. + If set to `true` (default behavior), then there will be a `/out/datasets` directory in the output. connection: type: string optional: true