diff --git a/configs.example/datamodule/configuration/site_example_configuration.yaml b/configs.example/datamodule/configuration/site_example_configuration.yaml new file mode 100644 index 00000000..192ef0a6 --- /dev/null +++ b/configs.example/datamodule/configuration/site_example_configuration.yaml @@ -0,0 +1,125 @@ +general: + description: Example config for producing PVNet samples for a reneweble generation site + name: site_example_config + +input_data: + + site: + # Path to Site data in NetCDF format + file_path: PLACEHOLDER.nc + # Path to metadata in CSV format + metadata_file_path: PLACEHOLDER.csv + time_resolution_minutes: 15 + interval_start_minutes: -60 + # Specified for intraday + interval_end_minutes: 480 + dropout_timedeltas_minutes: null + dropout_fraction: 0 # Fraction of samples with dropout + + gsp: + # Path to GSP data in zarr format + # e.g. gs://solar-pv-nowcasting-data/PV/GSP/v7/pv_gsp.zarr + zarr_path: PLACEHOLDER.zarr + interval_start_minutes: -60 + # Specified for intraday + interval_end_minutes: 480 + time_resolution_minutes: 30 + # Random value from the list below will be chosen as the delay when dropout is used + # If set to null no dropout is applied. Only values before t0 are dropped out for GSP. + # Values after t0 are assumed as targets and cannot be dropped. + dropout_timedeltas_minutes: null + dropout_fraction: 0 # Fraction of samples with dropout + + nwp: + + ecmwf: + provider: ecmwf + # Path to ECMWF NWP data in zarr format + # n.b. It is not necessary to use multiple or any NWP data. These entries can be removed + zarr_path: PLACEHOLDER.zarr + interval_start_minutes: -60 + # Specified for intraday + interval_end_minutes: 480 + time_resolution_minutes: 60 + channels: + - t2m # 2-metre temperature + - dswrf # downwards short-wave radiation flux + - dlwrf # downwards long-wave radiation flux + - hcc # high cloud cover + - mcc # medium cloud cover + - lcc # low cloud cover + - tcc # total cloud cover + - sde # snow depth water equivalent + - sr # direct solar radiation + - duvrs # downwards UV radiation at surface + - prate # precipitation rate + - u10 # 10-metre U component of wind speed + - u100 # 100-metre U component of wind speed + - u200 # 200-metre U component of wind speed + - v10 # 10-metre V component of wind speed + - v100 # 100-metre V component of wind speed + - v200 # 200-metre V component of wind speed + image_size_pixels_height: 24 + image_size_pixels_width: 24 + dropout_timedeltas_minutes: [-360] + dropout_fraction: 1.0 # Fraction of samples with dropout + max_staleness_minutes: null + + ukv: + provider: ukv + # Path to UKV NWP data in zarr format + # e.g. gs://solar-pv-nowcasting-data/NWP/UK_Met_Office/UKV_intermediate_version_7.zarr + # n.b. It is not necessary to use multiple or any NWP data. These entries can be removed + zarr_path: PLACEHOLDER.zarr + interval_start_minutes: -60 + # Specified for intraday + interval_end_minutes: 480 + time_resolution_minutes: 60 + channels: + - t # 2-metre temperature + - dswrf # downwards short-wave radiation flux + - dlwrf # downwards long-wave radiation flux + - hcc # high cloud cover + - mcc # medium cloud cover + - lcc # low cloud cover + - sde # snow depth water equivalent + - r # relative humidty + - vis # visibility + - si10 # 10-metre wind speed + - wdir10 # 10-metre wind direction + - prate # precipitation rate + # These variables exist in CEDA training data but not in the live MetOffice live service + - hcct # height of convective cloud top, meters above surface. NaN if no clouds + - cdcb # height of lowest cloud base > 3 oktas + - dpt # dew point temperature + - prmsl # mean sea level pressure + - h # geometrical? (maybe geopotential?) height + image_size_pixels_height: 24 + image_size_pixels_width: 24 + dropout_timedeltas_minutes: [-360] + dropout_fraction: 1.0 # Fraction of samples with dropout + max_staleness_minutes: null + + satellite: + # Path to Satellite data (non-HRV) in zarr format + # e.g. gs://solar-pv-nowcasting-data/satellite/EUMETSAT/SEVIRI_RSS/v4/2020_nonhrv.zarr + zarr_path: PLACEHOLDER.zarr + interval_start_minutes: -30 + interval_end_minutes: 0 + time_resolution_minutes: 5 + channels: + - IR_016 # Surface, cloud phase + - IR_039 # Surface, clouds, wind fields + - IR_087 # Surface, clouds, atmospheric instability + - IR_097 # Ozone + - IR_108 # Surface, clouds, wind fields, atmospheric instability + - IR_120 # Surface, clouds, atmospheric instability + - IR_134 # Cirrus cloud height, atmospheric instability + - VIS006 # Surface, clouds, wind fields + - VIS008 # Surface, clouds, wind fields + - WV_062 # Water vapor, high level clouds, upper air analysis + - WV_073 # Water vapor, atmospheric instability, upper-level dynamics + image_size_pixels_height: 24 + image_size_pixels_width: 24 + dropout_timedeltas_minutes: null + dropout_fraction: 0 # Fraction of samples with dropout