diff --git a/nowcasting_dataset/config/gcp.yaml b/nowcasting_dataset/config/gcp.yaml
index 92574e07..4f5ded46 100644
--- a/nowcasting_dataset/config/gcp.yaml
+++ b/nowcasting_dataset/config/gcp.yaml
@@ -6,7 +6,7 @@ input_data:
   satellite_zarr_path: gs://solar-pv-nowcasting-data/satellite/EUMETSAT/SEVIRI_RSS/OSGB36/all_zarr_int16_single_timestep.zarr
   solar_pv_data_filename: gs://solar-pv-nowcasting-data/PV/PVOutput.org/UK_PV_timeseries_batch.nc
   solar_pv_metadata_filename: gs://solar-pv-nowcasting-data/PV/PVOutput.org/UK_PV_metadata.csv
-  gsp_zarr_path: gs://solar-pv-nowcasting-data/PV/PVOutput.org/PV/GSP/v0/pv_gsp.zarr
+  gsp_zarr_path: gs://solar-pv-nowcasting-data/PV/PVOutput.org/PV/GSP/v1/pv_gsp.zarr
   topographic_filename: gs://solar-pv-nowcasting-data/Topographic/europe_dem_1km_osgb.tif
 output_data:
   filepath: gs://solar-pv-nowcasting-data/prepared_ML_training_data/v6/
diff --git a/nowcasting_dataset/config/on_premises.yaml b/nowcasting_dataset/config/on_premises.yaml
index 984cc132..20cf9931 100644
--- a/nowcasting_dataset/config/on_premises.yaml
+++ b/nowcasting_dataset/config/on_premises.yaml
@@ -7,7 +7,7 @@ input_data:
   solar_pv_path:
   solar_pv_data_filename: /storage/data/ocf/solar_pv_nowcasting/nowcasting_dataset_pipeline/raw/PV/PVOutput.org/UK_PV_timeseries_batch.nc
   solar_pv_metadata_filename: /storage/data/ocf/solar_pv_nowcasting/nowcasting_dataset_pipeline/raw/PV/PVOutput.org/UK_PV_metadata.csv
-  gsp_zarr_path: /storage/data/ocf/solar_pv_nowcasting/nowcasting_dataset_pipeline/raw/PV/GSP/v0/pv_gsp.zarr
+  gsp_zarr_path: /storage/data/ocf/solar_pv_nowcasting/nowcasting_dataset_pipeline/raw/PV/GSP/v1/pv_gsp.zarr
 output_data:
   filepath: /storage/data/ocf/solar_pv_nowcasting/nowcasting_dataset_pipeline/prepared_ML_training_data/v7/
 process:
diff --git a/nowcasting_dataset/data_sources/gsp/gsp_data_source.py b/nowcasting_dataset/data_sources/gsp/gsp_data_source.py
index c62a01ae..6b89e6c0 100644
--- a/nowcasting_dataset/data_sources/gsp/gsp_data_source.py
+++ b/nowcasting_dataset/data_sources/gsp/gsp_data_source.py
@@ -58,6 +58,8 @@ class GSPDataSource(ImageDataSource):
     get_center: bool = True
     # the maximum number of gsp's to be loaded for data sample
     n_gsp_per_example: int = DEFAULT_N_GSP_PER_EXAMPLE
+    # scale from zero to one
+    do_scale_0_to_1: bool = False
 
     def __post_init__(self, image_size_pixels: int, meters_per_pixel: int):
         """
@@ -96,7 +98,8 @@ def load(self):
         )
 
         # scale from 0 to 1
-        self.gsp_power = scale_to_0_to_1(self.gsp_power)
+        if self.do_scale_0_to_1:
+            self.gsp_power = scale_to_0_to_1(self.gsp_power)
 
         logger.debug(f"There are {len(self.gsp_power.columns)} GSP")
 
@@ -389,7 +392,16 @@ def load_solar_gsp_data(
     # Open data - it may be quicker to open byte file first, but decided just to keep it like this at the moment
     gsp_power = xr.open_dataset(filename, engine="zarr")
     gsp_power = gsp_power.sel(datetime_gmt=slice(start_dt, end_dt))
+
+    # only take generation data
+    gsp_power = gsp_power.generation_mw
+
+    # make dataframe with index datetime_gmt and columns of gsp_id
     gsp_power_df = gsp_power.to_dataframe()
+    gsp_power_df.reset_index(inplace=True)
+    gsp_power_df = gsp_power_df.pivot(
+        index="datetime_gmt", columns="gsp_id", values="generation_mw"
+    )
 
     # Save memory
     del gsp_power
diff --git a/nowcasting_dataset/data_sources/gsp/pvlive.py b/nowcasting_dataset/data_sources/gsp/pvlive.py
index 112d2f61..d68ba519 100644
--- a/nowcasting_dataset/data_sources/gsp/pvlive.py
+++ b/nowcasting_dataset/data_sources/gsp/pvlive.py
@@ -3,6 +3,10 @@
 import logging
 
 import pandas as pd
 from pvlive_api import PVLive
+from typing import Optional
+import pytz
+from tqdm import tqdm
+from concurrent import futures
 
 from nowcasting_dataset.data_sources.gsp.eso import get_list_of_gsp_ids
@@ -12,7 +16,7 @@
 
 
 def load_pv_gsp_raw_data_from_pvlive(
-    start: datetime, end: datetime, number_of_gsp: int = None
+    start: datetime, end: datetime, number_of_gsp: int = None, normalize_data: bool = True
 ) -> pd.DataFrame:
     """
     Load raw pv gsp data from pvlive. Note that each gsp is loaded separately. Also the data is loaded in 30 day chunks.
@@ -21,6 +25,7 @@
         start: the start date for gsp data to load
         end: the end date for gsp data to load
         number_of_gsp: The number of gsp to load. Note that on 2021-09-01 there were 338 to load.
+        normalize_data: Option to normalize the generation according to installed capacity
 
     Returns: Data frame of time series of gsp data. Shows PV data for each GSP from {start} to {end}
 
@@ -38,46 +43,59 @@
 
     gsp_data_df = []
     logger.debug(f"Will be getting data for {len(gsp_ids)} gsp ids")
 
     # loop over gsp ids
-    for gsp_id in gsp_ids:
-
-        one_gsp_data_df = []
-
-        # set the first chunk start and end times
-        start_chunk = first_start_chunk
-        end_chunk = first_end_chunk
-
-        # loop over 30 days chunks (nice to see progress instead of waiting a long time for one command - this might
-        # not be the fastest)
-        while start_chunk <= end:
-            logger.debug(f"Getting data for gsp id {gsp_id} from {start_chunk} to {end_chunk}")
-
-            one_gsp_data_df.append(
-                pvl.between(
+    # limit the total number of concurrent tasks to 4, so that we don't hit the pvlive api too much
+    future_tasks = []
+    with futures.ThreadPoolExecutor(max_workers=4) as executor:
+        for gsp_id in gsp_ids:
+
+            # set the first chunk start and end times
+            start_chunk = first_start_chunk
+            end_chunk = first_end_chunk
+
+            # loop over 30 day chunks (nice to see progress instead of waiting a long time for one command - this
+            # might not be the fastest)
+            while start_chunk <= end:
+                logger.debug(f"Getting data for gsp id {gsp_id} from {start_chunk} to {end_chunk}")
+
+                task = executor.submit(
+                    pvl.between,
                     start=start_chunk,
                     end=end_chunk,
                     entity_type="gsp",
                     entity_id=gsp_id,
-                    extra_fields="",
+                    extra_fields="installedcapacity_mwp",
                     dataframe=True,
                 )
-            )
-
-            # add 30 days to the chunk, to get the next chunk
-            start_chunk = start_chunk + CHUNK_DURATION
-            end_chunk = end_chunk + CHUNK_DURATION
+                future_tasks.append(task)
+
+                # add 30 days to the chunk, to get the next chunk
+                start_chunk = start_chunk + CHUNK_DURATION
+                end_chunk = end_chunk + CHUNK_DURATION
 
-            if end_chunk > end:
-                end_chunk = end
+                if end_chunk > end:
+                    end_chunk = end
 
-        # join together one gsp data, and sort
-        one_gsp_data_df = pd.concat(one_gsp_data_df)
-        one_gsp_data_df = one_gsp_data_df.sort_values(by=["gsp_id", "datetime_gmt"])
+    logger.debug("Getting results")
+    # Collect results from each thread.
+    for task in tqdm(future_tasks):
+        one_chunk_one_gsp_gsp_data_df = task.result()
 
-        # append to longer list
-        gsp_data_df.append(one_gsp_data_df)
+        if normalize_data:
+            one_chunk_one_gsp_gsp_data_df["generation_mw"] = (
+                one_chunk_one_gsp_gsp_data_df["generation_mw"]
+                / one_chunk_one_gsp_gsp_data_df["installedcapacity_mwp"]
+            )
 
+        # append to longer list
+        gsp_data_df.append(one_chunk_one_gsp_gsp_data_df)
+
+    # join together gsp data
     gsp_data_df = pd.concat(gsp_data_df)
 
+    # sort
+    gsp_data_df = gsp_data_df.sort_values(by=["gsp_id", "datetime_gmt"])
+
     # remove any extra data loaded
     gsp_data_df = gsp_data_df[gsp_data_df["datetime_gmt"] <= end]
@@ -88,3 +106,49 @@
     gsp_data_df["datetime_gmt"] = gsp_data_df["datetime_gmt"].dt.tz_localize(None)
 
     return gsp_data_df
+
+
+def get_installed_capacity(
+    start: Optional[datetime] = datetime(2021, 1, 1, tzinfo=pytz.utc),
+    maximum_number_of_gsp: Optional[int] = None,
+) -> pd.Series:
+    """
+    Get the installed capacity of each gsp
+
+    This can take ~30 seconds for getting the full list
+
+    Args:
+        start: optional datetime when the installed capacity is collected
+        maximum_number_of_gsp: Truncate list of GSPs to be no larger than this number of GSPs.
+            Set to None to disable truncation.
+
+    Returns: pd.Series of installed capacity indexed by gsp_id
+
+    """
+    logger.debug(f"Getting all installed capacity at {start}")
+
+    # get a list of gsp ids
+    gsp_ids = get_list_of_gsp_ids(maximum_number_of_gsp=maximum_number_of_gsp)
+
+    # set up the PVLive class, although here we are getting historic data
+    pvl = PVLive()
+
+    # loop over gsp_id to get installed capacity
+    data = []
+    for gsp_id in gsp_ids:
+        d = pvl.at_time(
+            start,
+            entity_type="gsp",
+            extra_fields="installedcapacity_mwp",
+            dataframe=True,
+            entity_id=gsp_id,
+        )
+        data.append(d)
+
+    # join data together
+    data_df = pd.concat(data)
+
+    # set gsp_id as index
+    data_df.set_index("gsp_id", inplace=True)
+
+    return data_df["installedcapacity_mwp"]
diff --git a/nowcasting_dataset/dataset/split/__init__.py b/nowcasting_dataset/dataset/split/__init__.py
new file mode 100644
index 00000000..c7eb89d1
--- /dev/null
+++ b/nowcasting_dataset/dataset/split/__init__.py
@@ -0,0 +1 @@
+""" split functions """
diff --git a/scripts/get_raw_pv_gsp_data.py b/scripts/get_raw_pv_gsp_data.py
index 5406d053..32b56c28 100755
--- a/scripts/get_raw_pv_gsp_data.py
+++ b/scripts/get_raw_pv_gsp_data.py
@@ -11,6 +11,7 @@
 import yaml
 import os
 import numcodecs
+import xarray as xr
 
 from nowcasting_dataset.data_sources.gsp.pvlive import load_pv_gsp_raw_data_from_pvlive
 from pathlib import Path
@@ -36,11 +37,21 @@
 data_df = load_pv_gsp_raw_data_from_pvlive(start=start, end=end)
 
 # pivot to index as datetime_gmt, and columns as gsp_id
-data_df = data_df.pivot(index="datetime_gmt", columns="gsp_id", values="generation_mw")
-data_df.columns = [str(col) for col in data_df.columns]
+data_generation = data_df.pivot(index="datetime_gmt", columns="gsp_id", values="generation_mw")
+data_generation.columns = [str(col) for col in data_generation.columns]
+data_generation_xarray = xr.DataArray(
+    data_generation, name="generation_mw", dims=["datetime_gmt", "gsp_id"]
+)
 
-# change to xarray
-data_xarray = data_df.to_xarray()
+data_capacity = data_df.pivot(
+    index="datetime_gmt", columns="gsp_id", values="installedcapacity_mwp"
+)
+data_capacity.columns = [str(col) for col in data_capacity.columns]
+data_capacity_xarray = xr.DataArray(
+    data_capacity, name="installedcapacity_mwp", dims=["datetime_gmt", "gsp_id"]
+)
+
+data_xarray = xr.merge([data_generation_xarray, data_capacity_xarray])
 
 # save config to file
 with open(os.path.join(LOCAL_TEMP_PATH, "configuration.yaml"), "w+") as f:
diff --git a/tests/data/gsp/test.zarr/.zmetadata b/tests/data/gsp/test.zarr/.zmetadata
index a6cf4ed1..ab697b80 100644
--- a/tests/data/gsp/test.zarr/.zmetadata
+++ b/tests/data/gsp/test.zarr/.zmetadata
@@ -4,384 +4,9 @@
     ".zgroup": {
         "zarr_format": 2
     },
-    "1/.zarray": {
-        "chunks": [
-            145
-        ],
-        "compressor": {
-            "blocksize": 0,
-            "clevel": 5,
-            "cname": "lz4",
-            "id": "blosc",
-            "shuffle": 1
-        },
-        "dtype": "
+    assert gsp_pv_df["generation_mw"].max() > 1
+
+    gsp_pv_df = load_pv_gsp_raw_data_from_pvlive(
+        start=start, end=end, number_of_gsp=1, normalize_data=True
+    )
+    assert gsp_pv_df["generation_mw"].max() <= 1
+
+
+def test_load_gsp_raw_data_from_pvlive_one_gsp():
+    """
+    Test that one gsp system data can be loaded
+    """
+
+    start = datetime(2019, 1, 1, tzinfo=pytz.utc)
+    end = datetime(2019, 3, 1, tzinfo=pytz.utc)
+
+    gsp_pv_df = load_pv_gsp_raw_data_from_pvlive(start=start, end=end, number_of_gsp=1)
+
+    assert isinstance(gsp_pv_df, pd.DataFrame)
+    assert len(gsp_pv_df) == (48 * 59 + 1)
+    # 31 days in january, 28 days in february, plus one for the first timestamp in march
+    assert "datetime_gmt" in gsp_pv_df.columns
+    assert "generation_mw" in gsp_pv_df.columns
+
+
+def test_load_gsp_raw_data_from_pvlive_many_gsp():
+    """
+    Test that data for many gsp systems can be loaded
+    """
+
+    start = datetime(2019, 1, 1, tzinfo=pytz.utc)
+    end = datetime(2019, 1, 2, tzinfo=pytz.utc)
+
+    gsp_pv_df = load_pv_gsp_raw_data_from_pvlive(start=start, end=end, number_of_gsp=10)
+
+    assert isinstance(gsp_pv_df, pd.DataFrame)
+    assert len(gsp_pv_df) == (48 + 1) * 10
+    assert "datetime_gmt" in gsp_pv_df.columns
+    assert "generation_mw" in gsp_pv_df.columns
+
+
+def test_get_installed_capacity():
+
+    installed_capacity = get_installed_capacity(maximum_number_of_gsp=10)
+
+    assert len(installed_capacity) == 10
+    assert "installedcapacity_mwp" == installed_capacity.name
+    assert installed_capacity.iloc[0] == 342.02623
+    assert installed_capacity.iloc[9] == 308.00432
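
For reference, a minimal usage sketch of the updated loader, mirroring the tests above (the date range and GSP count are illustrative; it assumes the pvlive_api package is installed and the PV_Live API is reachable):

from datetime import datetime

import pytz

from nowcasting_dataset.data_sources.gsp.pvlive import load_pv_gsp_raw_data_from_pvlive

# Fetch two months of half-hourly data for 10 GSPs. With normalize_data=True the
# generation_mw column is divided by installedcapacity_mwp, so values lie in [0, 1].
start = datetime(2019, 1, 1, tzinfo=pytz.utc)
end = datetime(2019, 3, 1, tzinfo=pytz.utc)
gsp_pv_df = load_pv_gsp_raw_data_from_pvlive(
    start=start, end=end, number_of_gsp=10, normalize_data=True
)
assert gsp_pv_df["generation_mw"].max() <= 1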
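
Similarly, a sketch of the new get_installed_capacity helper (the default timestamp of 2021-01-01 UTC comes from its signature; fetching the full list of ~338 GSPs takes roughly 30 seconds):

from nowcasting_dataset.data_sources.gsp.pvlive import get_installed_capacity

# Returns a pd.Series of installedcapacity_mwp (MWp) indexed by gsp_id.
installed_capacity = get_installed_capacity(maximum_number_of_gsp=10)
print(installed_capacity.head())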
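
The long-to-wide pivot added to load_solar_gsp_data can be checked in isolation; a small sketch with made-up numbers (the column names match the zarr variables, the values are illustrative):

import pandas as pd

# Long format, as produced by gsp_power.to_dataframe() followed by reset_index()
long_df = pd.DataFrame(
    {
        "datetime_gmt": pd.to_datetime(
            ["2019-01-01 00:00", "2019-01-01 00:00", "2019-01-01 00:30", "2019-01-01 00:30"]
        ),
        "gsp_id": [1, 2, 1, 2],
        "generation_mw": [0.0, 0.1, 0.2, 0.3],
    }
)

# Wide format: one row per datetime_gmt, one column per gsp_id - the shape
# GSPDataSource works with downstream.
wide_df = long_df.pivot(index="datetime_gmt", columns="gsp_id", values="generation_mw")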