# Combined Dataset Ideas

This notebook contains several ideas for implementing a combined dataset in GluonTS.

In [1]:
from gift_eval.data import Dataset

import os
from dotenv import load_dotenv
from pathlib import Path

load_dotenv()

# Resolve the GIFT-Eval data root from the GIFT_EVAL environment variable
# (load_dotenv above may populate it from a .env file). Fail early with an
# actionable message: Path(None) would otherwise raise an opaque TypeError.
gift_eval_env = os.getenv("GIFT_EVAL")
if not gift_eval_env:
    raise RuntimeError(
        "The GIFT_EVAL environment variable is not set; "
        "point it at the GIFT-Eval data directory (e.g. in a .env file)."
    )

gift_eval_path = Path(gift_eval_env)
if not gift_eval_path.is_dir():
    raise FileNotFoundError(
        f"GIFT_EVAL does not point to a directory: {gift_eval_path}"
    )

# Build the list of dataset identifiers from the directory layout:
#   <root>/<dataset>/<freq>/  ->  "<dataset>/<freq>"  (one entry per sub-directory)
#   <root>/<dataset>/         ->  "<dataset>"         (no sub-directories)
dataset_names = []
for dataset_dir in gift_eval_path.iterdir():
    # Skip plain files and hidden entries at the top level.
    if dataset_dir.name.startswith(".") or not dataset_dir.is_dir():
        continue

    # Apply the same hidden-entry filter one level down so that stray hidden
    # folders (e.g. checkpoint/cache directories) are not listed as frequencies.
    freq_dirs = [
        d
        for d in dataset_dir.iterdir()
        if d.is_dir() and not d.name.startswith(".")
    ]
    if freq_dirs:
        dataset_names.extend(f"{dataset_dir.name}/{d.name}" for d in freq_dirs)
    else:
        dataset_names.append(dataset_dir.name)

# iterdir() yields entries in arbitrary, filesystem-dependent order; sort once
# so every later cell sees the same ordering on every machine.
dataset_names.sort()

print("Available datasets in GIFT_EVAL:")
for name in dataset_names:
    print(f"- {name}")

  from .autonotebook import tqdm as notebook_tqdm


Available datasets in GIFT_EVAL:
- LOOP_SEATTLE/5T
- LOOP_SEATTLE/D
- LOOP_SEATTLE/H
- M_DENSE/D
- M_DENSE/H
- SZ_TAXI/15T
- SZ_TAXI/H
- bitbrains_fast_storage/5T
- bitbrains_fast_storage/H
- bitbrains_rnd/5T
- bitbrains_rnd/H
- bizitobs_application
- bizitobs_l2c/5T
- bizitobs_l2c/H
- bizitobs_service
- car_parts_with_missing
- covid_deaths
- electricity/15T
- electricity/D
- electricity/H
- electricity/W
- ett1/15T
- ett1/D
- ett1/H
- ett1/W
- ett2/15T
- ett2/D
- ett2/H
- ett2/W
- hierarchical_sales/D
- hierarchical_sales/W
- hospital
- jena_weather/10T
- jena_weather/D
- jena_weather/H
- kdd_cup_2018_with_missing/D
- kdd_cup_2018_with_missing/H
- m4_daily
- m4_hourly
- m4_monthly
- m4_quarterly
- m4_weekly
- m4_yearly
- restaurant
- saugeenday/D
- saugeenday/M
- saugeenday/W
- solar/10T
- solar/D
- solar/H
- solar/W
- temperature_rain_with_missing
- us_births/D
- us_births/M
- us_births/W


In [2]:
import random

# Fixed seed so that Restart Kernel -> Run All reproduces the same selection.
SAMPLE_SEED = 42

# Number of datasets to draw.
n = 8

# Use a dedicated seeded generator (leaves the global `random` state untouched)
# and sample from a sorted copy: the order of `dataset_names` may depend on
# filesystem iteration order, which would otherwise change the seeded result.
names = random.Random(SAMPLE_SEED).sample(sorted(dataset_names), n)
names

['solar/W',
 'bizitobs_application',
 'ett2/15T',
 'm4_daily',
 'bitbrains_rnd/H',
 'hospital',
 'hierarchical_sales/D',
 'saugeenday/W']