In [34]:
import os
import tensorflow as tf
from tqdm import tqdm
from datasets import Dataset

In [35]:
def convert_tf_dataset(tf_dir: str, torch_dir: str):
    """Re-save one saved ``tf.data`` dataset as a ``datasets.Dataset`` on disk.

    Every example read from ``tf_dir`` is flattened into a plain dict with the
    keys ``input_text``, ``target_text``, ``task_name``, ``task_source`` and
    ``template_idx``; the collected records are then written to ``torch_dir``.

    Args:
        tf_dir: Path handed to ``tf.data.Dataset.load``.
        torch_dir: Path handed to ``Dataset.save_to_disk``.
    """

    def _as_text(tensor) -> str:
        # Assumes the field is a scalar string tensor, so ``.numpy()`` yields
        # ``bytes`` that can be decoded directly.
        return tensor.numpy().decode("utf-8")

    # All records are materialised in memory before being handed to
    # ``Dataset.from_list``.
    records = [
        {
            "input_text": _as_text(row["inputs_pretokenized"]),
            "target_text": _as_text(row["targets_pretokenized"]),
            "task_name": _as_text(row["_task_name"]),
            "task_source": _as_text(row["_task_source"]),
            # Kept as the raw ``.numpy()`` value (not decoded like the text fields).
            "template_idx": row["_template_idx"].numpy(),
        }
        for row in tf.data.Dataset.load(tf_dir)
    ]
    Dataset.from_list(records).save_to_disk(torch_dir)

def convert_subset(tf_root_dir: str, torch_root_dir: str):
    """Convert every dataset directory found directly under ``tf_root_dir``.

    Each sub-directory ``<tf_root_dir>/<name>`` is passed to
    ``convert_tf_dataset`` and written to ``<torch_root_dir>/<name>``, so the
    output tree mirrors the input tree.

    Args:
        tf_root_dir: Directory whose immediate sub-directories are the saved
            TensorFlow datasets.
        torch_root_dir: Directory under which the converted datasets are
            written, one sub-directory per input dataset.

    Raises:
        FileNotFoundError: If ``tf_root_dir`` does not exist (from ``os.listdir``).
    """
    # ``os.listdir`` returns entries in arbitrary order; sorting makes the
    # conversion order (and the progress bar) reproducible across runs.
    # Plain files (e.g. ``.DS_Store`` or a README) are skipped because a saved
    # tf.data dataset is a directory and a stray file would abort the batch.
    dataset_names = sorted(
        name
        for name in os.listdir(tf_root_dir)
        if os.path.isdir(os.path.join(tf_root_dir, name))
    )
    for name in tqdm(dataset_names):
        tf_dir = os.path.join(tf_root_dir, name)
        torch_dir = os.path.join(torch_root_dir, name)
        convert_tf_dataset(tf_dir, torch_dir)

In [37]:
# Run the conversion for the flan2021 subset: datasets are read from
# ./subsets/flan2021 and written to ./pytorch_subsets/flan2021.
convert_subset(
    tf_root_dir="./subsets/flan2021",
    torch_root_dir="./pytorch_subsets/flan2021",
)

  0%|          | 0/355 [00:00<?, ?it/s]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

  0%|          | 1/355 [00:02<13:52,  2.35s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

  1%|          | 2/355 [00:04<13:28,  2.29s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

  1%|          | 3/355 [00:06<13:18,  2.27s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

  1%|          | 4/355 [00:09<13:52,  2.37s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

  1%|▏         | 5/355 [00:11<13:24,  2.30s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

  2%|▏         | 6/355 [00:13<13:01,  2.24s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

  2%|▏         | 7/355 [00:16<13:10,  2.27s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

  2%|▏         | 8/355 [00:18<12:58,  2.24s/it]

Saving the dataset (0/1 shards):   0%|          | 0/3130 [00:00<?, ? examples/s]

  3%|▎         | 9/355 [00:19<10:23,  1.80s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

  3%|▎         | 10/355 [00:21<11:15,  1.96s/it]

Saving the dataset (0/1 shards):   0%|          | 0/3460 [00:00<?, ? examples/s]

  3%|▎         | 11/355 [00:22<09:14,  1.61s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

  3%|▎         | 12/355 [00:24<09:57,  1.74s/it]

Saving the dataset (0/1 shards):   0%|          | 0/500 [00:00<?, ? examples/s]

  4%|▎         | 13/355 [00:24<07:13,  1.27s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

  4%|▍         | 14/355 [00:26<08:31,  1.50s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

  4%|▍         | 15/355 [00:28<10:00,  1.77s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

  5%|▍         | 16/355 [00:31<10:45,  1.90s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

  5%|▍         | 17/355 [00:34<13:32,  2.41s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

  5%|▌         | 18/355 [00:36<13:24,  2.39s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

  5%|▌         | 19/355 [00:39<13:58,  2.49s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

  6%|▌         | 20/355 [00:41<13:18,  2.38s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

  6%|▌         | 21/355 [00:44<13:06,  2.36s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

  6%|▌         | 22/355 [00:46<13:38,  2.46s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

  6%|▋         | 23/355 [00:49<13:49,  2.50s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

  7%|▋         | 24/355 [00:51<13:15,  2.40s/it]

Saving the dataset (0/1 shards):   0%|          | 0/2890 [00:00<?, ? examples/s]

  7%|▋         | 25/355 [00:52<10:47,  1.96s/it]

Saving the dataset (0/1 shards):   0%|          | 0/350 [00:00<?, ? examples/s]

  7%|▋         | 26/355 [00:52<07:45,  1.41s/it]

Saving the dataset (0/1 shards):   0%|          | 0/5220 [00:00<?, ? examples/s]

  8%|▊         | 27/355 [00:53<07:20,  1.34s/it]

Saving the dataset (0/1 shards):   0%|          | 0/5250 [00:00<?, ? examples/s]

  8%|▊         | 28/355 [00:54<06:59,  1.28s/it]

Saving the dataset (0/1 shards):   0%|          | 0/4860 [00:00<?, ? examples/s]

  8%|▊         | 29/355 [00:56<06:41,  1.23s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

  8%|▊         | 30/355 [00:58<08:50,  1.63s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

  9%|▊         | 31/355 [01:00<09:44,  1.80s/it]

Saving the dataset (0/1 shards):   0%|          | 0/5250 [00:00<?, ? examples/s]

  9%|▉         | 32/355 [01:02<08:45,  1.63s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

  9%|▉         | 33/355 [01:04<09:34,  1.78s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 10%|▉         | 34/355 [01:06<10:07,  1.89s/it]

Saving the dataset (0/1 shards):   0%|          | 0/7080 [00:00<?, ? examples/s]

 10%|▉         | 35/355 [01:08<10:06,  1.90s/it]

Saving the dataset (0/1 shards):   0%|          | 0/350 [00:00<?, ? examples/s]

 10%|█         | 36/355 [01:08<07:15,  1.36s/it]

Saving the dataset (0/1 shards):   0%|          | 0/590 [00:00<?, ? examples/s]

 10%|█         | 37/355 [01:08<05:22,  1.01s/it]

Saving the dataset (0/1 shards):   0%|          | 0/5250 [00:00<?, ? examples/s]

 11%|█         | 38/355 [01:09<05:42,  1.08s/it]

Saving the dataset (0/1 shards):   0%|          | 0/7081 [00:00<?, ? examples/s]

 11%|█         | 39/355 [01:11<06:57,  1.32s/it]

Saving the dataset (0/1 shards):   0%|          | 0/1670 [00:00<?, ? examples/s]

 11%|█▏        | 40/355 [01:12<05:30,  1.05s/it]

Saving the dataset (0/1 shards):   0%|          | 0/9220 [00:00<?, ? examples/s]

 12%|█▏        | 41/355 [01:14<07:29,  1.43s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 12%|█▏        | 42/355 [01:16<08:34,  1.64s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 12%|█▏        | 43/355 [01:18<09:41,  1.86s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 12%|█▏        | 44/355 [01:21<10:27,  2.02s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 13%|█▎        | 45/355 [01:23<10:50,  2.10s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 13%|█▎        | 46/355 [01:25<10:48,  2.10s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 13%|█▎        | 47/355 [01:27<10:51,  2.11s/it]

Saving the dataset (0/1 shards):   0%|          | 0/5640 [00:00<?, ? examples/s]

 14%|█▎        | 48/355 [01:29<09:39,  1.89s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 14%|█▍        | 49/355 [01:31<10:30,  2.06s/it]

Saving the dataset (0/1 shards):   0%|          | 0/200 [00:00<?, ? examples/s]

 14%|█▍        | 50/355 [01:31<07:29,  1.47s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 14%|█▍        | 51/355 [01:33<08:29,  1.68s/it]

Saving the dataset (0/1 shards):   0%|          | 0/500 [00:00<?, ? examples/s]

 15%|█▍        | 52/355 [01:34<06:10,  1.22s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 15%|█▍        | 53/355 [01:36<07:51,  1.56s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 15%|█▌        | 54/355 [01:38<08:53,  1.77s/it]

Saving the dataset (0/1 shards):   0%|          | 0/1650 [00:00<?, ? examples/s]

 15%|█▌        | 55/355 [01:39<06:52,  1.37s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 16%|█▌        | 56/355 [01:41<08:07,  1.63s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 16%|█▌        | 57/355 [01:43<09:01,  1.82s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 16%|█▋        | 58/355 [01:45<09:33,  1.93s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 17%|█▋        | 59/355 [01:48<10:11,  2.06s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 17%|█▋        | 60/355 [01:50<10:37,  2.16s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 17%|█▋        | 61/355 [01:52<10:45,  2.19s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 17%|█▋        | 62/355 [01:55<10:41,  2.19s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 18%|█▊        | 63/355 [01:57<11:02,  2.27s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 18%|█▊        | 64/355 [01:59<10:50,  2.24s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 18%|█▊        | 65/355 [02:01<10:48,  2.24s/it]

Saving the dataset (0/1 shards):   0%|          | 0/3465 [00:00<?, ? examples/s]

 19%|█▊        | 66/355 [02:02<08:45,  1.82s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 19%|█▉        | 67/355 [02:05<09:35,  2.00s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 19%|█▉        | 68/355 [02:07<09:41,  2.03s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 19%|█▉        | 69/355 [02:09<09:41,  2.03s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 20%|█▉        | 70/355 [02:11<09:47,  2.06s/it]

Saving the dataset (0/1 shards):   0%|          | 0/5220 [00:00<?, ? examples/s]

 20%|██        | 71/355 [02:12<08:33,  1.81s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 20%|██        | 72/355 [02:14<09:05,  1.93s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 21%|██        | 73/355 [02:17<09:52,  2.10s/it]

Saving the dataset (0/1 shards):   0%|          | 0/1650 [00:00<?, ? examples/s]

 21%|██        | 74/355 [02:17<07:28,  1.59s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 21%|██        | 75/355 [02:20<08:24,  1.80s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 21%|██▏       | 76/355 [02:22<09:32,  2.05s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 22%|██▏       | 77/355 [02:25<10:13,  2.21s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 22%|██▏       | 78/355 [02:27<10:11,  2.21s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 22%|██▏       | 79/355 [02:29<10:25,  2.27s/it]

Saving the dataset (0/1 shards):   0%|          | 0/8350 [00:00<?, ? examples/s]

 23%|██▎       | 80/355 [02:31<09:48,  2.14s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 23%|██▎       | 81/355 [02:33<09:53,  2.17s/it]

Saving the dataset (0/1 shards):   0%|          | 0/1743 [00:00<?, ? examples/s]

 23%|██▎       | 82/355 [02:34<07:36,  1.67s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 23%|██▎       | 83/355 [02:36<08:40,  1.91s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 24%|██▎       | 84/355 [02:39<08:59,  1.99s/it]

Saving the dataset (0/1 shards):   0%|          | 0/603 [00:00<?, ? examples/s]

 24%|██▍       | 85/355 [02:39<06:31,  1.45s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 24%|██▍       | 86/355 [02:41<07:35,  1.69s/it]

Saving the dataset (0/1 shards):   0%|          | 0/4956 [00:00<?, ? examples/s]

 25%|██▍       | 87/355 [02:42<06:44,  1.51s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 25%|██▍       | 88/355 [02:44<07:32,  1.70s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 25%|██▌       | 89/355 [02:47<08:19,  1.88s/it]

Saving the dataset (0/1 shards):   0%|          | 0/590 [00:00<?, ? examples/s]

 25%|██▌       | 90/355 [02:47<06:03,  1.37s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 26%|██▌       | 91/355 [02:49<07:17,  1.66s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 26%|██▌       | 92/355 [02:51<08:02,  1.83s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 26%|██▌       | 93/355 [02:54<09:19,  2.14s/it]

Saving the dataset (0/1 shards):   0%|          | 0/4860 [00:00<?, ? examples/s]

 26%|██▋       | 94/355 [02:55<08:05,  1.86s/it]

Saving the dataset (0/1 shards):   0%|          | 0/912 [00:00<?, ? examples/s]

 27%|██▋       | 95/355 [02:56<06:01,  1.39s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 27%|██▋       | 96/355 [02:58<07:08,  1.66s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 27%|██▋       | 97/355 [03:00<08:09,  1.90s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 28%|██▊       | 98/355 [03:03<08:41,  2.03s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 28%|██▊       | 99/355 [03:05<09:00,  2.11s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 28%|██▊       | 100/355 [03:08<09:37,  2.26s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 28%|██▊       | 101/355 [03:10<09:45,  2.30s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 29%|██▊       | 102/355 [03:13<10:22,  2.46s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 29%|██▉       | 103/355 [03:15<10:08,  2.41s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 29%|██▉       | 104/355 [03:17<09:41,  2.32s/it]

Saving the dataset (0/1 shards):   0%|          | 0/4950 [00:00<?, ? examples/s]

 30%|██▉       | 105/355 [03:18<08:07,  1.95s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 30%|██▉       | 106/355 [03:21<08:26,  2.03s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 30%|███       | 107/355 [03:23<09:23,  2.27s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 30%|███       | 108/355 [03:26<09:08,  2.22s/it]

Saving the dataset (0/1 shards):   0%|          | 0/2290 [00:00<?, ? examples/s]

 31%|███       | 109/355 [03:26<07:04,  1.72s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 31%|███       | 110/355 [03:28<07:34,  1.86s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 31%|███▏      | 111/355 [03:31<08:17,  2.04s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 32%|███▏      | 112/355 [03:33<08:42,  2.15s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 32%|███▏      | 113/355 [03:35<08:46,  2.17s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 32%|███▏      | 114/355 [03:38<08:49,  2.20s/it]

Saving the dataset (0/1 shards):   0%|          | 0/5640 [00:00<?, ? examples/s]

 32%|███▏      | 115/355 [03:39<07:34,  1.89s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 33%|███▎      | 116/355 [03:41<07:54,  1.98s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 33%|███▎      | 117/355 [03:43<07:59,  2.01s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 33%|███▎      | 118/355 [03:45<07:59,  2.02s/it]

Saving the dataset (0/1 shards):   0%|          | 0/1120 [00:00<?, ? examples/s]

 34%|███▎      | 119/355 [03:45<05:54,  1.50s/it]

Saving the dataset (0/1 shards):   0%|          | 0/600 [00:00<?, ? examples/s]

 34%|███▍      | 120/355 [03:46<04:22,  1.12s/it]

Saving the dataset (0/1 shards):   0%|          | 0/9220 [00:00<?, ? examples/s]

 34%|███▍      | 121/355 [03:48<05:23,  1.38s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 34%|███▍      | 122/355 [03:50<06:28,  1.67s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 35%|███▍      | 123/355 [03:52<07:01,  1.82s/it]

Saving the dataset (0/1 shards):   0%|          | 0/910 [00:00<?, ? examples/s]

 35%|███▍      | 124/355 [03:52<05:11,  1.35s/it]

Saving the dataset (0/1 shards):   0%|          | 0/1120 [00:00<?, ? examples/s]

 35%|███▌      | 125/355 [03:53<03:56,  1.03s/it]

Saving the dataset (0/1 shards):   0%|          | 0/4950 [00:00<?, ? examples/s]

 35%|███▌      | 126/355 [03:54<04:04,  1.07s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 36%|███▌      | 127/355 [03:56<05:13,  1.37s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 36%|███▌      | 128/355 [03:59<06:43,  1.78s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 36%|███▋      | 129/355 [04:01<06:59,  1.86s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 37%|███▋      | 130/355 [04:03<07:51,  2.10s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 37%|███▋      | 131/355 [04:06<07:55,  2.12s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 37%|███▋      | 132/355 [04:08<08:30,  2.29s/it]

Saving the dataset (0/1 shards):   0%|          | 0/3460 [00:00<?, ? examples/s]

 37%|███▋      | 133/355 [04:09<06:45,  1.83s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 38%|███▊      | 134/355 [04:11<07:05,  1.92s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 38%|███▊      | 135/355 [04:13<07:24,  2.02s/it]

Saving the dataset (0/1 shards):   0%|          | 0/7090 [00:00<?, ? examples/s]

 38%|███▊      | 136/355 [04:15<06:55,  1.90s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 39%|███▊      | 137/355 [04:18<07:50,  2.16s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 39%|███▉      | 138/355 [04:20<08:15,  2.28s/it]

Saving the dataset (0/1 shards):   0%|          | 0/4860 [00:00<?, ? examples/s]

 39%|███▉      | 139/355 [04:21<06:54,  1.92s/it]

Saving the dataset (0/1 shards):   0%|          | 0/3460 [00:00<?, ? examples/s]

 39%|███▉      | 140/355 [04:22<05:42,  1.59s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 40%|███▉      | 141/355 [04:24<06:24,  1.80s/it]

Saving the dataset (0/1 shards):   0%|          | 0/600 [00:00<?, ? examples/s]

 40%|████      | 142/355 [04:25<04:40,  1.32s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 40%|████      | 143/355 [04:27<05:54,  1.67s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 41%|████      | 144/355 [04:29<06:23,  1.82s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 41%|████      | 145/355 [04:32<07:01,  2.01s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 41%|████      | 146/355 [04:34<07:19,  2.10s/it]

Saving the dataset (0/1 shards):   0%|          | 0/5220 [00:00<?, ? examples/s]

 41%|████▏     | 147/355 [04:35<06:22,  1.84s/it]

Saving the dataset (0/1 shards):   0%|          | 0/910 [00:00<?, ? examples/s]

 42%|████▏     | 148/355 [04:36<04:42,  1.37s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 42%|████▏     | 149/355 [04:38<05:27,  1.59s/it]

Saving the dataset (0/1 shards):   0%|          | 0/5640 [00:00<?, ? examples/s]

 42%|████▏     | 150/355 [04:39<05:04,  1.49s/it]

Saving the dataset (0/1 shards):   0%|          | 0/5220 [00:00<?, ? examples/s]

 43%|████▎     | 151/355 [04:40<04:41,  1.38s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 43%|████▎     | 152/355 [04:42<05:35,  1.65s/it]

Saving the dataset (0/1 shards):   0%|          | 0/9220 [00:00<?, ? examples/s]

 43%|████▎     | 153/355 [04:44<05:52,  1.74s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 43%|████▎     | 154/355 [04:46<06:12,  1.85s/it]

Saving the dataset (0/1 shards):   0%|          | 0/590 [00:00<?, ? examples/s]

 44%|████▎     | 155/355 [04:47<04:30,  1.35s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 44%|████▍     | 156/355 [04:49<05:17,  1.59s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 44%|████▍     | 157/355 [04:51<06:12,  1.88s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 45%|████▍     | 158/355 [04:54<07:02,  2.14s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 45%|████▍     | 159/355 [04:56<07:04,  2.17s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 45%|████▌     | 160/355 [04:58<07:01,  2.16s/it]

Saving the dataset (0/1 shards):   0%|          | 0/1120 [00:00<?, ? examples/s]

 45%|████▌     | 161/355 [04:59<05:11,  1.60s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 46%|████▌     | 162/355 [05:01<05:42,  1.77s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 46%|████▌     | 163/355 [05:03<06:11,  1.94s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 46%|████▌     | 164/355 [05:05<06:14,  1.96s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 46%|████▋     | 165/355 [05:07<06:24,  2.02s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 47%|████▋     | 166/355 [05:10<06:35,  2.09s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 47%|████▋     | 167/355 [05:12<06:52,  2.19s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 47%|████▋     | 168/355 [05:14<06:56,  2.23s/it]

Saving the dataset (0/1 shards):   0%|          | 0/350 [00:00<?, ? examples/s]

 48%|████▊     | 169/355 [05:15<04:57,  1.60s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 48%|████▊     | 170/355 [05:17<05:24,  1.76s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 48%|████▊     | 171/355 [05:19<05:49,  1.90s/it]

Saving the dataset (0/1 shards):   0%|          | 0/8350 [00:00<?, ? examples/s]

 48%|████▊     | 172/355 [05:21<05:41,  1.87s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 49%|████▊     | 173/355 [05:23<06:05,  2.01s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 49%|████▉     | 174/355 [05:25<06:11,  2.05s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 49%|████▉     | 175/355 [05:27<06:18,  2.10s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 50%|████▉     | 176/355 [05:30<06:36,  2.22s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 50%|████▉     | 177/355 [05:32<06:30,  2.20s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 50%|█████     | 178/355 [05:34<06:36,  2.24s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 50%|█████     | 179/355 [05:37<06:54,  2.36s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 51%|█████     | 180/355 [05:40<07:10,  2.46s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 51%|█████     | 181/355 [05:42<06:52,  2.37s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 51%|█████▏    | 182/355 [05:44<06:42,  2.33s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 52%|█████▏    | 183/355 [05:46<06:25,  2.24s/it]

Saving the dataset (0/1 shards):   0%|          | 0/2040 [00:00<?, ? examples/s]

 52%|█████▏    | 184/355 [05:47<04:52,  1.71s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 52%|█████▏    | 185/355 [05:49<05:17,  1.87s/it]

Saving the dataset (0/1 shards):   0%|          | 0/2040 [00:00<?, ? examples/s]

 52%|█████▏    | 186/355 [05:49<04:06,  1.46s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 53%|█████▎    | 187/355 [05:52<04:44,  1.69s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 53%|█████▎    | 188/355 [05:54<05:07,  1.84s/it]

Saving the dataset (0/1 shards):   0%|          | 0/2288 [00:00<?, ? examples/s]

 53%|█████▎    | 189/355 [05:54<04:01,  1.45s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 54%|█████▎    | 190/355 [05:57<04:37,  1.68s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 54%|█████▍    | 191/355 [05:59<05:05,  1.86s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 54%|█████▍    | 192/355 [06:01<05:23,  1.99s/it]

Saving the dataset (0/1 shards):   0%|          | 0/4950 [00:00<?, ? examples/s]

 54%|█████▍    | 193/355 [06:02<04:42,  1.74s/it]

Saving the dataset (0/1 shards):   0%|          | 0/1670 [00:00<?, ? examples/s]

 55%|█████▍    | 194/355 [06:03<03:35,  1.34s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 55%|█████▍    | 195/355 [06:05<04:19,  1.62s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 55%|█████▌    | 196/355 [06:07<04:42,  1.78s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 55%|█████▌    | 197/355 [06:09<04:55,  1.87s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 56%|█████▌    | 198/355 [06:11<05:05,  1.95s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 56%|█████▌    | 199/355 [06:13<05:14,  2.02s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 56%|█████▋    | 200/355 [06:16<05:14,  2.03s/it]

Saving the dataset (0/1 shards):   0%|          | 0/910 [00:00<?, ? examples/s]

 57%|█████▋    | 201/355 [06:16<03:50,  1.50s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 57%|█████▋    | 202/355 [06:18<04:20,  1.70s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 57%|█████▋    | 203/355 [06:20<04:47,  1.89s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 57%|█████▋    | 204/355 [06:22<04:56,  1.96s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 58%|█████▊    | 205/355 [06:25<04:59,  2.00s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 58%|█████▊    | 206/355 [06:27<05:15,  2.11s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 58%|█████▊    | 207/355 [06:29<05:18,  2.15s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 59%|█████▊    | 208/355 [06:31<05:14,  2.14s/it]

Saving the dataset (0/1 shards):   0%|          | 0/8350 [00:00<?, ? examples/s]

 59%|█████▉    | 209/355 [06:33<04:56,  2.03s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 59%|█████▉    | 210/355 [06:35<05:07,  2.12s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 59%|█████▉    | 211/355 [06:38<05:35,  2.33s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 60%|█████▉    | 212/355 [06:40<05:21,  2.25s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 60%|██████    | 213/355 [06:43<05:41,  2.40s/it]

Saving the dataset (0/1 shards):   0%|          | 0/500 [00:00<?, ? examples/s]

 60%|██████    | 214/355 [06:43<04:03,  1.73s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 61%|██████    | 215/355 [06:45<04:14,  1.81s/it]

Saving the dataset (0/1 shards):   0%|          | 0/1655 [00:00<?, ? examples/s]

 61%|██████    | 216/355 [06:46<03:14,  1.40s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 61%|██████    | 217/355 [06:48<03:46,  1.64s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 61%|██████▏   | 218/355 [06:50<04:10,  1.83s/it]

Saving the dataset (0/1 shards):   0%|          | 0/4860 [00:00<?, ? examples/s]

 62%|██████▏   | 219/355 [06:51<03:42,  1.64s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 62%|██████▏   | 220/355 [06:53<03:58,  1.77s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 62%|██████▏   | 221/355 [06:56<04:21,  1.95s/it]

Saving the dataset (0/1 shards):   0%|          | 0/7075 [00:00<?, ? examples/s]

 63%|██████▎   | 222/355 [06:58<04:20,  1.95s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 63%|██████▎   | 223/355 [07:00<04:23,  2.00s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 63%|██████▎   | 224/355 [07:02<04:36,  2.11s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 63%|██████▎   | 225/355 [07:04<04:33,  2.10s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 64%|██████▎   | 226/355 [07:06<04:32,  2.12s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 64%|██████▍   | 227/355 [07:08<04:29,  2.10s/it]

Saving the dataset (0/1 shards):   0%|          | 0/910 [00:00<?, ? examples/s]

 64%|██████▍   | 228/355 [07:09<03:16,  1.55s/it]

Saving the dataset (0/1 shards):   0%|          | 0/7090 [00:00<?, ? examples/s]

 65%|██████▍   | 229/355 [07:10<03:18,  1.58s/it]

Saving the dataset (0/1 shards):   0%|          | 0/1650 [00:00<?, ? examples/s]

 65%|██████▍   | 230/355 [07:11<02:34,  1.23s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 65%|██████▌   | 231/355 [07:13<03:19,  1.61s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 65%|██████▌   | 232/355 [07:16<03:52,  1.89s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 66%|██████▌   | 233/355 [07:18<04:09,  2.05s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 66%|██████▌   | 234/355 [07:20<04:10,  2.07s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 66%|██████▌   | 235/355 [07:23<04:22,  2.18s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 66%|██████▋   | 236/355 [07:25<04:17,  2.16s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 67%|██████▋   | 237/355 [07:27<04:23,  2.23s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 67%|██████▋   | 238/355 [07:29<04:12,  2.16s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 67%|██████▋   | 239/355 [07:32<04:12,  2.17s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 68%|██████▊   | 240/355 [07:34<04:07,  2.15s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 68%|██████▊   | 241/355 [07:36<04:06,  2.16s/it]

Saving the dataset (0/1 shards):   0%|          | 0/350 [00:00<?, ? examples/s]

 68%|██████▊   | 242/355 [07:36<02:55,  1.56s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 68%|██████▊   | 243/355 [07:38<03:27,  1.85s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 69%|██████▊   | 244/355 [07:41<03:49,  2.06s/it]

Saving the dataset (0/1 shards):   0%|          | 0/5220 [00:00<?, ? examples/s]

 69%|██████▉   | 245/355 [07:42<03:17,  1.80s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 69%|██████▉   | 246/355 [07:44<03:29,  1.92s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 70%|██████▉   | 247/355 [07:47<03:54,  2.17s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 70%|██████▉   | 248/355 [07:49<03:51,  2.16s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 70%|███████   | 249/355 [07:52<03:53,  2.20s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 70%|███████   | 250/355 [07:54<03:49,  2.18s/it]

Saving the dataset (0/1 shards):   0%|          | 0/200 [00:00<?, ? examples/s]

 71%|███████   | 251/355 [07:54<02:42,  1.56s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 71%|███████   | 252/355 [07:56<03:07,  1.82s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 71%|███████▏  | 253/355 [07:58<03:13,  1.90s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 72%|███████▏  | 254/355 [08:01<03:19,  1.98s/it]

Saving the dataset (0/1 shards):   0%|          | 0/5250 [00:00<?, ? examples/s]

 72%|███████▏  | 255/355 [08:02<02:51,  1.72s/it]

Saving the dataset (0/1 shards):   0%|          | 0/2040 [00:00<?, ? examples/s]

 72%|███████▏  | 256/355 [08:02<02:12,  1.34s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 72%|███████▏  | 257/355 [08:04<02:38,  1.62s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 73%|███████▎  | 258/355 [08:06<02:51,  1.76s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 73%|███████▎  | 259/355 [08:09<03:02,  1.90s/it]

Saving the dataset (0/1 shards):   0%|          | 0/8350 [00:00<?, ? examples/s]

 73%|███████▎  | 260/355 [08:11<02:58,  1.88s/it]

Saving the dataset (0/1 shards):   0%|          | 0/1650 [00:00<?, ? examples/s]

 74%|███████▎  | 261/355 [08:11<02:14,  1.43s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 74%|███████▍  | 262/355 [08:13<02:31,  1.63s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 74%|███████▍  | 263/355 [08:15<02:53,  1.88s/it]

Saving the dataset (0/1 shards):   0%|          | 0/4860 [00:00<?, ? examples/s]

 74%|███████▍  | 264/355 [08:17<02:30,  1.65s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 75%|███████▍  | 265/355 [08:19<02:41,  1.80s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 75%|███████▍  | 266/355 [08:21<02:49,  1.90s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 75%|███████▌  | 267/355 [08:23<02:56,  2.01s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 75%|███████▌  | 268/355 [08:25<03:01,  2.08s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 76%|███████▌  | 269/355 [08:28<03:01,  2.11s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 76%|███████▌  | 270/355 [08:30<02:58,  2.10s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 76%|███████▋  | 271/355 [08:32<02:58,  2.12s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 77%|███████▋  | 272/355 [08:34<03:03,  2.21s/it]

Saving the dataset (0/1 shards):   0%|          | 0/1120 [00:00<?, ? examples/s]

 77%|███████▋  | 273/355 [08:35<02:15,  1.65s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 77%|███████▋  | 274/355 [08:37<02:36,  1.94s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 77%|███████▋  | 275/355 [08:40<02:46,  2.09s/it]

Saving the dataset (0/1 shards):   0%|          | 0/2290 [00:00<?, ? examples/s]

 78%|███████▊  | 276/355 [08:40<02:07,  1.62s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 78%|███████▊  | 277/355 [08:43<02:29,  1.92s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 78%|███████▊  | 278/355 [08:45<02:34,  2.01s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 79%|███████▊  | 279/355 [08:47<02:37,  2.07s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 79%|███████▉  | 280/355 [08:50<02:45,  2.20s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 79%|███████▉  | 281/355 [08:52<02:56,  2.38s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 79%|███████▉  | 282/355 [08:55<02:54,  2.39s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 80%|███████▉  | 283/355 [08:57<02:54,  2.42s/it]

Saving the dataset (0/1 shards):   0%|          | 0/3130 [00:00<?, ? examples/s]

 80%|████████  | 284/355 [08:58<02:20,  1.98s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 80%|████████  | 285/355 [09:01<02:29,  2.13s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 81%|████████  | 286/355 [09:03<02:33,  2.23s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 81%|████████  | 287/355 [09:05<02:29,  2.19s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 81%|████████  | 288/355 [09:08<02:30,  2.24s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 81%|████████▏ | 289/355 [09:10<02:33,  2.32s/it]

Saving the dataset (0/1 shards):   0%|          | 0/4950 [00:00<?, ? examples/s]

 82%|████████▏ | 290/355 [09:11<02:05,  1.93s/it]

Saving the dataset (0/1 shards):   0%|          | 0/1120 [00:00<?, ? examples/s]

 82%|████████▏ | 291/355 [09:12<01:32,  1.44s/it]

Saving the dataset (0/1 shards):   0%|          | 0/200 [00:00<?, ? examples/s]

 82%|████████▏ | 292/355 [09:12<01:05,  1.04s/it]

Saving the dataset (0/1 shards):   0%|          | 0/1670 [00:00<?, ? examples/s]

 83%|████████▎ | 293/355 [09:12<00:52,  1.17it/s]

Saving the dataset (0/1 shards):   0%|          | 0/348 [00:00<?, ? examples/s]

 83%|████████▎ | 294/355 [09:12<00:38,  1.57it/s]

Saving the dataset (0/1 shards):   0%|          | 0/3130 [00:00<?, ? examples/s]

 83%|████████▎ | 295/355 [09:13<00:39,  1.52it/s]

Saving the dataset (0/1 shards):   0%|          | 0/600 [00:00<?, ? examples/s]

 83%|████████▎ | 296/355 [09:13<00:30,  1.95it/s]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 84%|████████▎ | 297/355 [09:15<00:57,  1.01it/s]

Saving the dataset (0/1 shards):   0%|          | 0/3130 [00:00<?, ? examples/s]

 84%|████████▍ | 298/355 [09:16<00:53,  1.07it/s]

Saving the dataset (0/1 shards):   0%|          | 0/500 [00:00<?, ? examples/s]

 84%|████████▍ | 299/355 [09:16<00:39,  1.43it/s]

Saving the dataset (0/1 shards):   0%|          | 0/1670 [00:00<?, ? examples/s]

 85%|████████▍ | 300/355 [09:17<00:33,  1.65it/s]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 85%|████████▍ | 301/355 [09:19<00:57,  1.07s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 85%|████████▌ | 302/355 [09:21<01:12,  1.36s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 85%|████████▌ | 303/355 [09:23<01:24,  1.62s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 86%|████████▌ | 304/355 [09:25<01:34,  1.86s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 86%|████████▌ | 305/355 [09:28<01:39,  1.99s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 86%|████████▌ | 306/355 [09:30<01:40,  2.05s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 86%|████████▋ | 307/355 [09:32<01:43,  2.16s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 87%|████████▋ | 308/355 [09:35<01:48,  2.30s/it]

Saving the dataset (0/1 shards):   0%|          | 0/200 [00:00<?, ? examples/s]

 87%|████████▋ | 309/355 [09:35<01:15,  1.64s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 87%|████████▋ | 310/355 [09:37<01:24,  1.87s/it]

Saving the dataset (0/1 shards):   0%|          | 0/1670 [00:00<?, ? examples/s]

 88%|████████▊ | 311/355 [09:38<01:03,  1.44s/it]

Saving the dataset (0/1 shards):   0%|          | 0/8348 [00:00<?, ? examples/s]

 88%|████████▊ | 312/355 [09:40<01:06,  1.55s/it]

Saving the dataset (0/1 shards):   0%|          | 0/2290 [00:00<?, ? examples/s]

 88%|████████▊ | 313/355 [09:40<00:52,  1.24s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 88%|████████▊ | 314/355 [09:42<01:01,  1.51s/it]

Saving the dataset (0/1 shards):   0%|          | 0/2040 [00:00<?, ? examples/s]

 89%|████████▊ | 315/355 [09:43<00:48,  1.21s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 89%|████████▉ | 316/355 [09:45<00:59,  1.53s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 89%|████████▉ | 317/355 [09:47<01:05,  1.73s/it]

Saving the dataset (0/1 shards):   0%|          | 0/600 [00:00<?, ? examples/s]

 90%|████████▉ | 318/355 [09:48<00:46,  1.26s/it]

Saving the dataset (0/1 shards):   0%|          | 0/590 [00:00<?, ? examples/s]

 90%|████████▉ | 319/355 [09:48<00:33,  1.07it/s]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 90%|█████████ | 320/355 [09:50<00:46,  1.31s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 90%|█████████ | 321/355 [09:52<00:54,  1.60s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 91%|█████████ | 322/355 [09:54<00:58,  1.76s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 91%|█████████ | 323/355 [09:57<01:00,  1.90s/it]

Saving the dataset (0/1 shards):   0%|          | 0/200 [00:00<?, ? examples/s]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 92%|█████████▏| 325/355 [09:59<00:47,  1.57s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 92%|█████████▏| 326/355 [10:02<00:57,  2.00s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 92%|█████████▏| 327/355 [10:04<00:57,  2.04s/it]

Saving the dataset (0/1 shards):   0%|          | 0/5646 [00:00<?, ? examples/s]

 92%|█████████▏| 328/355 [10:06<00:49,  1.83s/it]

Saving the dataset (0/1 shards):   0%|          | 0/9220 [00:00<?, ? examples/s]

 93%|█████████▎| 329/355 [10:08<00:50,  1.92s/it]

Saving the dataset (0/1 shards):   0%|          | 0/2040 [00:00<?, ? examples/s]

 93%|█████████▎| 330/355 [10:08<00:37,  1.51s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 93%|█████████▎| 331/355 [10:11<00:44,  1.86s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 94%|█████████▎| 332/355 [10:13<00:45,  1.96s/it]

Saving the dataset (0/1 shards):   0%|          | 0/3130 [00:00<?, ? examples/s]

 94%|█████████▍| 333/355 [10:14<00:35,  1.62s/it]

Saving the dataset (0/1 shards):   0%|          | 0/5248 [00:00<?, ? examples/s]

 94%|█████████▍| 334/355 [10:15<00:31,  1.51s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 94%|█████████▍| 335/355 [10:18<00:34,  1.75s/it]

Saving the dataset (0/1 shards):   0%|          | 0/9220 [00:00<?, ? examples/s]

 95%|█████████▍| 336/355 [10:20<00:36,  1.90s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 95%|█████████▍| 337/355 [10:22<00:36,  2.03s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 95%|█████████▌| 338/355 [10:24<00:35,  2.11s/it]

Saving the dataset (0/1 shards):   0%|          | 0/3460 [00:00<?, ? examples/s]

 95%|█████████▌| 339/355 [10:25<00:27,  1.71s/it]

Saving the dataset (0/1 shards):   0%|          | 0/2973 [00:00<?, ? examples/s]

 96%|█████████▌| 340/355 [10:26<00:22,  1.50s/it]

Saving the dataset (0/1 shards):   0%|          | 0/500 [00:00<?, ? examples/s]

 96%|█████████▌| 341/355 [10:26<00:15,  1.10s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 96%|█████████▋| 342/355 [10:29<00:18,  1.41s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 97%|█████████▋| 343/355 [10:31<00:19,  1.61s/it]

Saving the dataset (0/1 shards):   0%|          | 0/5640 [00:00<?, ? examples/s]

 97%|█████████▋| 344/355 [10:32<00:16,  1.49s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 97%|█████████▋| 345/355 [10:34<00:16,  1.70s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 97%|█████████▋| 346/355 [10:36<00:16,  1.83s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 98%|█████████▊| 347/355 [10:38<00:15,  1.94s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 98%|█████████▊| 348/355 [10:41<00:15,  2.24s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 98%|█████████▊| 349/355 [10:44<00:13,  2.29s/it]

Saving the dataset (0/1 shards):   0%|          | 0/2290 [00:00<?, ? examples/s]

 99%|█████████▊| 350/355 [10:44<00:08,  1.77s/it]

Saving the dataset (0/1 shards):   0%|          | 0/590 [00:00<?, ? examples/s]

 99%|█████████▉| 351/355 [10:44<00:05,  1.29s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 99%|█████████▉| 352/355 [10:47<00:04,  1.57s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

 99%|█████████▉| 353/355 [10:49<00:03,  1.88s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

100%|█████████▉| 354/355 [10:52<00:02,  2.13s/it]

Saving the dataset (0/1 shards):   0%|          | 0/10000 [00:00<?, ? examples/s]

100%|██████████| 355/355 [10:54<00:00,  1.84s/it]


In [38]:
# Convert every dataset directory found under ./subsets/t0 (saved tf.data
# datasets) into a Hugging Face `datasets` dataset written under
# ./pytorch_subsets/t0, reusing each source directory's name for its output.
convert_subset(
    tf_root_dir="./subsets/t0",
    torch_root_dir="./pytorch_subsets/t0",
)

  0%|          | 0/3 [00:00<?, ?it/s]

Saving the dataset (0/1 shards):   0%|          | 0/100000 [00:00<?, ? examples/s]

 33%|███▎      | 1/3 [00:23<00:46, 23.43s/it]

Saving the dataset (0/1 shards):   0%|          | 0/100000 [00:00<?, ? examples/s]

 67%|██████▋   | 2/3 [00:45<00:22, 22.75s/it]

Saving the dataset (0/1 shards):   0%|          | 0/100000 [00:00<?, ? examples/s]

100%|██████████| 3/3 [01:08<00:00, 22.77s/it]
