From dac86f58e3d3d720ae55e272f11ce4622a7cc747 Mon Sep 17 00:00:00 2001
From: artitw
Date: Sat, 10 Feb 2024 06:54:34 +0000
Subject: [PATCH] Mixtral 8x7B

---
 README.md                                     |   24 -
 ...]_Demo_All.ipynb => Text2Text_Demos.ipynb} |   32 +-
 demos/Text2Text_LLM.ipynb                     | 2767 +---------
 demos/[Text2Text]_Q&A_Assistant.ipynb         | 4562 -----------------
 setup.py                                      |    7 +-
 text2text/__init__.py                         |    2 +-
 text2text/assistant.py                        |  200 +-
 .../langchain/test_text2text_assistant.py     |    2 +-
 text2text/langchain/text2text_assistant.py    |    2 +-
 text2text/mixtral/build_model.py              |  263 +
 text2text/mixtral/custom_layers.py            |  336 ++
 text2text/mixtral/expert_cache.py             |  223 +
 text2text/mixtral/expert_wrapper.py           |  107 +
 text2text/mixtral/packing.py                  |  135 +
 text2text/mixtral/triton_kernels.py           |  586 +++
 text2text/mixtral/utils.py                    |  123 +
 16 files changed, 1924 insertions(+), 7447 deletions(-)
 rename demos/{[Text2Text]_Demo_All.ipynb => Text2Text_Demos.ipynb} (99%)
 delete mode 100644 demos/[Text2Text]_Q&A_Assistant.ipynb
 create mode 100644 text2text/mixtral/build_model.py
 create mode 100644 text2text/mixtral/custom_layers.py
 create mode 100644 text2text/mixtral/expert_cache.py
 create mode 100644 text2text/mixtral/expert_wrapper.py
 create mode 100644 text2text/mixtral/packing.py
 create mode 100644 text2text/mixtral/triton_kernels.py
 create mode 100644 text2text/mixtral/utils.py

diff --git a/README.md b/README.md
index 27166e4..7f2ccb8 100755
--- a/README.md
+++ b/README.md
@@ -36,7 +36,6 @@ Transform texts in a hundred different [languages](https://github.com/artitw/tex
 
 ## Colab Notebooks
 * Assistant (free private ChatGPT LLM alternative) [![Open In Colab](https://colab.research.google.com/assets/colab-badge.svg)](https://colab.research.google.com/drive/1K6Kk80w9vjFZ7PL9dPRgVuOPuaWcY4ae?usp=sharing)
-* Assistant with knowledge base [![Open In Colab](https://colab.research.google.com/assets/colab-badge.svg)](https://colab.research.google.com/drive/1hkNgpSmmUA-mzUibqz25xq-E8KYOLuVx?usp=sharing)
 * STF-IDF multilingual search [![Open In Colab](https://colab.research.google.com/assets/colab-badge.svg)](https://colab.research.google.com/drive/1RaWj5SqWvyC2SsCTGg8IAVcl9G5hOB50?usp=sharing)
 * All examples [![Open In Colab](https://colab.research.google.com/assets/colab-badge.svg)](https://colab.research.google.com/drive/1LE_ifTpOGO5QJCKNQYtZe6c_tjbwnulR)
 
@@ -193,29 +192,8 @@ t2t.Transformer.LANGUAGES
 ```
 import text2text as t2t
 asst = t2t.Assistant()
-instructions = "Generate a JSON object that maps English characters as keys and Greek equivalents as values: {"
-res = asst.transform([instructions])
-#[
-# '{\n"a": "α",\n"b": "β",\n"c": "γ",\n"d": "δ",\n"e": "ε",\n"f": "φ",\n"g": "χ",\n"h": "ι",\n"i": "η",\n"j": "κ",\n"k": "λ",\n"l": "μ",\n"m": "ν",\n"n": "ξ",\n"o": "ο",\n"p": "π",\n"q": "ρ",\n"r": "σ",\n"s": "τ",\n"t": "υ",\n"u": "ύ",\n"v": "φ",\n"w": "χ",\n"x": "ψ",\n"y": "ω",\n"z": "ζ"\n}'
-#]
-
-#OpenAI Completion API
-
-prompt = """
-I have a clove of garlic, some brown rice, a few baby bok choy,
-some olive oil, and a few slices of bacon.
-How can I prepare a meal our of these ingredients?
-"""
-
-input_prompts = [prompt]
-num_tokens = asst.completion_tokens(input_prompts)
-print(num_tokens[0])
-
-results = asst.completion(input_prompts)
-print(results[0])
 
 #OpenAI Chat Completion API
-
 chat_history = [
   {"role": "user", "content": "Hi"},
   {"role": "assistant", "content": "Hello, how are you?"},
@@ -227,8 +205,6 @@ print(num_tokens)
 result = asst.chat_completion(chat_history, stream=True)
 #{'role': 'assistant', 'content': '1. Make a list of things to be grateful for.\n2. Go outside and take a walk in nature.\n3. Practice mindfulness meditation.\n4. Connect with a loved one or friend.\n5. Do something kind for someone else.\n6. Engage in a creative activity like drawing or writing.\n7. Read an uplifting book or listen to motivational podcasts.'}
 print(result["content"])
 ```
-- To use a dynamic knowledge base, see [![Q&A Assistant Demo](https://colab.research.google.com/assets/colab-badge.svg)](https://colab.research.google.com/drive/1hkNgpSmmUA-mzUibqz25xq-E8KYOLuVx?usp=sharing)
-- To use with LangChain, see [![LangChain integration](https://colab.research.google.com/assets/colab-badge.svg)](https://colab.research.google.com/drive/1K6Kk80w9vjFZ7PL9dPRgVuOPuaWcY4ae?usp=sharing)
 ### Tokenization
 ```
diff --git a/demos/[Text2Text]_Demo_All.ipynb b/demos/Text2Text_Demos.ipynb
similarity index 99%
rename from demos/[Text2Text]_Demo_All.ipynb
rename to demos/Text2Text_Demos.ipynb
index 53bfddc..642a088 100644
--- a/demos/[Text2Text]_Demo_All.ipynb
+++ b/demos/Text2Text_Demos.ipynb
@@ -64,9 +64,20 @@
       "# Run at no cost on Google Colab free tier, so you don't even need your own device.\n",
       "# To add a knowledge base, see https://colab.research.google.com/drive/1hkNgpSmmUA-mzUibqz25xq-E8KYOLuVx?usp=sharing\n",
-      "assistant = t2t.Assistant()\n",
-      "assistant.transform([\"Describe Text2Text in a few words: \"])\n",
-      "#['Text2Text is an AI-powered text generation tool that creates coherent and continuous text based on prompts.']"
+      "asst = t2t.Assistant()\n",
+      "\n",
+      "#OpenAI Chat Completion API\n",
+      "\n",
+      "chat_history = [\n",
+      "  {\"role\": \"user\", \"content\": \"Hi\"},\n",
+      "  {\"role\": \"assistant\", \"content\": \"Hello, how are you?\"},\n",
+      "  {\"role\": \"user\", \"content\": \"What should I do today?\"}\n",
+      "]\n",
+      "num_tokens = asst.chat_completion_tokens(chat_history) #31\n",
+      "print(num_tokens)\n",
+      "\n",
+      "result = asst.chat_completion(chat_history, stream=True) #{'role': 'assistant', 'content': '1. Make a list of things to be grateful for.\\n2. Go outside and take a walk in nature.\\n3. Practice mindfulness meditation.\\n4. Connect with a loved one or friend.\\n5. Do something kind for someone else.\\n6. Engage in a creative activity like drawing or writing.\\n7. Read an uplifting book or listen to motivational podcasts.'}\n",
+      "print(result[\"content\"])"
     ],
     "metadata": {
       "id": "VPMdUSy9YYRl"
     },
@@ -74,21 +85,6 @@
     "execution_count": null,
     "outputs": []
   },
-  {
-    "cell_type": "code",
-    "source": [
-      "instructions = \"Generate a JSON object that maps English characters as keys and Greek equivalents as values: {\"\n",
-      "assistant.transform([instructions])\n",
-      "# [\n",
-      "# '{\\n\"a\": \"α\",\\n\"b\": \"β\",\\n\"c\": \"γ\",\\n\"d\": \"δ\",\\n\"e\": \"ε\",\\n\"f\": \"φ\",\\n\"g\": \"χ\",\\n\"h\": \"ι\",\\n\"i\": \"η\",\\n\"j\": \"κ\",\\n\"k\": \"λ\",\\n\"l\": \"μ\",\\n\"m\": \"ν\",\\n\"n\": \"ξ\",\\n\"o\": \"ο\",\\n\"p\": \"π\",\\n\"q\": \"ρ\",\\n\"r\": \"σ\",\\n\"s\": \"τ\",\\n\"t\": \"υ\",\\n\"u\": \"ύ\",\\n\"v\": \"φ\",\\n\"w\": \"χ\",\\n\"x\": \"ψ\",\\n\"y\": \"ω\",\\n\"z\": \"ζ\"\\n}'\n",
-      "# ]"
-    ],
-    "metadata": {
-      "id": "TaEBdeQMXPzb"
-    },
-    "execution_count": null,
-    "outputs": []
-  },
   {
     "cell_type": "code",
     "source": [
diff --git a/demos/Text2Text_LLM.ipynb b/demos/Text2Text_LLM.ipynb
index 8fafb87..14bfa76 100644
--- a/demos/Text2Text_LLM.ipynb
+++ b/demos/Text2Text_LLM.ipynb
@@ -13,2405 +13,7 @@
     "language_info": {
       "name": "python"
     },
-    "accelerator": "GPU",
-    "widgets": {
-      "application/vnd.jupyter.widget-state+json": {
"_dom_classes": [], - "_model_module": "@jupyter-widgets/controls", - "_model_module_version": "1.5.0", - "_model_name": "HTMLModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/controls", - "_view_module_version": "1.5.0", - "_view_name": "HTMLView", - "description": "", - "description_tooltip": null, - "layout": "IPY_MODEL_f7ba096e3e7246fda9b309840cca3aae", - "placeholder": "​", - "style": "IPY_MODEL_12636d39182d40279145b533196c02f0", - "value": " 750/750 [00:00<00:00, 49.4kB/s]" - } - }, - "bc668e1bd9a8405a9a1b323ec5f304cb": { - "model_module": "@jupyter-widgets/base", - "model_name": "LayoutModel", - "model_module_version": "1.2.0", - "state": { - "_model_module": "@jupyter-widgets/base", - "_model_module_version": "1.2.0", - "_model_name": "LayoutModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/base", - "_view_module_version": "1.2.0", - "_view_name": "LayoutView", - "align_content": null, - "align_items": null, - "align_self": null, - "border": null, - "bottom": null, - "display": null, - "flex": null, - "flex_flow": null, - "grid_area": null, - "grid_auto_columns": null, - "grid_auto_flow": null, - "grid_auto_rows": null, - "grid_column": null, - "grid_gap": null, - "grid_row": null, - "grid_template_areas": null, - "grid_template_columns": null, - "grid_template_rows": null, - "height": null, - "justify_content": null, - "justify_items": null, - "left": null, - "margin": null, - "max_height": null, - "max_width": null, - "min_height": null, - "min_width": null, - "object_fit": null, - "object_position": null, - "order": null, - "overflow": null, - "overflow_x": null, - "overflow_y": null, - "padding": null, - "right": null, - "top": null, - "visibility": null, - "width": null - } - }, - "1801ecc6007d4463b49a4e7f2683f372": { - "model_module": "@jupyter-widgets/base", - "model_name": "LayoutModel", - "model_module_version": "1.2.0", - "state": { - "_model_module": "@jupyter-widgets/base", - "_model_module_version": "1.2.0", - "_model_name": "LayoutModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/base", - "_view_module_version": "1.2.0", - "_view_name": "LayoutView", - "align_content": null, - "align_items": null, - "align_self": null, - "border": null, - "bottom": null, - "display": null, - "flex": null, - "flex_flow": null, - "grid_area": null, - "grid_auto_columns": null, - "grid_auto_flow": null, - "grid_auto_rows": null, - "grid_column": null, - "grid_gap": null, - "grid_row": null, - "grid_template_areas": null, - "grid_template_columns": null, - "grid_template_rows": null, - "height": null, - "justify_content": null, - "justify_items": null, - "left": null, - "margin": null, - "max_height": null, - "max_width": null, - "min_height": null, - "min_width": null, - "object_fit": null, - "object_position": null, - "order": null, - "overflow": null, - "overflow_x": null, - "overflow_y": null, - "padding": null, - "right": null, - "top": null, - "visibility": null, - "width": null - } - }, - "020c56ec21ec4cd09fa2a987260b6f75": { - "model_module": "@jupyter-widgets/controls", - "model_name": "DescriptionStyleModel", - "model_module_version": "1.5.0", - "state": { - "_model_module": "@jupyter-widgets/controls", - "_model_module_version": "1.5.0", - "_model_name": "DescriptionStyleModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/base", - "_view_module_version": "1.2.0", - "_view_name": "StyleView", - "description_width": "" - } - }, - "b721a0238fc04757996cc9aea8c5d408": { - "model_module": "@jupyter-widgets/base", - 
"model_name": "LayoutModel", - "model_module_version": "1.2.0", - "state": { - "_model_module": "@jupyter-widgets/base", - "_model_module_version": "1.2.0", - "_model_name": "LayoutModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/base", - "_view_module_version": "1.2.0", - "_view_name": "LayoutView", - "align_content": null, - "align_items": null, - "align_self": null, - "border": null, - "bottom": null, - "display": null, - "flex": null, - "flex_flow": null, - "grid_area": null, - "grid_auto_columns": null, - "grid_auto_flow": null, - "grid_auto_rows": null, - "grid_column": null, - "grid_gap": null, - "grid_row": null, - "grid_template_areas": null, - "grid_template_columns": null, - "grid_template_rows": null, - "height": null, - "justify_content": null, - "justify_items": null, - "left": null, - "margin": null, - "max_height": null, - "max_width": null, - "min_height": null, - "min_width": null, - "object_fit": null, - "object_position": null, - "order": null, - "overflow": null, - "overflow_x": null, - "overflow_y": null, - "padding": null, - "right": null, - "top": null, - "visibility": null, - "width": null - } - }, - "a20abe24b0f0475da8de44db5f1ed4ec": { - "model_module": "@jupyter-widgets/controls", - "model_name": "ProgressStyleModel", - "model_module_version": "1.5.0", - "state": { - "_model_module": "@jupyter-widgets/controls", - "_model_module_version": "1.5.0", - "_model_name": "ProgressStyleModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/base", - "_view_module_version": "1.2.0", - "_view_name": "StyleView", - "bar_color": null, - "description_width": "" - } - }, - "f7ba096e3e7246fda9b309840cca3aae": { - "model_module": "@jupyter-widgets/base", - "model_name": "LayoutModel", - "model_module_version": "1.2.0", - "state": { - "_model_module": "@jupyter-widgets/base", - "_model_module_version": "1.2.0", - "_model_name": "LayoutModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/base", - "_view_module_version": "1.2.0", - "_view_name": "LayoutView", - "align_content": null, - "align_items": null, - "align_self": null, - "border": null, - "bottom": null, - "display": null, - "flex": null, - "flex_flow": null, - "grid_area": null, - "grid_auto_columns": null, - "grid_auto_flow": null, - "grid_auto_rows": null, - "grid_column": null, - "grid_gap": null, - "grid_row": null, - "grid_template_areas": null, - "grid_template_columns": null, - "grid_template_rows": null, - "height": null, - "justify_content": null, - "justify_items": null, - "left": null, - "margin": null, - "max_height": null, - "max_width": null, - "min_height": null, - "min_width": null, - "object_fit": null, - "object_position": null, - "order": null, - "overflow": null, - "overflow_x": null, - "overflow_y": null, - "padding": null, - "right": null, - "top": null, - "visibility": null, - "width": null - } - }, - "12636d39182d40279145b533196c02f0": { - "model_module": "@jupyter-widgets/controls", - "model_name": "DescriptionStyleModel", - "model_module_version": "1.5.0", - "state": { - "_model_module": "@jupyter-widgets/controls", - "_model_module_version": "1.5.0", - "_model_name": "DescriptionStyleModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/base", - "_view_module_version": "1.2.0", - "_view_name": "StyleView", - "description_width": "" - } - }, - "d3226a916c934244ba5d6ddc66486338": { - "model_module": "@jupyter-widgets/controls", - "model_name": "HBoxModel", - "model_module_version": "1.5.0", - "state": { - "_dom_classes": [], - 
"_model_module": "@jupyter-widgets/controls", - "_model_module_version": "1.5.0", - "_model_name": "HBoxModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/controls", - "_view_module_version": "1.5.0", - "_view_name": "HBoxView", - "box_style": "", - "children": [ - "IPY_MODEL_0f9b0a7a83ed4fe9bcf8f890b346f9af", - "IPY_MODEL_038d0c79ec1a4c54b0c094683ba85208", - "IPY_MODEL_d6bed9e47a1a4768bab69ad744e6d36e" - ], - "layout": "IPY_MODEL_f03a8447ff11494ca0dedbe335e2f7ae" - } - }, - "0f9b0a7a83ed4fe9bcf8f890b346f9af": { - "model_module": "@jupyter-widgets/controls", - "model_name": "HTMLModel", - "model_module_version": "1.5.0", - "state": { - "_dom_classes": [], - "_model_module": "@jupyter-widgets/controls", - "_model_module_version": "1.5.0", - "_model_name": "HTMLModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/controls", - "_view_module_version": "1.5.0", - "_view_name": "HTMLView", - "description": "", - "description_tooltip": null, - "layout": "IPY_MODEL_c26f3d922cf849a682953de7cd9c0e62", - "placeholder": "​", - "style": "IPY_MODEL_926429ffc72442f2983efe743f6ada15", - "value": "Downloading tokenizer.model: 100%" - } - }, - "038d0c79ec1a4c54b0c094683ba85208": { - "model_module": "@jupyter-widgets/controls", - "model_name": "FloatProgressModel", - "model_module_version": "1.5.0", - "state": { - "_dom_classes": [], - "_model_module": "@jupyter-widgets/controls", - "_model_module_version": "1.5.0", - "_model_name": "FloatProgressModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/controls", - "_view_module_version": "1.5.0", - "_view_name": "ProgressView", - "bar_style": "success", - "description": "", - "description_tooltip": null, - "layout": "IPY_MODEL_eaf682d3f8b246c7b28edd96df300ca2", - "max": 499723, - "min": 0, - "orientation": "horizontal", - "style": "IPY_MODEL_7cefd1a675c8492198b89b4335fa111a", - "value": 499723 - } - }, - "d6bed9e47a1a4768bab69ad744e6d36e": { - "model_module": "@jupyter-widgets/controls", - "model_name": "HTMLModel", - "model_module_version": "1.5.0", - "state": { - "_dom_classes": [], - "_model_module": "@jupyter-widgets/controls", - "_model_module_version": "1.5.0", - "_model_name": "HTMLModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/controls", - "_view_module_version": "1.5.0", - "_view_name": "HTMLView", - "description": "", - "description_tooltip": null, - "layout": "IPY_MODEL_ef252d20d5664b05bcfbb474337476dd", - "placeholder": "​", - "style": "IPY_MODEL_73314a861f744497868fe923109671a9", - "value": " 500k/500k [00:00<00:00, 7.60MB/s]" - } - }, - "f03a8447ff11494ca0dedbe335e2f7ae": { - "model_module": "@jupyter-widgets/base", - "model_name": "LayoutModel", - "model_module_version": "1.2.0", - "state": { - "_model_module": "@jupyter-widgets/base", - "_model_module_version": "1.2.0", - "_model_name": "LayoutModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/base", - "_view_module_version": "1.2.0", - "_view_name": "LayoutView", - "align_content": null, - "align_items": null, - "align_self": null, - "border": null, - "bottom": null, - "display": null, - "flex": null, - "flex_flow": null, - "grid_area": null, - "grid_auto_columns": null, - "grid_auto_flow": null, - "grid_auto_rows": null, - "grid_column": null, - "grid_gap": null, - "grid_row": null, - "grid_template_areas": null, - "grid_template_columns": null, - "grid_template_rows": null, - "height": null, - "justify_content": null, - "justify_items": null, - "left": null, - "margin": null, - "max_height": null, - "max_width": 
null, - "min_height": null, - "min_width": null, - "object_fit": null, - "object_position": null, - "order": null, - "overflow": null, - "overflow_x": null, - "overflow_y": null, - "padding": null, - "right": null, - "top": null, - "visibility": null, - "width": null - } - }, - "c26f3d922cf849a682953de7cd9c0e62": { - "model_module": "@jupyter-widgets/base", - "model_name": "LayoutModel", - "model_module_version": "1.2.0", - "state": { - "_model_module": "@jupyter-widgets/base", - "_model_module_version": "1.2.0", - "_model_name": "LayoutModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/base", - "_view_module_version": "1.2.0", - "_view_name": "LayoutView", - "align_content": null, - "align_items": null, - "align_self": null, - "border": null, - "bottom": null, - "display": null, - "flex": null, - "flex_flow": null, - "grid_area": null, - "grid_auto_columns": null, - "grid_auto_flow": null, - "grid_auto_rows": null, - "grid_column": null, - "grid_gap": null, - "grid_row": null, - "grid_template_areas": null, - "grid_template_columns": null, - "grid_template_rows": null, - "height": null, - "justify_content": null, - "justify_items": null, - "left": null, - "margin": null, - "max_height": null, - "max_width": null, - "min_height": null, - "min_width": null, - "object_fit": null, - "object_position": null, - "order": null, - "overflow": null, - "overflow_x": null, - "overflow_y": null, - "padding": null, - "right": null, - "top": null, - "visibility": null, - "width": null - } - }, - "926429ffc72442f2983efe743f6ada15": { - "model_module": "@jupyter-widgets/controls", - "model_name": "DescriptionStyleModel", - "model_module_version": "1.5.0", - "state": { - "_model_module": "@jupyter-widgets/controls", - "_model_module_version": "1.5.0", - "_model_name": "DescriptionStyleModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/base", - "_view_module_version": "1.2.0", - "_view_name": "StyleView", - "description_width": "" - } - }, - "eaf682d3f8b246c7b28edd96df300ca2": { - "model_module": "@jupyter-widgets/base", - "model_name": "LayoutModel", - "model_module_version": "1.2.0", - "state": { - "_model_module": "@jupyter-widgets/base", - "_model_module_version": "1.2.0", - "_model_name": "LayoutModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/base", - "_view_module_version": "1.2.0", - "_view_name": "LayoutView", - "align_content": null, - "align_items": null, - "align_self": null, - "border": null, - "bottom": null, - "display": null, - "flex": null, - "flex_flow": null, - "grid_area": null, - "grid_auto_columns": null, - "grid_auto_flow": null, - "grid_auto_rows": null, - "grid_column": null, - "grid_gap": null, - "grid_row": null, - "grid_template_areas": null, - "grid_template_columns": null, - "grid_template_rows": null, - "height": null, - "justify_content": null, - "justify_items": null, - "left": null, - "margin": null, - "max_height": null, - "max_width": null, - "min_height": null, - "min_width": null, - "object_fit": null, - "object_position": null, - "order": null, - "overflow": null, - "overflow_x": null, - "overflow_y": null, - "padding": null, - "right": null, - "top": null, - "visibility": null, - "width": null - } - }, - "7cefd1a675c8492198b89b4335fa111a": { - "model_module": "@jupyter-widgets/controls", - "model_name": "ProgressStyleModel", - "model_module_version": "1.5.0", - "state": { - "_model_module": "@jupyter-widgets/controls", - "_model_module_version": "1.5.0", - "_model_name": "ProgressStyleModel", - "_view_count": null, - 
"_view_module": "@jupyter-widgets/base", - "_view_module_version": "1.2.0", - "_view_name": "StyleView", - "bar_color": null, - "description_width": "" - } - }, - "ef252d20d5664b05bcfbb474337476dd": { - "model_module": "@jupyter-widgets/base", - "model_name": "LayoutModel", - "model_module_version": "1.2.0", - "state": { - "_model_module": "@jupyter-widgets/base", - "_model_module_version": "1.2.0", - "_model_name": "LayoutModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/base", - "_view_module_version": "1.2.0", - "_view_name": "LayoutView", - "align_content": null, - "align_items": null, - "align_self": null, - "border": null, - "bottom": null, - "display": null, - "flex": null, - "flex_flow": null, - "grid_area": null, - "grid_auto_columns": null, - "grid_auto_flow": null, - "grid_auto_rows": null, - "grid_column": null, - "grid_gap": null, - "grid_row": null, - "grid_template_areas": null, - "grid_template_columns": null, - "grid_template_rows": null, - "height": null, - "justify_content": null, - "justify_items": null, - "left": null, - "margin": null, - "max_height": null, - "max_width": null, - "min_height": null, - "min_width": null, - "object_fit": null, - "object_position": null, - "order": null, - "overflow": null, - "overflow_x": null, - "overflow_y": null, - "padding": null, - "right": null, - "top": null, - "visibility": null, - "width": null - } - }, - "73314a861f744497868fe923109671a9": { - "model_module": "@jupyter-widgets/controls", - "model_name": "DescriptionStyleModel", - "model_module_version": "1.5.0", - "state": { - "_model_module": "@jupyter-widgets/controls", - "_model_module_version": "1.5.0", - "_model_name": "DescriptionStyleModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/base", - "_view_module_version": "1.2.0", - "_view_name": "StyleView", - "description_width": "" - } - }, - "6d01ff138cb64bd3a681b30e645545d8": { - "model_module": "@jupyter-widgets/controls", - "model_name": "HBoxModel", - "model_module_version": "1.5.0", - "state": { - "_dom_classes": [], - "_model_module": "@jupyter-widgets/controls", - "_model_module_version": "1.5.0", - "_model_name": "HBoxModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/controls", - "_view_module_version": "1.5.0", - "_view_name": "HBoxView", - "box_style": "", - "children": [ - "IPY_MODEL_d0a1aeea42274bcab3ac1196349ed301", - "IPY_MODEL_46ba9c97facb40c2ad5b625afa06c97b", - "IPY_MODEL_31b0d81a0b95448b8d144fe325976d89" - ], - "layout": "IPY_MODEL_e7193895652b4553b7b72bae15df5d61" - } - }, - "d0a1aeea42274bcab3ac1196349ed301": { - "model_module": "@jupyter-widgets/controls", - "model_name": "HTMLModel", - "model_module_version": "1.5.0", - "state": { - "_dom_classes": [], - "_model_module": "@jupyter-widgets/controls", - "_model_module_version": "1.5.0", - "_model_name": "HTMLModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/controls", - "_view_module_version": "1.5.0", - "_view_name": "HTMLView", - "description": "", - "description_tooltip": null, - "layout": "IPY_MODEL_38e84577647046e58c324c053c9db801", - "placeholder": "​", - "style": "IPY_MODEL_058b9fda87c3462f84772f6f8059c187", - "value": "Downloading (…)/main/tokenizer.json: 100%" - } - }, - "46ba9c97facb40c2ad5b625afa06c97b": { - "model_module": "@jupyter-widgets/controls", - "model_name": "FloatProgressModel", - "model_module_version": "1.5.0", - "state": { - "_dom_classes": [], - "_model_module": "@jupyter-widgets/controls", - "_model_module_version": "1.5.0", - "_model_name": 
"FloatProgressModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/controls", - "_view_module_version": "1.5.0", - "_view_name": "ProgressView", - "bar_style": "success", - "description": "", - "description_tooltip": null, - "layout": "IPY_MODEL_689a57d20a2b4e84a11ad8003ec5e669", - "max": 1842767, - "min": 0, - "orientation": "horizontal", - "style": "IPY_MODEL_da654cae5d30469fa11ab1ee5d54c8c6", - "value": 1842767 - } - }, - "31b0d81a0b95448b8d144fe325976d89": { - "model_module": "@jupyter-widgets/controls", - "model_name": "HTMLModel", - "model_module_version": "1.5.0", - "state": { - "_dom_classes": [], - "_model_module": "@jupyter-widgets/controls", - "_model_module_version": "1.5.0", - "_model_name": "HTMLModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/controls", - "_view_module_version": "1.5.0", - "_view_name": "HTMLView", - "description": "", - "description_tooltip": null, - "layout": "IPY_MODEL_c4b7d162340e4d41b781d812f6883822", - "placeholder": "​", - "style": "IPY_MODEL_3cbbdb31235e4e93acf4d1dac9838fd0", - "value": " 1.84M/1.84M [00:00<00:00, 9.39MB/s]" - } - }, - "e7193895652b4553b7b72bae15df5d61": { - "model_module": "@jupyter-widgets/base", - "model_name": "LayoutModel", - "model_module_version": "1.2.0", - "state": { - "_model_module": "@jupyter-widgets/base", - "_model_module_version": "1.2.0", - "_model_name": "LayoutModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/base", - "_view_module_version": "1.2.0", - "_view_name": "LayoutView", - "align_content": null, - "align_items": null, - "align_self": null, - "border": null, - "bottom": null, - "display": null, - "flex": null, - "flex_flow": null, - "grid_area": null, - "grid_auto_columns": null, - "grid_auto_flow": null, - "grid_auto_rows": null, - "grid_column": null, - "grid_gap": null, - "grid_row": null, - "grid_template_areas": null, - "grid_template_columns": null, - "grid_template_rows": null, - "height": null, - "justify_content": null, - "justify_items": null, - "left": null, - "margin": null, - "max_height": null, - "max_width": null, - "min_height": null, - "min_width": null, - "object_fit": null, - "object_position": null, - "order": null, - "overflow": null, - "overflow_x": null, - "overflow_y": null, - "padding": null, - "right": null, - "top": null, - "visibility": null, - "width": null - } - }, - "38e84577647046e58c324c053c9db801": { - "model_module": "@jupyter-widgets/base", - "model_name": "LayoutModel", - "model_module_version": "1.2.0", - "state": { - "_model_module": "@jupyter-widgets/base", - "_model_module_version": "1.2.0", - "_model_name": "LayoutModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/base", - "_view_module_version": "1.2.0", - "_view_name": "LayoutView", - "align_content": null, - "align_items": null, - "align_self": null, - "border": null, - "bottom": null, - "display": null, - "flex": null, - "flex_flow": null, - "grid_area": null, - "grid_auto_columns": null, - "grid_auto_flow": null, - "grid_auto_rows": null, - "grid_column": null, - "grid_gap": null, - "grid_row": null, - "grid_template_areas": null, - "grid_template_columns": null, - "grid_template_rows": null, - "height": null, - "justify_content": null, - "justify_items": null, - "left": null, - "margin": null, - "max_height": null, - "max_width": null, - "min_height": null, - "min_width": null, - "object_fit": null, - "object_position": null, - "order": null, - "overflow": null, - "overflow_x": null, - "overflow_y": null, - "padding": null, - "right": null, - 
"top": null, - "visibility": null, - "width": null - } - }, - "058b9fda87c3462f84772f6f8059c187": { - "model_module": "@jupyter-widgets/controls", - "model_name": "DescriptionStyleModel", - "model_module_version": "1.5.0", - "state": { - "_model_module": "@jupyter-widgets/controls", - "_model_module_version": "1.5.0", - "_model_name": "DescriptionStyleModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/base", - "_view_module_version": "1.2.0", - "_view_name": "StyleView", - "description_width": "" - } - }, - "689a57d20a2b4e84a11ad8003ec5e669": { - "model_module": "@jupyter-widgets/base", - "model_name": "LayoutModel", - "model_module_version": "1.2.0", - "state": { - "_model_module": "@jupyter-widgets/base", - "_model_module_version": "1.2.0", - "_model_name": "LayoutModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/base", - "_view_module_version": "1.2.0", - "_view_name": "LayoutView", - "align_content": null, - "align_items": null, - "align_self": null, - "border": null, - "bottom": null, - "display": null, - "flex": null, - "flex_flow": null, - "grid_area": null, - "grid_auto_columns": null, - "grid_auto_flow": null, - "grid_auto_rows": null, - "grid_column": null, - "grid_gap": null, - "grid_row": null, - "grid_template_areas": null, - "grid_template_columns": null, - "grid_template_rows": null, - "height": null, - "justify_content": null, - "justify_items": null, - "left": null, - "margin": null, - "max_height": null, - "max_width": null, - "min_height": null, - "min_width": null, - "object_fit": null, - "object_position": null, - "order": null, - "overflow": null, - "overflow_x": null, - "overflow_y": null, - "padding": null, - "right": null, - "top": null, - "visibility": null, - "width": null - } - }, - "da654cae5d30469fa11ab1ee5d54c8c6": { - "model_module": "@jupyter-widgets/controls", - "model_name": "ProgressStyleModel", - "model_module_version": "1.5.0", - "state": { - "_model_module": "@jupyter-widgets/controls", - "_model_module_version": "1.5.0", - "_model_name": "ProgressStyleModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/base", - "_view_module_version": "1.2.0", - "_view_name": "StyleView", - "bar_color": null, - "description_width": "" - } - }, - "c4b7d162340e4d41b781d812f6883822": { - "model_module": "@jupyter-widgets/base", - "model_name": "LayoutModel", - "model_module_version": "1.2.0", - "state": { - "_model_module": "@jupyter-widgets/base", - "_model_module_version": "1.2.0", - "_model_name": "LayoutModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/base", - "_view_module_version": "1.2.0", - "_view_name": "LayoutView", - "align_content": null, - "align_items": null, - "align_self": null, - "border": null, - "bottom": null, - "display": null, - "flex": null, - "flex_flow": null, - "grid_area": null, - "grid_auto_columns": null, - "grid_auto_flow": null, - "grid_auto_rows": null, - "grid_column": null, - "grid_gap": null, - "grid_row": null, - "grid_template_areas": null, - "grid_template_columns": null, - "grid_template_rows": null, - "height": null, - "justify_content": null, - "justify_items": null, - "left": null, - "margin": null, - "max_height": null, - "max_width": null, - "min_height": null, - "min_width": null, - "object_fit": null, - "object_position": null, - "order": null, - "overflow": null, - "overflow_x": null, - "overflow_y": null, - "padding": null, - "right": null, - "top": null, - "visibility": null, - "width": null - } - }, - "3cbbdb31235e4e93acf4d1dac9838fd0": { - "model_module": 
"@jupyter-widgets/controls", - "model_name": "DescriptionStyleModel", - "model_module_version": "1.5.0", - "state": { - "_model_module": "@jupyter-widgets/controls", - "_model_module_version": "1.5.0", - "_model_name": "DescriptionStyleModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/base", - "_view_module_version": "1.2.0", - "_view_name": "StyleView", - "description_width": "" - } - }, - "3df3c8dc9ac3476aa87b24a42dbb9ce6": { - "model_module": "@jupyter-widgets/controls", - "model_name": "HBoxModel", - "model_module_version": "1.5.0", - "state": { - "_dom_classes": [], - "_model_module": "@jupyter-widgets/controls", - "_model_module_version": "1.5.0", - "_model_name": "HBoxModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/controls", - "_view_module_version": "1.5.0", - "_view_name": "HBoxView", - "box_style": "", - "children": [ - "IPY_MODEL_7412b71611fa4013bc151cdec1c7acbd", - "IPY_MODEL_60fc5d319c534fcc8bb22e50cabde551", - "IPY_MODEL_eaab75e47a4e43499987eae98fe48921" - ], - "layout": "IPY_MODEL_3d35b3d33e3a429a93e2a26e59fd6922" - } - }, - "7412b71611fa4013bc151cdec1c7acbd": { - "model_module": "@jupyter-widgets/controls", - "model_name": "HTMLModel", - "model_module_version": "1.5.0", - "state": { - "_dom_classes": [], - "_model_module": "@jupyter-widgets/controls", - "_model_module_version": "1.5.0", - "_model_name": "HTMLModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/controls", - "_view_module_version": "1.5.0", - "_view_name": "HTMLView", - "description": "", - "description_tooltip": null, - "layout": "IPY_MODEL_7ce7ed9dda344e7ab6715afa43c18a42", - "placeholder": "​", - "style": "IPY_MODEL_6073b5f88d2e4833932eeba9a0cc6d89", - "value": "Downloading (…)cial_tokens_map.json: 100%" - } - }, - "60fc5d319c534fcc8bb22e50cabde551": { - "model_module": "@jupyter-widgets/controls", - "model_name": "FloatProgressModel", - "model_module_version": "1.5.0", - "state": { - "_dom_classes": [], - "_model_module": "@jupyter-widgets/controls", - "_model_module_version": "1.5.0", - "_model_name": "FloatProgressModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/controls", - "_view_module_version": "1.5.0", - "_view_name": "ProgressView", - "bar_style": "success", - "description": "", - "description_tooltip": null, - "layout": "IPY_MODEL_93dea61f05b54e67b96dd02f2ea60821", - "max": 438, - "min": 0, - "orientation": "horizontal", - "style": "IPY_MODEL_e2206eb4491b4ab688a03af4290d1cea", - "value": 438 - } - }, - "eaab75e47a4e43499987eae98fe48921": { - "model_module": "@jupyter-widgets/controls", - "model_name": "HTMLModel", - "model_module_version": "1.5.0", - "state": { - "_dom_classes": [], - "_model_module": "@jupyter-widgets/controls", - "_model_module_version": "1.5.0", - "_model_name": "HTMLModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/controls", - "_view_module_version": "1.5.0", - "_view_name": "HTMLView", - "description": "", - "description_tooltip": null, - "layout": "IPY_MODEL_5d54c94ee8c14443b940e1c0ecf8bd7c", - "placeholder": "​", - "style": "IPY_MODEL_e4f958f519ad4f6bacae04c57052c260", - "value": " 438/438 [00:00<00:00, 34.8kB/s]" - } - }, - "3d35b3d33e3a429a93e2a26e59fd6922": { - "model_module": "@jupyter-widgets/base", - "model_name": "LayoutModel", - "model_module_version": "1.2.0", - "state": { - "_model_module": "@jupyter-widgets/base", - "_model_module_version": "1.2.0", - "_model_name": "LayoutModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/base", - "_view_module_version": 
"1.2.0", - "_view_name": "LayoutView", - "align_content": null, - "align_items": null, - "align_self": null, - "border": null, - "bottom": null, - "display": null, - "flex": null, - "flex_flow": null, - "grid_area": null, - "grid_auto_columns": null, - "grid_auto_flow": null, - "grid_auto_rows": null, - "grid_column": null, - "grid_gap": null, - "grid_row": null, - "grid_template_areas": null, - "grid_template_columns": null, - "grid_template_rows": null, - "height": null, - "justify_content": null, - "justify_items": null, - "left": null, - "margin": null, - "max_height": null, - "max_width": null, - "min_height": null, - "min_width": null, - "object_fit": null, - "object_position": null, - "order": null, - "overflow": null, - "overflow_x": null, - "overflow_y": null, - "padding": null, - "right": null, - "top": null, - "visibility": null, - "width": null - } - }, - "7ce7ed9dda344e7ab6715afa43c18a42": { - "model_module": "@jupyter-widgets/base", - "model_name": "LayoutModel", - "model_module_version": "1.2.0", - "state": { - "_model_module": "@jupyter-widgets/base", - "_model_module_version": "1.2.0", - "_model_name": "LayoutModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/base", - "_view_module_version": "1.2.0", - "_view_name": "LayoutView", - "align_content": null, - "align_items": null, - "align_self": null, - "border": null, - "bottom": null, - "display": null, - "flex": null, - "flex_flow": null, - "grid_area": null, - "grid_auto_columns": null, - "grid_auto_flow": null, - "grid_auto_rows": null, - "grid_column": null, - "grid_gap": null, - "grid_row": null, - "grid_template_areas": null, - "grid_template_columns": null, - "grid_template_rows": null, - "height": null, - "justify_content": null, - "justify_items": null, - "left": null, - "margin": null, - "max_height": null, - "max_width": null, - "min_height": null, - "min_width": null, - "object_fit": null, - "object_position": null, - "order": null, - "overflow": null, - "overflow_x": null, - "overflow_y": null, - "padding": null, - "right": null, - "top": null, - "visibility": null, - "width": null - } - }, - "6073b5f88d2e4833932eeba9a0cc6d89": { - "model_module": "@jupyter-widgets/controls", - "model_name": "DescriptionStyleModel", - "model_module_version": "1.5.0", - "state": { - "_model_module": "@jupyter-widgets/controls", - "_model_module_version": "1.5.0", - "_model_name": "DescriptionStyleModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/base", - "_view_module_version": "1.2.0", - "_view_name": "StyleView", - "description_width": "" - } - }, - "93dea61f05b54e67b96dd02f2ea60821": { - "model_module": "@jupyter-widgets/base", - "model_name": "LayoutModel", - "model_module_version": "1.2.0", - "state": { - "_model_module": "@jupyter-widgets/base", - "_model_module_version": "1.2.0", - "_model_name": "LayoutModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/base", - "_view_module_version": "1.2.0", - "_view_name": "LayoutView", - "align_content": null, - "align_items": null, - "align_self": null, - "border": null, - "bottom": null, - "display": null, - "flex": null, - "flex_flow": null, - "grid_area": null, - "grid_auto_columns": null, - "grid_auto_flow": null, - "grid_auto_rows": null, - "grid_column": null, - "grid_gap": null, - "grid_row": null, - "grid_template_areas": null, - "grid_template_columns": null, - "grid_template_rows": null, - "height": null, - "justify_content": null, - "justify_items": null, - "left": null, - "margin": null, - "max_height": null, - 
"max_width": null, - "min_height": null, - "min_width": null, - "object_fit": null, - "object_position": null, - "order": null, - "overflow": null, - "overflow_x": null, - "overflow_y": null, - "padding": null, - "right": null, - "top": null, - "visibility": null, - "width": null - } - }, - "e2206eb4491b4ab688a03af4290d1cea": { - "model_module": "@jupyter-widgets/controls", - "model_name": "ProgressStyleModel", - "model_module_version": "1.5.0", - "state": { - "_model_module": "@jupyter-widgets/controls", - "_model_module_version": "1.5.0", - "_model_name": "ProgressStyleModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/base", - "_view_module_version": "1.2.0", - "_view_name": "StyleView", - "bar_color": null, - "description_width": "" - } - }, - "5d54c94ee8c14443b940e1c0ecf8bd7c": { - "model_module": "@jupyter-widgets/base", - "model_name": "LayoutModel", - "model_module_version": "1.2.0", - "state": { - "_model_module": "@jupyter-widgets/base", - "_model_module_version": "1.2.0", - "_model_name": "LayoutModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/base", - "_view_module_version": "1.2.0", - "_view_name": "LayoutView", - "align_content": null, - "align_items": null, - "align_self": null, - "border": null, - "bottom": null, - "display": null, - "flex": null, - "flex_flow": null, - "grid_area": null, - "grid_auto_columns": null, - "grid_auto_flow": null, - "grid_auto_rows": null, - "grid_column": null, - "grid_gap": null, - "grid_row": null, - "grid_template_areas": null, - "grid_template_columns": null, - "grid_template_rows": null, - "height": null, - "justify_content": null, - "justify_items": null, - "left": null, - "margin": null, - "max_height": null, - "max_width": null, - "min_height": null, - "min_width": null, - "object_fit": null, - "object_position": null, - "order": null, - "overflow": null, - "overflow_x": null, - "overflow_y": null, - "padding": null, - "right": null, - "top": null, - "visibility": null, - "width": null - } - }, - "e4f958f519ad4f6bacae04c57052c260": { - "model_module": "@jupyter-widgets/controls", - "model_name": "DescriptionStyleModel", - "model_module_version": "1.5.0", - "state": { - "_model_module": "@jupyter-widgets/controls", - "_model_module_version": "1.5.0", - "_model_name": "DescriptionStyleModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/base", - "_view_module_version": "1.2.0", - "_view_name": "StyleView", - "description_width": "" - } - }, - "ccc13e08c1db4c35afa2f647c3a50d32": { - "model_module": "@jupyter-widgets/controls", - "model_name": "HBoxModel", - "model_module_version": "1.5.0", - "state": { - "_dom_classes": [], - "_model_module": "@jupyter-widgets/controls", - "_model_module_version": "1.5.0", - "_model_name": "HBoxModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/controls", - "_view_module_version": "1.5.0", - "_view_name": "HBoxView", - "box_style": "", - "children": [ - "IPY_MODEL_148c80e050b94051b2b4fd32b6eeae47", - "IPY_MODEL_05c742f3e9774fa3877d6f4b689ef61c", - "IPY_MODEL_0f0d7b4d40d74fc7bc04d8720f6a3ce9" - ], - "layout": "IPY_MODEL_dbd39cb47d3a4dbeba15ad56ca0b08c6" - } - }, - "148c80e050b94051b2b4fd32b6eeae47": { - "model_module": "@jupyter-widgets/controls", - "model_name": "HTMLModel", - "model_module_version": "1.5.0", - "state": { - "_dom_classes": [], - "_model_module": "@jupyter-widgets/controls", - "_model_module_version": "1.5.0", - "_model_name": "HTMLModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/controls", - 
"_view_module_version": "1.5.0", - "_view_name": "HTMLView", - "description": "", - "description_tooltip": null, - "layout": "IPY_MODEL_756ce530c53445c696f0d1cf3227ba54", - "placeholder": "​", - "style": "IPY_MODEL_6894f3a083af413e8121a7c906c3dcee", - "value": "Downloading (…)lve/main/config.json: 100%" - } - }, - "05c742f3e9774fa3877d6f4b689ef61c": { - "model_module": "@jupyter-widgets/controls", - "model_name": "FloatProgressModel", - "model_module_version": "1.5.0", - "state": { - "_dom_classes": [], - "_model_module": "@jupyter-widgets/controls", - "_model_module_version": "1.5.0", - "_model_name": "FloatProgressModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/controls", - "_view_module_version": "1.5.0", - "_view_name": "ProgressView", - "bar_style": "success", - "description": "", - "description_tooltip": null, - "layout": "IPY_MODEL_56607d8ba76b42d7b9c328d8bd033ba0", - "max": 953, - "min": 0, - "orientation": "horizontal", - "style": "IPY_MODEL_53f68f7dbbfb42998cf1be238bcf3ffd", - "value": 953 - } - }, - "0f0d7b4d40d74fc7bc04d8720f6a3ce9": { - "model_module": "@jupyter-widgets/controls", - "model_name": "HTMLModel", - "model_module_version": "1.5.0", - "state": { - "_dom_classes": [], - "_model_module": "@jupyter-widgets/controls", - "_model_module_version": "1.5.0", - "_model_name": "HTMLModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/controls", - "_view_module_version": "1.5.0", - "_view_name": "HTMLView", - "description": "", - "description_tooltip": null, - "layout": "IPY_MODEL_7d0329ad41d747db95016d750f433641", - "placeholder": "​", - "style": "IPY_MODEL_4ea66ebc91fb4c2e9e66fc219255fb18", - "value": " 953/953 [00:00<00:00, 65.1kB/s]" - } - }, - "dbd39cb47d3a4dbeba15ad56ca0b08c6": { - "model_module": "@jupyter-widgets/base", - "model_name": "LayoutModel", - "model_module_version": "1.2.0", - "state": { - "_model_module": "@jupyter-widgets/base", - "_model_module_version": "1.2.0", - "_model_name": "LayoutModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/base", - "_view_module_version": "1.2.0", - "_view_name": "LayoutView", - "align_content": null, - "align_items": null, - "align_self": null, - "border": null, - "bottom": null, - "display": null, - "flex": null, - "flex_flow": null, - "grid_area": null, - "grid_auto_columns": null, - "grid_auto_flow": null, - "grid_auto_rows": null, - "grid_column": null, - "grid_gap": null, - "grid_row": null, - "grid_template_areas": null, - "grid_template_columns": null, - "grid_template_rows": null, - "height": null, - "justify_content": null, - "justify_items": null, - "left": null, - "margin": null, - "max_height": null, - "max_width": null, - "min_height": null, - "min_width": null, - "object_fit": null, - "object_position": null, - "order": null, - "overflow": null, - "overflow_x": null, - "overflow_y": null, - "padding": null, - "right": null, - "top": null, - "visibility": null, - "width": null - } - }, - "756ce530c53445c696f0d1cf3227ba54": { - "model_module": "@jupyter-widgets/base", - "model_name": "LayoutModel", - "model_module_version": "1.2.0", - "state": { - "_model_module": "@jupyter-widgets/base", - "_model_module_version": "1.2.0", - "_model_name": "LayoutModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/base", - "_view_module_version": "1.2.0", - "_view_name": "LayoutView", - "align_content": null, - "align_items": null, - "align_self": null, - "border": null, - "bottom": null, - "display": null, - "flex": null, - "flex_flow": null, - "grid_area": null, - 
"grid_auto_columns": null, - "grid_auto_flow": null, - "grid_auto_rows": null, - "grid_column": null, - "grid_gap": null, - "grid_row": null, - "grid_template_areas": null, - "grid_template_columns": null, - "grid_template_rows": null, - "height": null, - "justify_content": null, - "justify_items": null, - "left": null, - "margin": null, - "max_height": null, - "max_width": null, - "min_height": null, - "min_width": null, - "object_fit": null, - "object_position": null, - "order": null, - "overflow": null, - "overflow_x": null, - "overflow_y": null, - "padding": null, - "right": null, - "top": null, - "visibility": null, - "width": null - } - }, - "6894f3a083af413e8121a7c906c3dcee": { - "model_module": "@jupyter-widgets/controls", - "model_name": "DescriptionStyleModel", - "model_module_version": "1.5.0", - "state": { - "_model_module": "@jupyter-widgets/controls", - "_model_module_version": "1.5.0", - "_model_name": "DescriptionStyleModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/base", - "_view_module_version": "1.2.0", - "_view_name": "StyleView", - "description_width": "" - } - }, - "56607d8ba76b42d7b9c328d8bd033ba0": { - "model_module": "@jupyter-widgets/base", - "model_name": "LayoutModel", - "model_module_version": "1.2.0", - "state": { - "_model_module": "@jupyter-widgets/base", - "_model_module_version": "1.2.0", - "_model_name": "LayoutModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/base", - "_view_module_version": "1.2.0", - "_view_name": "LayoutView", - "align_content": null, - "align_items": null, - "align_self": null, - "border": null, - "bottom": null, - "display": null, - "flex": null, - "flex_flow": null, - "grid_area": null, - "grid_auto_columns": null, - "grid_auto_flow": null, - "grid_auto_rows": null, - "grid_column": null, - "grid_gap": null, - "grid_row": null, - "grid_template_areas": null, - "grid_template_columns": null, - "grid_template_rows": null, - "height": null, - "justify_content": null, - "justify_items": null, - "left": null, - "margin": null, - "max_height": null, - "max_width": null, - "min_height": null, - "min_width": null, - "object_fit": null, - "object_position": null, - "order": null, - "overflow": null, - "overflow_x": null, - "overflow_y": null, - "padding": null, - "right": null, - "top": null, - "visibility": null, - "width": null - } - }, - "53f68f7dbbfb42998cf1be238bcf3ffd": { - "model_module": "@jupyter-widgets/controls", - "model_name": "ProgressStyleModel", - "model_module_version": "1.5.0", - "state": { - "_model_module": "@jupyter-widgets/controls", - "_model_module_version": "1.5.0", - "_model_name": "ProgressStyleModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/base", - "_view_module_version": "1.2.0", - "_view_name": "StyleView", - "bar_color": null, - "description_width": "" - } - }, - "7d0329ad41d747db95016d750f433641": { - "model_module": "@jupyter-widgets/base", - "model_name": "LayoutModel", - "model_module_version": "1.2.0", - "state": { - "_model_module": "@jupyter-widgets/base", - "_model_module_version": "1.2.0", - "_model_name": "LayoutModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/base", - "_view_module_version": "1.2.0", - "_view_name": "LayoutView", - "align_content": null, - "align_items": null, - "align_self": null, - "border": null, - "bottom": null, - "display": null, - "flex": null, - "flex_flow": null, - "grid_area": null, - "grid_auto_columns": null, - "grid_auto_flow": null, - "grid_auto_rows": null, - "grid_column": null, - "grid_gap": 
null, - "grid_row": null, - "grid_template_areas": null, - "grid_template_columns": null, - "grid_template_rows": null, - "height": null, - "justify_content": null, - "justify_items": null, - "left": null, - "margin": null, - "max_height": null, - "max_width": null, - "min_height": null, - "min_width": null, - "object_fit": null, - "object_position": null, - "order": null, - "overflow": null, - "overflow_x": null, - "overflow_y": null, - "padding": null, - "right": null, - "top": null, - "visibility": null, - "width": null - } - }, - "4ea66ebc91fb4c2e9e66fc219255fb18": { - "model_module": "@jupyter-widgets/controls", - "model_name": "DescriptionStyleModel", - "model_module_version": "1.5.0", - "state": { - "_model_module": "@jupyter-widgets/controls", - "_model_module_version": "1.5.0", - "_model_name": "DescriptionStyleModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/base", - "_view_module_version": "1.2.0", - "_view_name": "StyleView", - "description_width": "" - } - }, - "1a53193421be418e836a1f89dfdde7f1": { - "model_module": "@jupyter-widgets/controls", - "model_name": "HBoxModel", - "model_module_version": "1.5.0", - "state": { - "_dom_classes": [], - "_model_module": "@jupyter-widgets/controls", - "_model_module_version": "1.5.0", - "_model_name": "HBoxModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/controls", - "_view_module_version": "1.5.0", - "_view_name": "HBoxView", - "box_style": "", - "children": [ - "IPY_MODEL_a5c4e8a10e5c430c81f072d55f1e0266", - "IPY_MODEL_e1c98877619a4b4bb5ebd68e0056d63d", - "IPY_MODEL_92f392c64bde4507bf3b9d0e458c3611" - ], - "layout": "IPY_MODEL_2093040190ff434996a84336510c2aa4" - } - }, - "a5c4e8a10e5c430c81f072d55f1e0266": { - "model_module": "@jupyter-widgets/controls", - "model_name": "HTMLModel", - "model_module_version": "1.5.0", - "state": { - "_dom_classes": [], - "_model_module": "@jupyter-widgets/controls", - "_model_module_version": "1.5.0", - "_model_name": "HTMLModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/controls", - "_view_module_version": "1.5.0", - "_view_name": "HTMLView", - "description": "", - "description_tooltip": null, - "layout": "IPY_MODEL_27ac50f2fbf54b428acb7e1971887dd0", - "placeholder": "​", - "style": "IPY_MODEL_74c052254ed042d296f6efaa778d7462", - "value": "Downloading (…)quantize_config.json: 100%" - } - }, - "e1c98877619a4b4bb5ebd68e0056d63d": { - "model_module": "@jupyter-widgets/controls", - "model_name": "FloatProgressModel", - "model_module_version": "1.5.0", - "state": { - "_dom_classes": [], - "_model_module": "@jupyter-widgets/controls", - "_model_module_version": "1.5.0", - "_model_name": "FloatProgressModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/controls", - "_view_module_version": "1.5.0", - "_view_name": "ProgressView", - "bar_style": "success", - "description": "", - "description_tooltip": null, - "layout": "IPY_MODEL_0a73093426bd44c38f6400a7aeda8a0a", - "max": 187, - "min": 0, - "orientation": "horizontal", - "style": "IPY_MODEL_a6520c4a59624ca9a8180acfd9d9d680", - "value": 187 - } - }, - "92f392c64bde4507bf3b9d0e458c3611": { - "model_module": "@jupyter-widgets/controls", - "model_name": "HTMLModel", - "model_module_version": "1.5.0", - "state": { - "_dom_classes": [], - "_model_module": "@jupyter-widgets/controls", - "_model_module_version": "1.5.0", - "_model_name": "HTMLModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/controls", - "_view_module_version": "1.5.0", - "_view_name": "HTMLView", - "description": 
"", - "description_tooltip": null, - "layout": "IPY_MODEL_d298bd0a213f45c6803126c3216d8bbc", - "placeholder": "​", - "style": "IPY_MODEL_45d188ed6aba42e4b1e071bbfb07209f", - "value": " 187/187 [00:00<00:00, 11.9kB/s]" - } - }, - "2093040190ff434996a84336510c2aa4": { - "model_module": "@jupyter-widgets/base", - "model_name": "LayoutModel", - "model_module_version": "1.2.0", - "state": { - "_model_module": "@jupyter-widgets/base", - "_model_module_version": "1.2.0", - "_model_name": "LayoutModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/base", - "_view_module_version": "1.2.0", - "_view_name": "LayoutView", - "align_content": null, - "align_items": null, - "align_self": null, - "border": null, - "bottom": null, - "display": null, - "flex": null, - "flex_flow": null, - "grid_area": null, - "grid_auto_columns": null, - "grid_auto_flow": null, - "grid_auto_rows": null, - "grid_column": null, - "grid_gap": null, - "grid_row": null, - "grid_template_areas": null, - "grid_template_columns": null, - "grid_template_rows": null, - "height": null, - "justify_content": null, - "justify_items": null, - "left": null, - "margin": null, - "max_height": null, - "max_width": null, - "min_height": null, - "min_width": null, - "object_fit": null, - "object_position": null, - "order": null, - "overflow": null, - "overflow_x": null, - "overflow_y": null, - "padding": null, - "right": null, - "top": null, - "visibility": null, - "width": null - } - }, - "27ac50f2fbf54b428acb7e1971887dd0": { - "model_module": "@jupyter-widgets/base", - "model_name": "LayoutModel", - "model_module_version": "1.2.0", - "state": { - "_model_module": "@jupyter-widgets/base", - "_model_module_version": "1.2.0", - "_model_name": "LayoutModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/base", - "_view_module_version": "1.2.0", - "_view_name": "LayoutView", - "align_content": null, - "align_items": null, - "align_self": null, - "border": null, - "bottom": null, - "display": null, - "flex": null, - "flex_flow": null, - "grid_area": null, - "grid_auto_columns": null, - "grid_auto_flow": null, - "grid_auto_rows": null, - "grid_column": null, - "grid_gap": null, - "grid_row": null, - "grid_template_areas": null, - "grid_template_columns": null, - "grid_template_rows": null, - "height": null, - "justify_content": null, - "justify_items": null, - "left": null, - "margin": null, - "max_height": null, - "max_width": null, - "min_height": null, - "min_width": null, - "object_fit": null, - "object_position": null, - "order": null, - "overflow": null, - "overflow_x": null, - "overflow_y": null, - "padding": null, - "right": null, - "top": null, - "visibility": null, - "width": null - } - }, - "74c052254ed042d296f6efaa778d7462": { - "model_module": "@jupyter-widgets/controls", - "model_name": "DescriptionStyleModel", - "model_module_version": "1.5.0", - "state": { - "_model_module": "@jupyter-widgets/controls", - "_model_module_version": "1.5.0", - "_model_name": "DescriptionStyleModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/base", - "_view_module_version": "1.2.0", - "_view_name": "StyleView", - "description_width": "" - } - }, - "0a73093426bd44c38f6400a7aeda8a0a": { - "model_module": "@jupyter-widgets/base", - "model_name": "LayoutModel", - "model_module_version": "1.2.0", - "state": { - "_model_module": "@jupyter-widgets/base", - "_model_module_version": "1.2.0", - "_model_name": "LayoutModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/base", - "_view_module_version": 
"1.2.0", - "_view_name": "LayoutView", - "align_content": null, - "align_items": null, - "align_self": null, - "border": null, - "bottom": null, - "display": null, - "flex": null, - "flex_flow": null, - "grid_area": null, - "grid_auto_columns": null, - "grid_auto_flow": null, - "grid_auto_rows": null, - "grid_column": null, - "grid_gap": null, - "grid_row": null, - "grid_template_areas": null, - "grid_template_columns": null, - "grid_template_rows": null, - "height": null, - "justify_content": null, - "justify_items": null, - "left": null, - "margin": null, - "max_height": null, - "max_width": null, - "min_height": null, - "min_width": null, - "object_fit": null, - "object_position": null, - "order": null, - "overflow": null, - "overflow_x": null, - "overflow_y": null, - "padding": null, - "right": null, - "top": null, - "visibility": null, - "width": null - } - }, - "a6520c4a59624ca9a8180acfd9d9d680": { - "model_module": "@jupyter-widgets/controls", - "model_name": "ProgressStyleModel", - "model_module_version": "1.5.0", - "state": { - "_model_module": "@jupyter-widgets/controls", - "_model_module_version": "1.5.0", - "_model_name": "ProgressStyleModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/base", - "_view_module_version": "1.2.0", - "_view_name": "StyleView", - "bar_color": null, - "description_width": "" - } - }, - "d298bd0a213f45c6803126c3216d8bbc": { - "model_module": "@jupyter-widgets/base", - "model_name": "LayoutModel", - "model_module_version": "1.2.0", - "state": { - "_model_module": "@jupyter-widgets/base", - "_model_module_version": "1.2.0", - "_model_name": "LayoutModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/base", - "_view_module_version": "1.2.0", - "_view_name": "LayoutView", - "align_content": null, - "align_items": null, - "align_self": null, - "border": null, - "bottom": null, - "display": null, - "flex": null, - "flex_flow": null, - "grid_area": null, - "grid_auto_columns": null, - "grid_auto_flow": null, - "grid_auto_rows": null, - "grid_column": null, - "grid_gap": null, - "grid_row": null, - "grid_template_areas": null, - "grid_template_columns": null, - "grid_template_rows": null, - "height": null, - "justify_content": null, - "justify_items": null, - "left": null, - "margin": null, - "max_height": null, - "max_width": null, - "min_height": null, - "min_width": null, - "object_fit": null, - "object_position": null, - "order": null, - "overflow": null, - "overflow_x": null, - "overflow_y": null, - "padding": null, - "right": null, - "top": null, - "visibility": null, - "width": null - } - }, - "45d188ed6aba42e4b1e071bbfb07209f": { - "model_module": "@jupyter-widgets/controls", - "model_name": "DescriptionStyleModel", - "model_module_version": "1.5.0", - "state": { - "_model_module": "@jupyter-widgets/controls", - "_model_module_version": "1.5.0", - "_model_name": "DescriptionStyleModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/base", - "_view_module_version": "1.2.0", - "_view_name": "StyleView", - "description_width": "" - } - }, - "a5b23e2b1a3643ab9fa309be4cafcf64": { - "model_module": "@jupyter-widgets/controls", - "model_name": "HBoxModel", - "model_module_version": "1.5.0", - "state": { - "_dom_classes": [], - "_model_module": "@jupyter-widgets/controls", - "_model_module_version": "1.5.0", - "_model_name": "HBoxModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/controls", - "_view_module_version": "1.5.0", - "_view_name": "HBoxView", - "box_style": "", - "children": [ - 
"IPY_MODEL_383c0cd0d53d4d619645848e46599395", - "IPY_MODEL_b9ee1bd0dadb4aa28318e6d82b4086ab", - "IPY_MODEL_9a68ab1967ba43ff88353b19315301be" - ], - "layout": "IPY_MODEL_58d1eaf1aa824fb69d85699721776f43" - } - }, - "383c0cd0d53d4d619645848e46599395": { - "model_module": "@jupyter-widgets/controls", - "model_name": "HTMLModel", - "model_module_version": "1.5.0", - "state": { - "_dom_classes": [], - "_model_module": "@jupyter-widgets/controls", - "_model_module_version": "1.5.0", - "_model_name": "HTMLModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/controls", - "_view_module_version": "1.5.0", - "_view_name": "HTMLView", - "description": "", - "description_tooltip": null, - "layout": "IPY_MODEL_c380007be87147ee800ebc7d1fe81344", - "placeholder": "​", - "style": "IPY_MODEL_6cb54af9ad214074b67f33d6b9bdeaa6", - "value": "Downloading model.safetensors: 100%" - } - }, - "b9ee1bd0dadb4aa28318e6d82b4086ab": { - "model_module": "@jupyter-widgets/controls", - "model_name": "FloatProgressModel", - "model_module_version": "1.5.0", - "state": { - "_dom_classes": [], - "_model_module": "@jupyter-widgets/controls", - "_model_module_version": "1.5.0", - "_model_name": "FloatProgressModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/controls", - "_view_module_version": "1.5.0", - "_view_name": "ProgressView", - "bar_style": "success", - "description": "", - "description_tooltip": null, - "layout": "IPY_MODEL_a733afd4d5244586a2fa51c026a83cdf", - "max": 7259435192, - "min": 0, - "orientation": "horizontal", - "style": "IPY_MODEL_8cb5acc31c11441c9c23e53bbbe4101a", - "value": 7259435192 - } - }, - "9a68ab1967ba43ff88353b19315301be": { - "model_module": "@jupyter-widgets/controls", - "model_name": "HTMLModel", - "model_module_version": "1.5.0", - "state": { - "_dom_classes": [], - "_model_module": "@jupyter-widgets/controls", - "_model_module_version": "1.5.0", - "_model_name": "HTMLModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/controls", - "_view_module_version": "1.5.0", - "_view_name": "HTMLView", - "description": "", - "description_tooltip": null, - "layout": "IPY_MODEL_3f735fb12e0442d99ba02e6b308a50b1", - "placeholder": "​", - "style": "IPY_MODEL_9b7e0cde81934b20afcf13c414e17f77", - "value": " 7.26G/7.26G [00:55<00:00, 102MB/s]" - } - }, - "58d1eaf1aa824fb69d85699721776f43": { - "model_module": "@jupyter-widgets/base", - "model_name": "LayoutModel", - "model_module_version": "1.2.0", - "state": { - "_model_module": "@jupyter-widgets/base", - "_model_module_version": "1.2.0", - "_model_name": "LayoutModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/base", - "_view_module_version": "1.2.0", - "_view_name": "LayoutView", - "align_content": null, - "align_items": null, - "align_self": null, - "border": null, - "bottom": null, - "display": null, - "flex": null, - "flex_flow": null, - "grid_area": null, - "grid_auto_columns": null, - "grid_auto_flow": null, - "grid_auto_rows": null, - "grid_column": null, - "grid_gap": null, - "grid_row": null, - "grid_template_areas": null, - "grid_template_columns": null, - "grid_template_rows": null, - "height": null, - "justify_content": null, - "justify_items": null, - "left": null, - "margin": null, - "max_height": null, - "max_width": null, - "min_height": null, - "min_width": null, - "object_fit": null, - "object_position": null, - "order": null, - "overflow": null, - "overflow_x": null, - "overflow_y": null, - "padding": null, - "right": null, - "top": null, - "visibility": null, - "width": null - } 
- }, - "c380007be87147ee800ebc7d1fe81344": { - "model_module": "@jupyter-widgets/base", - "model_name": "LayoutModel", - "model_module_version": "1.2.0", - "state": { - "_model_module": "@jupyter-widgets/base", - "_model_module_version": "1.2.0", - "_model_name": "LayoutModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/base", - "_view_module_version": "1.2.0", - "_view_name": "LayoutView", - "align_content": null, - "align_items": null, - "align_self": null, - "border": null, - "bottom": null, - "display": null, - "flex": null, - "flex_flow": null, - "grid_area": null, - "grid_auto_columns": null, - "grid_auto_flow": null, - "grid_auto_rows": null, - "grid_column": null, - "grid_gap": null, - "grid_row": null, - "grid_template_areas": null, - "grid_template_columns": null, - "grid_template_rows": null, - "height": null, - "justify_content": null, - "justify_items": null, - "left": null, - "margin": null, - "max_height": null, - "max_width": null, - "min_height": null, - "min_width": null, - "object_fit": null, - "object_position": null, - "order": null, - "overflow": null, - "overflow_x": null, - "overflow_y": null, - "padding": null, - "right": null, - "top": null, - "visibility": null, - "width": null - } - }, - "6cb54af9ad214074b67f33d6b9bdeaa6": { - "model_module": "@jupyter-widgets/controls", - "model_name": "DescriptionStyleModel", - "model_module_version": "1.5.0", - "state": { - "_model_module": "@jupyter-widgets/controls", - "_model_module_version": "1.5.0", - "_model_name": "DescriptionStyleModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/base", - "_view_module_version": "1.2.0", - "_view_name": "StyleView", - "description_width": "" - } - }, - "a733afd4d5244586a2fa51c026a83cdf": { - "model_module": "@jupyter-widgets/base", - "model_name": "LayoutModel", - "model_module_version": "1.2.0", - "state": { - "_model_module": "@jupyter-widgets/base", - "_model_module_version": "1.2.0", - "_model_name": "LayoutModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/base", - "_view_module_version": "1.2.0", - "_view_name": "LayoutView", - "align_content": null, - "align_items": null, - "align_self": null, - "border": null, - "bottom": null, - "display": null, - "flex": null, - "flex_flow": null, - "grid_area": null, - "grid_auto_columns": null, - "grid_auto_flow": null, - "grid_auto_rows": null, - "grid_column": null, - "grid_gap": null, - "grid_row": null, - "grid_template_areas": null, - "grid_template_columns": null, - "grid_template_rows": null, - "height": null, - "justify_content": null, - "justify_items": null, - "left": null, - "margin": null, - "max_height": null, - "max_width": null, - "min_height": null, - "min_width": null, - "object_fit": null, - "object_position": null, - "order": null, - "overflow": null, - "overflow_x": null, - "overflow_y": null, - "padding": null, - "right": null, - "top": null, - "visibility": null, - "width": null - } - }, - "8cb5acc31c11441c9c23e53bbbe4101a": { - "model_module": "@jupyter-widgets/controls", - "model_name": "ProgressStyleModel", - "model_module_version": "1.5.0", - "state": { - "_model_module": "@jupyter-widgets/controls", - "_model_module_version": "1.5.0", - "_model_name": "ProgressStyleModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/base", - "_view_module_version": "1.2.0", - "_view_name": "StyleView", - "bar_color": null, - "description_width": "" - } - }, - "3f735fb12e0442d99ba02e6b308a50b1": { - "model_module": "@jupyter-widgets/base", - "model_name": 
"LayoutModel", - "model_module_version": "1.2.0", - "state": { - "_model_module": "@jupyter-widgets/base", - "_model_module_version": "1.2.0", - "_model_name": "LayoutModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/base", - "_view_module_version": "1.2.0", - "_view_name": "LayoutView", - "align_content": null, - "align_items": null, - "align_self": null, - "border": null, - "bottom": null, - "display": null, - "flex": null, - "flex_flow": null, - "grid_area": null, - "grid_auto_columns": null, - "grid_auto_flow": null, - "grid_auto_rows": null, - "grid_column": null, - "grid_gap": null, - "grid_row": null, - "grid_template_areas": null, - "grid_template_columns": null, - "grid_template_rows": null, - "height": null, - "justify_content": null, - "justify_items": null, - "left": null, - "margin": null, - "max_height": null, - "max_width": null, - "min_height": null, - "min_width": null, - "object_fit": null, - "object_position": null, - "order": null, - "overflow": null, - "overflow_x": null, - "overflow_y": null, - "padding": null, - "right": null, - "top": null, - "visibility": null, - "width": null - } - }, - "9b7e0cde81934b20afcf13c414e17f77": { - "model_module": "@jupyter-widgets/controls", - "model_name": "DescriptionStyleModel", - "model_module_version": "1.5.0", - "state": { - "_model_module": "@jupyter-widgets/controls", - "_model_module_version": "1.5.0", - "_model_name": "DescriptionStyleModel", - "_view_count": null, - "_view_module": "@jupyter-widgets/base", - "_view_module_version": "1.2.0", - "_view_name": "StyleView", - "description_width": "" - } - } - } - } + "accelerator": "GPU" }, "cells": [ { @@ -2422,31 +24,32 @@ "base_uri": "https://localhost:8080/" }, "id": "tlg9YpBgnLhE", - "outputId": "03518f83-b77e-42e1-d1d8-9416e9863ad9" + "outputId": "e8cc3a98-d393-47b7-d4d3-b77d45eb2a6f" }, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ - " ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 74.1/74.1 kB 1.8 MB/s eta 0:00:00\n", - " ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 258.1/258.1 kB 11.2 MB/s eta 0:00:00\n", - " ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 1.8/1.8 MB 37.0 MB/s eta 0:00:00\n", - " ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 92.6/92.6 MB 11.1 MB/s eta 0:00:00\n", - " ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 85.6/85.6 kB 12.9 MB/s eta 0:00:00\n", - " ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 17.6/17.6 MB 77.2 MB/s eta 0:00:00\n", - " ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 1.9/1.9 MB 85.4 MB/s eta 0:00:00\n", - " ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 1.3/1.3 MB 79.9 MB/s eta 0:00:00\n", - " ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 7.7/7.7 MB 114.0 MB/s eta 0:00:00\n", - " ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 302.0/302.0 kB 37.1 MB/s eta 0:00:00\n", - " ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 519.6/519.6 kB 54.7 MB/s eta 0:00:00\n", - " ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 1.3/1.3 MB 88.6 MB/s eta 0:00:00\n", - " ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 3.8/3.8 MB 114.4 MB/s eta 0:00:00\n", - " ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 41.9/41.9 kB 5.8 MB/s eta 0:00:00\n", - " ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 49.4/49.4 kB 5.9 MB/s eta 0:00:00\n", - " ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 295.0/295.0 kB 38.5 MB/s eta 0:00:00\n", - " ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 115.3/115.3 kB 16.3 MB/s eta 0:00:00\n", - " ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 134.8/134.8 kB 18.3 MB/s eta 0:00:00\n" + " ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 74.3/74.3 kB 3.0 MB/s eta 0:00:00\n", + " 
━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 270.9/270.9 kB 10.2 MB/s eta 0:00:00\n", + " ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 4.8/4.8 MB 30.9 MB/s eta 0:00:00\n", + " ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 105.0/105.0 MB 7.0 MB/s eta 0:00:00\n", + " ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 183.4/183.4 kB 21.0 MB/s eta 0:00:00\n", + " ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 17.6/17.6 MB 27.4 MB/s eta 0:00:00\n", + " ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 806.7/806.7 kB 42.3 MB/s eta 0:00:00\n", + " ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 402.5/402.5 kB 35.9 MB/s eta 0:00:00\n", + " ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 507.1/507.1 kB 34.6 MB/s eta 0:00:00\n", + " ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 12.2/12.2 MB 51.3 MB/s eta 0:00:00\n", + " ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 1.6/1.6 MB 80.3 MB/s eta 0:00:00\n", + " ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 238.5/238.5 kB 29.2 MB/s eta 0:00:00\n", + " ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 54.4/54.4 kB 7.2 MB/s eta 0:00:00\n", + " ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 46.0/46.0 kB 6.2 MB/s eta 0:00:00\n", + " ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 49.4/49.4 kB 7.0 MB/s eta 0:00:00\n", + " ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 86.8/86.8 kB 11.2 MB/s eta 0:00:00\n", + " ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 115.3/115.3 kB 14.1 MB/s eta 0:00:00\n", + " ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 134.8/134.8 kB 20.0 MB/s eta 0:00:00\n", + " ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 134.8/134.8 kB 17.4 MB/s eta 0:00:00\n" ] } ], @@ -2455,19 +58,6 @@ "pip install -qq -U text2text" ] }, - { - "cell_type": "code", - "source": [ - "# Restart to free memory\n", - "import os\n", - "os._exit(00)" - ], - "metadata": { - "id": "UlCoburxibmE" - }, - "execution_count": null, - "outputs": [] - }, { "cell_type": "code", "source": [ @@ -2476,265 +66,10 @@ "asst = t2t.Assistant()" ], "metadata": { - "colab": { - "base_uri": "https://localhost:8080/", - "height": 295, - "referenced_widgets": [ - "9fe497145b574c22b2c2f62b85a1e708", - "85528a87313d440d86efa9167b1184ea", - "ace677d34c3e461c879dc34acc7fb1b8", - "7bf57c22b6a1419c9bd12236fbe4b7a7", - "bc668e1bd9a8405a9a1b323ec5f304cb", - "1801ecc6007d4463b49a4e7f2683f372", - "020c56ec21ec4cd09fa2a987260b6f75", - "b721a0238fc04757996cc9aea8c5d408", - "a20abe24b0f0475da8de44db5f1ed4ec", - "f7ba096e3e7246fda9b309840cca3aae", - "12636d39182d40279145b533196c02f0", - "d3226a916c934244ba5d6ddc66486338", - "0f9b0a7a83ed4fe9bcf8f890b346f9af", - "038d0c79ec1a4c54b0c094683ba85208", - "d6bed9e47a1a4768bab69ad744e6d36e", - "f03a8447ff11494ca0dedbe335e2f7ae", - "c26f3d922cf849a682953de7cd9c0e62", - "926429ffc72442f2983efe743f6ada15", - "eaf682d3f8b246c7b28edd96df300ca2", - "7cefd1a675c8492198b89b4335fa111a", - "ef252d20d5664b05bcfbb474337476dd", - "73314a861f744497868fe923109671a9", - "6d01ff138cb64bd3a681b30e645545d8", - "d0a1aeea42274bcab3ac1196349ed301", - "46ba9c97facb40c2ad5b625afa06c97b", - "31b0d81a0b95448b8d144fe325976d89", - "e7193895652b4553b7b72bae15df5d61", - "38e84577647046e58c324c053c9db801", - "058b9fda87c3462f84772f6f8059c187", - "689a57d20a2b4e84a11ad8003ec5e669", - "da654cae5d30469fa11ab1ee5d54c8c6", - "c4b7d162340e4d41b781d812f6883822", - "3cbbdb31235e4e93acf4d1dac9838fd0", - "3df3c8dc9ac3476aa87b24a42dbb9ce6", - "7412b71611fa4013bc151cdec1c7acbd", - "60fc5d319c534fcc8bb22e50cabde551", - "eaab75e47a4e43499987eae98fe48921", - "3d35b3d33e3a429a93e2a26e59fd6922", - "7ce7ed9dda344e7ab6715afa43c18a42", - "6073b5f88d2e4833932eeba9a0cc6d89", - "93dea61f05b54e67b96dd02f2ea60821", - 
"e2206eb4491b4ab688a03af4290d1cea", - "5d54c94ee8c14443b940e1c0ecf8bd7c", - "e4f958f519ad4f6bacae04c57052c260", - "ccc13e08c1db4c35afa2f647c3a50d32", - "148c80e050b94051b2b4fd32b6eeae47", - "05c742f3e9774fa3877d6f4b689ef61c", - "0f0d7b4d40d74fc7bc04d8720f6a3ce9", - "dbd39cb47d3a4dbeba15ad56ca0b08c6", - "756ce530c53445c696f0d1cf3227ba54", - "6894f3a083af413e8121a7c906c3dcee", - "56607d8ba76b42d7b9c328d8bd033ba0", - "53f68f7dbbfb42998cf1be238bcf3ffd", - "7d0329ad41d747db95016d750f433641", - "4ea66ebc91fb4c2e9e66fc219255fb18", - "1a53193421be418e836a1f89dfdde7f1", - "a5c4e8a10e5c430c81f072d55f1e0266", - "e1c98877619a4b4bb5ebd68e0056d63d", - "92f392c64bde4507bf3b9d0e458c3611", - "2093040190ff434996a84336510c2aa4", - "27ac50f2fbf54b428acb7e1971887dd0", - "74c052254ed042d296f6efaa778d7462", - "0a73093426bd44c38f6400a7aeda8a0a", - "a6520c4a59624ca9a8180acfd9d9d680", - "d298bd0a213f45c6803126c3216d8bbc", - "45d188ed6aba42e4b1e071bbfb07209f", - "a5b23e2b1a3643ab9fa309be4cafcf64", - "383c0cd0d53d4d619645848e46599395", - "b9ee1bd0dadb4aa28318e6d82b4086ab", - "9a68ab1967ba43ff88353b19315301be", - "58d1eaf1aa824fb69d85699721776f43", - "c380007be87147ee800ebc7d1fe81344", - "6cb54af9ad214074b67f33d6b9bdeaa6", - "a733afd4d5244586a2fa51c026a83cdf", - "8cb5acc31c11441c9c23e53bbbe4101a", - "3f735fb12e0442d99ba02e6b308a50b1", - "9b7e0cde81934b20afcf13c414e17f77" - ] - }, - "id": "NL3SY2o5gwNh", - "outputId": "f083d548-cad3-46f4-867b-d36843237b6a" - }, - "execution_count": null, - "outputs": [ - { - "output_type": "stream", - "name": "stdout", - "text": [ - "Better speed can be achieved with apex installed.\n" - ] - }, - { - "output_type": "display_data", - "data": { - "text/plain": [ - "Downloading (…)okenizer_config.json: 0%| | 0.00/750 [00:00',"").replace('',"").replace(input_prompt, "").strip() - -class Assistant(t2t.Transformer): + input_prompt = input_prompt.replace('[INST]',' [INST] ').replace(' ',' ') + output_text = output_text.replace('[INST]',' [INST] ').replace(' ',' ') + return output_text.replace(input_prompt,"").replace('',"").replace('',"").strip() +class Assistant(object): def __init__(self, **kwargs): - model_name_or_path = kwargs.get("model_name_or_path", "TheBloke/vicuna-13B-v1.5-16K-GPTQ") - - self.__class__.tokenizer = AutoTokenizer.from_pretrained(model_name_or_path, use_fast=True, padding_side='left') - - self.__class__.model = AutoModelForCausalLM.from_pretrained(model_name_or_path, - device_map="auto", - trust_remote_code=False, - revision="main") - - def completion_preprocess(self, input_lines, retriever=None, **kwargs): - df = pd.DataFrame({"input_line": input_lines}) - if retriever: - k = kwargs.get('k', 1) - df["knowledge"] = retriever.retrieve(df["input_line"].str.lower().tolist(), k=k) - df["input_line"] = df["knowledge"].apply(' '.join) + " - " + df["input_line"] - df["input_line"] = "USER: " + df["input_line"] + "\nASSISTANT:" - return df - - def completion_tokens(self, input_lines): - df = self.completion_preprocess(input_lines) - tok = self.__class__.tokenizer - input_ids = tok(df["input_line"].tolist(), return_tensors="pt", padding=True).input_ids - return [len(x) for x in input_ids] - - def transform(self, input_lines, retriever=None, **kwargs): - if isinstance(input_lines, str): - input_lines = [input_lines] - df = self.completion_preprocess(input_lines, retriever, **kwargs) - temperature = kwargs.get('temperature', 0.7) - top_p = kwargs.get('top_p', 0.95) - top_k = kwargs.get('top_k', 0) - repetition_penalty = kwargs.get('repetition_penalty', 1.15) - max_new_tokens = 
kwargs.get('max_new_tokens', 512) - tok = self.__class__.tokenizer - m = self.__class__.model - - input_ids = tok(df["input_line"].tolist(), return_tensors="pt", padding=True).input_ids - input_ids = input_ids.to(m.device) - generate_kwargs = dict( - input_ids=input_ids, - max_new_tokens=max_new_tokens, - temperature=temperature, - do_sample=temperature > 0.0, - top_p=top_p, - top_k=top_k, - repetition_penalty=repetition_penalty, + os.environ["LC_ALL"] = "en_US.UTF-8" + os.environ["LD_LIBRARY_PATH"] = "/usr/lib64-nvidia" + os.environ["LIBRARY_PATH"] = "/usr/local/cuda/lib64/stubs" + os.system("ldconfig /usr/lib64-nvidia") + + model_name = "Mixtral-8x7B-Instruct-v0.1-offloading-demo" + state_path = model_name + repo_id = f"lavawolfiee/{model_name}" + snapshot_download(repo_id=repo_id, local_dir=model_name) + config = AutoConfig.from_pretrained(model_name) + self.__class__.device = torch.device("cuda:0") + + offload_per_layer = 4 # Change to 5 if only 12 GB of GPU VRAM + + num_experts = config.num_local_experts + + offload_config = OffloadConfig( + main_size=config.num_hidden_layers * (num_experts - offload_per_layer), + offload_size=config.num_hidden_layers * offload_per_layer, + buffer_size=4, + offload_per_layer=offload_per_layer, + ) + + attn_config = BaseQuantizeConfig( + nbits=4, + group_size=64, + quant_zero=True, + quant_scale=True, ) + attn_config["scale_quant_params"]["group_size"] = 256 - df["output_line"] = tok.batch_decode(m.generate(**generate_kwargs)) - df["output_line"] = df.apply(lambda row: _clean_output(row["input_line"], row["output_line"]), axis=1) - return df["output_line"].tolist() + ffn_config = BaseQuantizeConfig( + nbits=2, + group_size=16, + quant_zero=True, + quant_scale=True, + ) + quant_config = QuantConfig(ffn_config=ffn_config, attn_config=attn_config) - completion = transform - def chat_completion_preprocess(self, messages): - chat_history = [f'{line["role"].upper()}: {line["content"]}' for line in messages] - chat_history.append("ASSISTANT: ") - input_prompt = "\n".join(chat_history) - return input_prompt + self.__class__.model = build_model( + device=self.__class__.device, + quant_config=quant_config, + offload_config=offload_config, + state_path=state_path, + ) + self.__class__.tokenizer = AutoTokenizer.from_pretrained(model_name) + self.__class__.streamer = TextStreamer(self.__class__.tokenizer, skip_prompt=True, skip_special_tokens=True) + self.__class__.cache = {} + def chat_completion_tokens(self, messages): - input_prompt = self.chat_completion_preprocess(messages) - tok = self.__class__.tokenizer - input_ids = tok([input_prompt], return_tensors="pt", padding=True).input_ids[0] - return len(input_ids) - - def chat_completion(self, messages, **kwargs): - input_prompt = self.chat_completion_preprocess(messages) - - temperature = kwargs.get('temperature', 0.7) - top_p = kwargs.get('top_p', 0.95) - top_k = kwargs.get('top_k', 0) - repetition_penalty = kwargs.get('repetition_penalty', 1.15) - max_new_tokens = kwargs.get('max_new_tokens', 512) - stream = kwargs.get('stream', False) - tok = self.__class__.tokenizer - m = self.__class__.model - streamer = TextStreamer(tok, skip_prompt=True, skip_special_tokens=True) if stream else None - - input_ids = tok([input_prompt], return_tensors="pt", padding=True).input_ids - input_ids = input_ids.to(m.device) - generate_kwargs = dict( - input_ids=input_ids, - streamer=streamer, - max_new_tokens=max_new_tokens, - temperature=temperature, - do_sample=temperature > 0.0, - top_p=top_p, - top_k=top_k, - 
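A rough sketch of the expert-placement arithmetic behind the OffloadConfig built in `Assistant.__init__` above, assuming Mixtral 8x7B's usual 32 hidden layers and 8 local experts per layer (those exact numbers are not shown in this hunk; they come from the model config at runtime):

```
# Sketch of the OffloadConfig sizing, under assumed Mixtral 8x7B shape:
# 32 hidden layers, 8 local experts per layer (taken from the HF config at runtime).
num_hidden_layers = 32
num_local_experts = 8
offload_per_layer = 4   # the patch suggests 5 for ~12 GB of GPU VRAM

main_size = num_hidden_layers * (num_local_experts - offload_per_layer)  # experts resident on GPU
offload_size = num_hidden_layers * offload_per_layer                     # experts kept in pinned host RAM

print(main_size, offload_size)  # 128 on-device experts, 128 offloaded experts
```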
repetition_penalty=repetition_penalty, + tokenizer = self.__class__.tokenizer + device = self.__class__.device + input_ids = tokenizer.apply_chat_template(messages, return_tensors="pt").to(device) + return len(input_ids[0]) + + def chat_completion(self, messages=[{"role": "user", "content": "hello"}], stream=True, **kwargs): + tokenizer = self.__class__.tokenizer + cache = self.__class__.cache + device = self.__class__.device + streamer = self.__class__.streamer + model = self.__class__.model + + input_ids = tokenizer.apply_chat_template(messages, return_tensors="pt").to(device) + + input_string = tokenizer.apply_chat_template(messages, tokenize=False) + + past_key_values = cache.get(input_string, None) + if past_key_values: + seq_len = input_ids.size(1) + past_key_values[0][0][0].size(1) + attention_mask = torch.ones([1, seq_len - 1], dtype=torch.int, device=device) + else: + attention_mask = torch.ones_like(input_ids) + + results = model.generate( + input_ids=input_ids, + attention_mask=attention_mask, + past_key_values=past_key_values, + streamer=streamer if stream else None, + do_sample=kwargs.get("do_sample", True), + temperature=kwargs.get("temperature", 0.9), + top_p=kwargs.get("top_p", 0.9), + max_new_tokens=kwargs.get("max_new_tokens", 512), + pad_token_id=tokenizer.eos_token_id, + return_dict_in_generate=True, + output_hidden_states=False, ) - - results = tok.batch_decode(m.generate(**generate_kwargs))[0] + + cache[input_string] = results["past_key_values"] + + results = tokenizer.batch_decode(**results)[0] + return { "role": "assistant", - "content": _clean_output(input_prompt, results) + "content": _clean_output(input_string, results) } + + return results + + def transform(self, input_lines, src_lang='en', **kwargs): + return self.chat_completion([{"role": "user", "content": input_lines}]) \ No newline at end of file diff --git a/text2text/langchain/test_text2text_assistant.py b/text2text/langchain/test_text2text_assistant.py index 19684a4..14d6065 100644 --- a/text2text/langchain/test_text2text_assistant.py +++ b/text2text/langchain/test_text2text_assistant.py @@ -7,4 +7,4 @@ def test_llm_inference() -> None: input_text = 'Say "hello, world" back to me' llm = Text2TextAssistant() result = llm(input_text) - assert "hello" in result.lower() + assert "hello" in result.lower() \ No newline at end of file diff --git a/text2text/langchain/text2text_assistant.py b/text2text/langchain/text2text_assistant.py index 30072fe..fa3f93a 100644 --- a/text2text/langchain/text2text_assistant.py +++ b/text2text/langchain/text2text_assistant.py @@ -20,7 +20,7 @@ def _call( ) -> str: if stop is not None: raise ValueError("stop kwargs are not permitted.") - return self.model.transform([prompt], **kwargs)[0] + return self.model.transform(messages=[{"role": "user", "content": prompt}], **kwargs)["content"] @property def _identifying_params(self) -> Mapping[str, Any]: diff --git a/text2text/mixtral/build_model.py b/text2text/mixtral/build_model.py new file mode 100644 index 0000000..09d3b16 --- /dev/null +++ b/text2text/mixtral/build_model.py @@ -0,0 +1,263 @@ +# MIT License +# +# Copyright (c) 2023 Artyom Eliseev, Denis Mazur +# +# Permission is hereby granted, free of charge, to any person obtaining a copy +# of this software and associated documentation files (the "Software"), to deal +# in the Software without restriction, including without limitation the rights +# to use, copy, modify, merge, publish, distribute, sublicense, and/or sell +# copies of the Software, and to permit persons to whom the 
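The new `chat_completion` keys generation state by the rendered chat template and reuses `past_key_values` on an exact repeat of that prompt. The snippet below is only a bookkeeping sketch of the attention-mask arithmetic, with a dummy tensor standing in for `past_key_values[0][0][0]`; `mask_length` is a hypothetical helper, not part of the patch:

```
import torch

cache = {}

def mask_length(input_ids: torch.Tensor, rendered_prompt: str) -> int:
    kv = cache.get(rendered_prompt)
    if kv is not None:
        # cached positions + new tokens, minus one, as in chat_completion above
        return input_ids.size(1) + kv.size(1) - 1
    return input_ids.size(1)

input_ids = torch.ones(1, 7, dtype=torch.long)
print(mask_length(input_ids, "<s>[INST] hello [/INST]"))  # 7, no cache hit yet
cache["<s>[INST] hello [/INST]"] = torch.zeros(1, 42)     # pretend 42 cached positions
print(mask_length(input_ids, "<s>[INST] hello [/INST]"))  # 48
```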
Software is +# furnished to do so, subject to the following conditions: + +# The above copyright notice and this permission notice shall be included in all +# copies or substantial portions of the Software. + +# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR +# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, +# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE +# AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER +# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, +# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE +# SOFTWARE. + +import os +import json +from functools import cache +from dataclasses import dataclass +import typing as tp + +import torch +from torch import nn + +from transformers import AutoConfig +from transformers.models.mixtral import MixtralForCausalLM, MixtralConfig + +from safetensors.torch import load_file + +from torch import nn +from tqdm.auto import trange + +from hqq.core.quantize import BaseQuantizeConfig + +from .expert_cache import ExpertCache +from .expert_wrapper import MixtralExpertWrapper +from .custom_layers import ( + HQQLinearTritonSavable, + MixtralBLockSparseTop2MLP_HQQ, + SparseMoeWrapper, +) +from .utils import with_default_dtype + + +@dataclass(frozen=True) +class OffloadConfig: + main_size: int + offload_size: int + buffer_size: int + offload_per_layer: int + + +class QuantConfig: + def __init__( + self, + ffn_config: BaseQuantizeConfig, + attn_config: BaseQuantizeConfig, + ): + self.ffn_config = ffn_config + self.attn_config = attn_config + + @cache + def get_ffn_metas(self, hidden_dim: int, ffn_dim: int) -> tuple[tp.Any, tp.Any]: + return ( + HQQLinearTritonSavable.get_hqq_meta((hidden_dim, ffn_dim), self.ffn_config), + HQQLinearTritonSavable.get_hqq_meta((ffn_dim, hidden_dim), self.ffn_config), + ) + + +def replace_attn_layers( + model: MixtralForCausalLM, + config: MixtralConfig, + quant_config: QuantConfig, + device: torch.device, +) -> None: + attn_quant_config = quant_config.attn_config + + hidden_size = config.hidden_size + num_heads = config.num_attention_heads + head_dim = hidden_size // num_heads + num_key_value_heads = config.num_key_value_heads + + shapes = [ + (hidden_size, num_heads * head_dim), + (hidden_size, num_key_value_heads * head_dim), + (hidden_size, num_key_value_heads * head_dim), + (num_heads * head_dim, hidden_size), + ] + + shape_to_meta = { + shape: HQQLinearTritonSavable.get_hqq_meta(shape, attn_quant_config) + for shape in shapes + } + + def patch_fct_hqq(shape, quant_config): + meta = shape_to_meta[shape] + layer = HQQLinearTritonSavable(None, quant_config, meta=meta) + return layer + + for layer in model.model.layers: + layer.block_sparse_moe.gate = nn.Linear( + config.hidden_size, + config.num_local_experts, + dtype=torch.float16, + device=device, + bias=False, + ) + + layer.self_attn.q_proj = patch_fct_hqq( + (hidden_size, num_heads * head_dim), attn_quant_config + ) + layer.self_attn.k_proj = patch_fct_hqq( + (hidden_size, num_key_value_heads * head_dim), attn_quant_config + ) + layer.self_attn.v_proj = patch_fct_hqq( + (hidden_size, num_key_value_heads * head_dim), attn_quant_config + ) + layer.self_attn.o_proj = patch_fct_hqq( + (hidden_size, num_heads * head_dim), attn_quant_config + ) + + +@cache +def get_default_ffn_quant_config(ffn_dim: int = 14336, hidden_dim: int = 4096): + quant_config = BaseQuantizeConfig( + nbits=2, + group_size=16, + 
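For reference, the four projection shapes that `replace_attn_layers` quantizes with `HQQLinearTritonSavable.get_hqq_meta`, worked out under Mixtral 8x7B's published config (hidden_size 4096, 32 attention heads, 8 key/value heads; these values are not in this patch):

```
# Worked example of the attention projection shapes, assuming Mixtral 8x7B's config.
hidden_size = 4096
num_heads = 32
num_key_value_heads = 8
head_dim = hidden_size // num_heads  # 128

shapes = [
    (hidden_size, num_heads * head_dim),            # q_proj: (4096, 4096)
    (hidden_size, num_key_value_heads * head_dim),  # k_proj: (4096, 1024)
    (hidden_size, num_key_value_heads * head_dim),  # v_proj: (4096, 1024)
    (num_heads * head_dim, hidden_size),            # o_proj: (4096, 4096)
]
print(shapes)
```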
quant_zero=True, + quant_scale=True, + ) + + meta1 = HQQLinearTritonSavable.get_hqq_meta((hidden_dim, ffn_dim), quant_config) + meta2 = HQQLinearTritonSavable.get_hqq_meta((ffn_dim, hidden_dim), quant_config) + + return quant_config, meta1, meta2 + + +def make_empty_expert( + model_config: MixtralConfig, quant_config: QuantConfig +) -> MixtralBLockSparseTop2MLP_HQQ: + meta1, meta2 = quant_config.get_ffn_metas( + model_config.hidden_size, model_config.intermediate_size + ) + return MixtralBLockSparseTop2MLP_HQQ( + model_config, + quant_config.ffn_config, + meta1, + meta2, + ) + + +def make_and_load_expert_wrapper( + config: MixtralConfig, + quant_config: QuantConfig, + states_dir: str, + expert_uid: tuple[int, int], + device: torch.device, +) -> MixtralExpertWrapper: + layer_idx, expert_idx = expert_uid + + index_path = os.path.join(states_dir, "model.safetensors.index.json") + with open(index_path) as f: + module_idx = f"model.layers.{layer_idx}.block_sparse_moe.experts.{expert_idx}" + state_fpath = json.load(f)["weight_map"][f"{module_idx}.w1.W_q"] + + state_dict = load_file(os.path.join(states_dir, state_fpath), device=str(device)) + expert = make_empty_expert(config, quant_config) + expert.load_state_dict(state_dict, strict=True) + + return MixtralExpertWrapper(expert, device) + + +def load_00_expert_state_dict(states_dir: str, device: torch.device): + index_path = os.path.join(states_dir, "model.safetensors.index.json") + with open(index_path) as f: + module_idx = f"model.layers.0.block_sparse_moe.experts.0" + state_fpath = json.load(f)["weight_map"][f"{module_idx}.w1.W_q"] + return load_file(os.path.join(states_dir, state_fpath), device=str(device)) + + +def build_model( + device: torch.device, + quant_config: QuantConfig, + offload_config: OffloadConfig, + state_path: str, +): + model_name = "mistralai/Mixtral-8x7B-Instruct-v0.1" + + state_dict_00 = load_00_expert_state_dict(state_path, device) + + def _make_module(): + config = AutoConfig.from_pretrained(model_name) + expert = make_empty_expert(config, quant_config) + expert.load_state_dict(state_dict_00) + return MixtralExpertWrapper(expert, device=device) + + with device, with_default_dtype(torch.float16): + model = MixtralForCausalLM( + AutoConfig.from_pretrained( + model_name, + num_local_experts=0, + torch_dtype=torch.float16, + device_map=device, + ), + ) + + model_config = AutoConfig.from_pretrained(model_name) + replace_attn_layers(model, model_config, quant_config, device) + state_index_path = os.path.join(state_path, "model.safetensors.index.json") + with open(state_index_path) as f: + weight_map = json.load(f)["weight_map"] + + trunk_state_path = os.path.join( + state_path, + weight_map["model.embed_tokens.weight"], + ) + model.load_state_dict(load_file(trunk_state_path, device=str(device)), strict=True) + + expert_cache = ExpertCache( + make_module=_make_module, + main_size=offload_config.main_size, + offload_size=offload_config.offload_size, + buffer_size=offload_config.buffer_size, + ) + for layer_idx in trange(model_config.num_hidden_layers, desc="Loading experts"): + curr_layer = model.model.layers[layer_idx] + curr_layer.block_sparse_moe = SparseMoeWrapper( + model_config, + layer_idx, + curr_layer.block_sparse_moe.gate, + expert_cache, + ) + + for expert_idx in range(model_config.num_local_experts): + do_offload = expert_idx < offload_config.offload_per_layer + + expert_wrapper = make_and_load_expert_wrapper( + config=model_config, + quant_config=quant_config, + states_dir=state_path, + expert_uid=(layer_idx, 
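`make_and_load_expert_wrapper` finds the shard holding a given expert by looking up one of its parameter names in the `weight_map` of `model.safetensors.index.json`. The sketch below mimics that lookup with a toy in-memory index; the shard file names are invented stand-ins, not taken from the real checkpoint:

```
# Toy stand-in for model.safetensors.index.json; file names are hypothetical.
toy_index = {
    "weight_map": {
        "model.layers.0.block_sparse_moe.experts.0.w1.W_q": "model-00001-of-00008.safetensors",
        "model.layers.0.block_sparse_moe.experts.1.w1.W_q": "model-00001-of-00008.safetensors",
    }
}

def shard_for_expert(index: dict, layer_idx: int, expert_idx: int) -> str:
    key = f"model.layers.{layer_idx}.block_sparse_moe.experts.{expert_idx}.w1.W_q"
    return index["weight_map"][key]

print(shard_for_expert(toy_index, 0, 1))  # model-00001-of-00008.safetensors
```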
expert_idx), + device=device, + ) + + expert_cache.add_expert( + uid=(layer_idx, expert_idx), + module=expert_wrapper, + eviction_group=layer_idx, + offload=do_offload, + ) + + del expert_wrapper + torch.cuda.synchronize(device) + torch.cuda.empty_cache() + + return model \ No newline at end of file diff --git a/text2text/mixtral/custom_layers.py b/text2text/mixtral/custom_layers.py new file mode 100644 index 0000000..8909d17 --- /dev/null +++ b/text2text/mixtral/custom_layers.py @@ -0,0 +1,336 @@ +# MIT License +# +# Copyright (c) 2023 Artyom Eliseev, Denis Mazur +# +# Permission is hereby granted, free of charge, to any person obtaining a copy +# of this software and associated documentation files (the "Software"), to deal +# in the Software without restriction, including without limitation the rights +# to use, copy, modify, merge, publish, distribute, sublicense, and/or sell +# copies of the Software, and to permit persons to whom the Software is +# furnished to do so, subject to the following conditions: + +# The above copyright notice and this permission notice shall be included in all +# copies or substantial portions of the Software. + +# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR +# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, +# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE +# AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER +# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, +# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE +# SOFTWARE. + +import copy +import functools +from transformers.models.mixtral.configuration_mixtral import MixtralConfig +from transformers.activations import ACT2FN +from typing import Dict, Any +from hqq.core.quantize import HQQLinear, Quantizer + +import torch +from torch import nn +from torch.nn import functional as F + +from .packing import pack_4bit_u8_common, pack_2bit_u8_common, unpack_4bit_u8_common, unpack_2bit_u8_common +from .triton_kernels import triton_matmul4_transpose, triton_matmul3_transpose, triton_matmul2_transpose + + +class HQQLinearTritonSavable(HQQLinear): + def __init__(self, layer, quant_config, meta=None, **kwargs): + """ + Example how to get meta: + >>>> meta1 = HQQLinearSavable.get_hqq_meta((hidden_dim, ffn_dim), quant_config) + >>>> meta2 = HQQLinearSavable.get_hqq_meta((ffn_dim, hidden_dim), quant_config) + """ + + assert quant_config['weight_quant_params']['nbits'] in [2, 3, 4] + + super().__init__(layer, quant_config, **kwargs) + + if not hasattr(self, 'meta'): + assert meta is not None + self.meta = copy.deepcopy(meta) + + self._register_state_dict_hook(self._add_to_state_dict_hook) + self._register_load_state_dict_pre_hook(self._load_from_state_dict_hook) + + def quantize(self, *args, **kwargs): + super().quantize(*args, **kwargs) + + # repacking + self.repack() + + def repack(self): + if self.W_q.shape != self.meta['shape']: + W_q = Quantizer.unpack[self.meta['packing']](self.W_q) + sh = self.meta['shape'] + W_q = W_q.reshape((-1,) + sh[1:]) + W_q = W_q[:sh[0], ...] 
+ self.W_q = Quantizer.pack[self.meta['packing']](W_q) + + def forward(self, x): + return self.forward_triton(x) + + def set_backend(self, backend): + pass + + @torch.inference_mode() + def forward_triton(self, x): + assert self.ready, "model was not quantized" + assert self.meta['axis'] == 0 + + W_q, meta = self.W_q, self.meta + + del_keys = [] + if 'quant_scale' in meta and meta['quant_scale']: + meta['scale'] = Quantizer.dequantize(meta['scale_q'], meta['meta_scale']); del_keys.append('scale') + if 'quant_zero' in meta and meta['quant_zero']: + meta['zero'] = Quantizer.dequantize(meta['zero_q'], meta['meta_zero']); del_keys.append('zero') + + K = meta['shape'][1] + N = meta['shape'][0] + + if self.meta['nbits'] == 4: + fn = triton_matmul4_transpose + elif self.meta['nbits'] == 3: + fn = functools.partial(triton_matmul3_transpose, N=N) + elif self.meta['nbits'] == 2: + fn = triton_matmul2_transpose + else: + raise RuntimeError(f"nbits == {self.meta['nbits']} isn't yet supported") + + output = fn( + meta['group_size'], x, + W_q.view(-1, K), + meta['scale'].view(-1, K), + meta['zero'].view(-1, K), + bias=self.bias if hasattr(self, 'bias') else None, + ) + + #Cleanup + for key in del_keys: + del meta[key] + + return output + + # to support .forward_pytorch(...) - backward compatibility + @torch.inference_mode() + def dequantize(self): + assert self.ready, "model was not quantized" + W_q, meta = self.W_q, self.meta + del_keys = [] + if(meta['quant_scale']): + meta['scale'] = Quantizer.dequantize(meta['scale_q'], meta['meta_scale']); del_keys.append('scale') + if(meta['quant_zero']): + meta['zero'] = Quantizer.dequantize(meta['zero_q'], meta['meta_zero']); del_keys.append('zero') + + W_q_p = Quantizer.unpack[meta['packing']](W_q).half() + W_q_p = W_q_p[:meta['shape'][0], ...] 
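Both `forward_triton` and `dequantize` ultimately rely on the same affine identity, reconstructing weights as `(W_q - zero) * scale` per quantization group. A toy illustration, with group handling simplified to one scale and zero per row:

```
import torch

# Affine dequantization on a toy tensor: W_est = (W_q - zero) * scale,
# here with one (scale, zero) pair per row instead of per real group.
W_q = torch.tensor([[0, 1, 2, 3], [3, 2, 1, 0]], dtype=torch.uint8)  # quantized codes
scale = torch.tensor([[0.50], [0.25]])
zero = torch.tensor([[1.0], [2.0]])

W_est = (W_q.float() - zero) * scale
print(W_est)
```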
+ W_q_p = W_q_p.reshape((meta['group_size'], -1)) + + if((meta['group_size'] is not None) and (meta['nbits']==3)): + W_q_p = W_q_p[:meta['group_size']] if (meta['axis']==0) else W_q_p[:,:meta['group_size']] + W_est = ((W_q_p - meta['zero'])*meta['scale']).reshape(meta['shape']) + + #Cleanup + del W_q_p + for key in del_keys: del meta[key] + return W_est + + @classmethod + def get_hqq_meta(cls, linear_shape, quant_config): + layer = HQQLinear(nn.Linear(*linear_shape, bias=False), quant_config) + meta = layer.meta + + def _remove_tensors_recursive(d): + keys = list(d.keys()) + + for k in keys: + if isinstance(d[k], torch.Tensor): + del d[k] + elif isinstance(d[k], dict): + _remove_tensors_recursive(d[k]) + + _remove_tensors_recursive(meta) + + return meta + + @staticmethod + def _add_to_state_dict_hook(self, state_dict, prefix, local_metadata): + tensor_paths = self._get_tensor_paths(self.meta) + assert set(tensor_paths).issubset( + {'scale_q', 'meta_scale.scale', 'meta_scale.zero', 'zero_q', 'meta_zero.scale', 'meta_zero.zero', + 'scale', 'zero'} + ) + + def _add(name, value): + state_dict[prefix + name] = value + + _add('W_q', self.W_q) + + if self.bias is not None: + _add('bias', self.bias) + + if 'meta_scale' in self.meta: + _add('meta.scale_q', self.meta['scale_q']) + _add('meta.meta_scale.scale', self.meta['meta_scale']['scale']) + _add('meta.meta_scale.zero', self.meta['meta_scale']['zero']) + else: + _add('meta.scale', self.meta['scale']) + + if 'meta_zero' in self.meta: + _add('meta.zero_q', self.meta['zero_q']) + _add('meta.meta_zero.scale', self.meta['meta_zero']['scale']) + _add('meta.meta_zero.zero', self.meta['meta_zero']['zero']) + else: + _add('meta.zero', self.meta['zero']) + + return state_dict + + def _load_from_state_dict_hook(self, state_dict, prefix, local_metadata, strict, missing_keys, unexpected_keys, error_msgs): + tensor_paths = [k[len(prefix + 'meta.'):] for k in state_dict.keys() if k.startswith(prefix + 'meta.')] + assert set(tensor_paths).issubset( + {'scale_q', 'meta_scale.scale', 'meta_scale.zero', 'zero_q', 'meta_zero.scale', 'meta_zero.zero', + 'scale', 'zero'} + ) + + def _del(name): + del state_dict[prefix + name] + def _set(name): + setattr(self, name, state_dict[prefix + name]) + _del(name) + def _get(name): + v = state_dict[prefix + name] + _del(name) + return v + + _set('W_q') + if 'bias' in state_dict: + _set('bias') + else: + self.bias = None + + if not hasattr(self, 'meta'): + self.meta = {} + + if (prefix + 'meta.meta_scale.scale') in state_dict: + self.meta['scale_q'] = _get('meta.scale_q') + self.meta['quant_scale'] = True + if not 'meta_scale' in self.meta: + self.meta['meta_scale'] = {} + self.meta['meta_scale'] |= { + 'scale': _get('meta.meta_scale.scale'), + 'zero': _get('meta.meta_scale.zero') + } + else: + self.meta['scale'] = _get('meta.scale') + if (prefix + 'meta.meta_zero.scale') in state_dict: + self.meta['zero_q'] = _get('meta.zero_q') + self.meta['quant_zero'] = True + if not 'meta_zero' in self.meta: + self.meta['meta_zero'] = {} + self.meta['meta_zero'] |= { + 'scale': _get('meta.meta_zero.scale'), + 'zero': _get('meta.meta_zero.zero') + } + else: + self.meta['zero'] = _get('meta.zero') + self.ready = True + + # self.cuda() + # self.in_gpu = self.W_q.device.type == 'cuda' + # assert self.in_gpu + + self.repack() + + @classmethod + def _get_tensor_paths(cls, state: Dict[str, Any], prefix=''): + paths = [] + + for k, v in state.items(): + if isinstance(v, dict): + paths += cls._get_tensor_paths(v, prefix=k + '.') + elif 
isinstance(v, torch.Tensor): + paths.append(prefix + k) + + return paths + + def state_dict(self, *args, **kwargs): + return nn.Module.state_dict(self, *args, **kwargs) + + def load_state_dict(self, *args, **kwargs): + nn.Module.load_state_dict(self, *args, **kwargs) + + +class MixtralBLockSparseTop2MLP_HQQ(nn.Module): + def __init__(self, config: MixtralConfig, quant_config: Dict[str, Any], meta1, meta2): + super().__init__() + + self.w1 = HQQLinearTritonSavable(None, quant_config, meta1) + self.w2 = HQQLinearTritonSavable(None, quant_config, meta2) + self.w3 = HQQLinearTritonSavable(None, quant_config, meta1) + + self.act_fn = ACT2FN[config.hidden_act] + + def forward(self, hidden_states): + current_hidden_states = self.act_fn(self.w1(hidden_states)) * self.w3(hidden_states) + current_hidden_states = self.w2(current_hidden_states) + return current_hidden_states + + +class SparseMoeWrapper(nn.Module): + def __init__(self, config, layer_id, gate, expert_cache): + super().__init__() + + self.hidden_dim = config.hidden_size + self.ffn_dim = config.intermediate_size + self.num_experts = config.num_local_experts + self.top_k = config.num_experts_per_tok + self.layer_id = layer_id + + self.gate = gate + self.experts = expert_cache + + def forward(self, hidden_states: torch.Tensor) -> torch.Tensor: + batch_size, sequence_length, hidden_dim = hidden_states.shape + hidden_states = hidden_states.view(-1, hidden_dim) + # router_logits: (batch * sequence_length, n_experts) + router_logits = self.gate(hidden_states) + + routing_weights = F.softmax(router_logits, dim=1, dtype=torch.float) + routing_weights, selected_experts = torch.topk(routing_weights, self.top_k, dim=-1) + routing_weights /= routing_weights.sum(dim=-1, keepdim=True) + # we cast back to the input dtype + routing_weights = routing_weights.to(hidden_states.dtype) + + final_hidden_states = torch.zeros( + (batch_size * sequence_length, hidden_dim), dtype=hidden_states.dtype, device=hidden_states.device + ) + + # One hot encode the selected experts to create an expert mask + # this will be used to easily index which expert is going to be sollicitated + expert_mask = torch.nn.functional.one_hot(selected_experts, num_classes=self.num_experts).permute(2, 1, 0) + + active_experts = selected_experts.flatten().unique().tolist() + + # Loop over all available experts in the model and perform the computation on each expert + for (_layer_index, expert_idx), expert_layer in self.experts.load_experts( + *((self.layer_id, expert_idx) for expert_idx in active_experts), unordered=True): + idx, top_x = torch.where(expert_mask[expert_idx]) + assert top_x.shape[0] > 0 + + # in torch it is faster to index using lists than torch tensors + top_x_list = top_x.tolist() + idx_list = idx.tolist() + + # Index the correct hidden states and compute the expert hidden state for + # the current expert. We need to make sure to multiply the output hidden + # states by `routing_weights` on the corresponding tokens (top-1 and top-2) + current_state = hidden_states[None, top_x_list].reshape(-1, hidden_dim) + current_hidden_states = expert_layer(current_state) * routing_weights[top_x_list, idx_list, None] + + # However `index_add_` only support torch tensors for indexing so we'll use + # the `top_x` tensor here. 
+ final_hidden_states.index_add_(0, top_x, current_hidden_states.to(hidden_states.dtype)) + final_hidden_states = final_hidden_states.reshape(batch_size, sequence_length, hidden_dim) + return final_hidden_states, router_logits \ No newline at end of file diff --git a/text2text/mixtral/expert_cache.py b/text2text/mixtral/expert_cache.py new file mode 100644 index 0000000..9d47625 --- /dev/null +++ b/text2text/mixtral/expert_cache.py @@ -0,0 +1,223 @@ +# MIT License +# +# Copyright (c) 2023 Artyom Eliseev, Denis Mazur +# +# Permission is hereby granted, free of charge, to any person obtaining a copy +# of this software and associated documentation files (the "Software"), to deal +# in the Software without restriction, including without limitation the rights +# to use, copy, modify, merge, publish, distribute, sublicense, and/or sell +# copies of the Software, and to permit persons to whom the Software is +# furnished to do so, subject to the following conditions: + +# The above copyright notice and this permission notice shall be included in all +# copies or substantial portions of the Software. + +# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR +# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, +# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE +# AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER +# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, +# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE +# SOFTWARE. + +from dataclasses import dataclass, field +from typing import Any, Dict, Optional, Iterator, Tuple, List +from collections import deque, defaultdict, OrderedDict +from .expert_wrapper import MixtralExpertWrapper + +import torch +from torch import nn + +ExpertUID = Any + + +@dataclass(frozen=False) +class ExpertInfo: + uid: ExpertUID + eviction_group: int + offloaded: bool + index: int + + +@dataclass +class EvictionGroupInfo: + # infos in main and offload devices; ordered from least recently used to most + main_infos: OrderedDict[ExpertUID, ExpertInfo] = field(default_factory=OrderedDict) + offloaded_infos: OrderedDict[ExpertUID, ExpertInfo] = field(default_factory=OrderedDict) + hits: int = field(default=0) + misses: int = field(default=0) + + def add(self, info: ExpertInfo): + infos_odict = self.offloaded_infos if info.offloaded else self.main_infos + assert info.uid not in infos_odict, f"expert {info.uid} already exists" + infos_odict[info.uid] = info + + def choose_expert_to_evict(self) -> ExpertInfo: + for uid, info in self.main_infos.items(): + return info # least recently used + raise ValueError("No evictable experts") + + def swap(self, info_to_load: ExpertInfo, info_to_evict: ExpertInfo): + assert info_to_load.uid in self.offloaded_infos and info_to_evict.uid in self.main_infos + self.main_infos[info_to_load.uid] = self.offloaded_infos.pop(info_to_load.uid) + self.main_infos.move_to_end(info_to_load.uid, last=True) + self.offloaded_infos[info_to_evict.uid] = self.main_infos.pop(info_to_evict.uid) + + def mark_used(self, info: ExpertInfo): + if info.uid in self.main_infos: + self.main_infos.move_to_end(info.uid, last=True) + self.hits += 1 + elif info.uid in self.offloaded_infos: + self.offloaded_infos.move_to_end(info.uid, last=True) + self.misses += 1 + else: + raise ValueError(f"Expert {info} not in group") + + +class ExpertCache: + def __init__(self, make_module: callable, main_size: int, offload_size: int, 
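The routing math in `SparseMoeWrapper.forward` is standard top-2 mixture-of-experts dispatch: softmax over router logits, keep the two largest weights, renormalize them, and sum the weighted expert outputs. A self-contained sketch with plain matrices standing in for the quantized expert MLPs:

```
import torch
import torch.nn.functional as F

torch.manual_seed(0)
num_experts, top_k, hidden_dim, tokens = 8, 2, 16, 5
hidden_states = torch.randn(tokens, hidden_dim)
router_logits = torch.randn(tokens, num_experts)
experts = [torch.randn(hidden_dim, hidden_dim) for _ in range(num_experts)]  # stand-in experts

routing_weights = F.softmax(router_logits, dim=1)
routing_weights, selected_experts = torch.topk(routing_weights, top_k, dim=-1)
routing_weights /= routing_weights.sum(dim=-1, keepdim=True)  # renormalize over the two picks

out = torch.zeros_like(hidden_states)
for t in range(tokens):
    for slot in range(top_k):
        e = selected_experts[t, slot].item()
        out[t] += routing_weights[t, slot] * (hidden_states[t] @ experts[e])
print(out.shape)  # torch.Size([5, 16])
```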
buffer_size: int): + """Dynamically loads an array of modules with identical hyperparameters""" + self.module_type = self.module_size = self.device = None + self.active = False + + self.registered_experts: Dict[ExpertUID, ExpertInfo] = dict() + + self.main_modules = [self._check_module(make_module()) for i in range(main_size)] + self.main_infos: List[Optional[ExpertInfo]] = [None for _ in range(main_size)] + + assert self.module_size is not None + self.offloaded_storages = [ + torch.UntypedStorage(self.module_size).pin_memory(self.device) for _ in range(offload_size)] + self.offloaded_infos: List[Optional[ExpertInfo]] = [None for _ in range(offload_size)] + + # temporary storage to shave off latency + self.device_expert_buffers = deque([self._check_module(make_module()) for _ in range(buffer_size)]) + self.offloaded_storage_buffers = deque([ + torch.UntypedStorage(self.module_size).pin_memory(self.device) for _ in range(buffer_size)]) + self.group_infos: Dict[int, EvictionGroupInfo] = defaultdict(EvictionGroupInfo) + + def _check_module(self, module: MixtralExpertWrapper): + assert isinstance(module.storage, torch.UntypedStorage) + if self.module_type is None: + self.module_type = type(module) + self.module_size = len(module.storage) + self.device = module.storage.device + else: + assert isinstance(module, self.module_type) + assert len(module.storage) == self.module_size + assert module.storage.device == self.device + return module + + def add_expert(self, uid: ExpertUID, module: MixtralExpertWrapper, eviction_group: int = 0, + offload: Optional[bool] = None): + """Register an expert to the cache and associate it with uid""" + assert self.module_type is not None + assert isinstance(module, self.module_type) + return self.add_expert_storage(uid, module.storage, eviction_group=eviction_group, offload=offload) + + def add_expert_storage(self, uid: ExpertUID, storage: torch.UntypedStorage, + eviction_group: int = 0, offload: Optional[bool] = None): + assert uid not in self.registered_experts, f"expert {uid} already registered" + assert isinstance(storage, torch.UntypedStorage) + assert len(storage) == self.module_size + + if offload is None or not offload: # False or None + for i in range(len(self.main_modules)): + if self.main_infos[i] is None: + self.main_modules[i].storage.copy_(storage) + info = ExpertInfo(uid, eviction_group=eviction_group, offloaded=False, index=i) + self.registered_experts[uid] = self.main_infos[i] = info + self.group_infos[eviction_group].add(info) + return # done allocating; found spot on device + if offload is None or offload: # True or None + for i in range(len(self.offloaded_storages)): + if self.offloaded_infos[i] is None: + self.offloaded_storages[i].copy_(storage) + info = ExpertInfo(uid, eviction_group=eviction_group, offloaded=True, index=i) + self.registered_experts[uid] = self.offloaded_infos[i] = info + self.group_infos[eviction_group].add(info) + return # done allocating; found an offloaded spot + raise ValueError("Cache is full") + + def load_experts( + self, *uids: ExpertUID, unordered: bool = False) -> Iterator[Tuple[ExpertUID, MixtralExpertWrapper]]: + """ + :example: + >>> for uid, expert in expert_cache.load_experts(*list_of_uids, unordered=True): + >>> for uid, expert in expert_iter: + >>> result += expert(x) * get_moe_weight(uid) + + :param uids: iterate over the specified expert uids. Same uids as in add_expert + :param unordered: if True, allows cache to iterate experts in arbitrary order + The order is chosen to minimize the total wait time. 
+ :returns: an iterator that yields (uid, expert) pairs, only usable inside the for loop + + """ + assert len(set(uids)) == len(uids) + assert not self.active, "already loading experts; buffers are busy" + if unordered: # yield non-offloaded experts first + uids = sorted(uids, key=lambda uid: self.registered_experts[uid].offloaded) + infos = [self.registered_experts[uid] for uid in uids] + + assert len(set(info.eviction_group for info in infos)) == 1, "experts must be in the same evicton group" + eviction_group = self.group_infos[infos[0].eviction_group] + for info in infos: + eviction_group.mark_used(info) + + try: + self.active = True + # save pre-loaded experts before they can be swapped + pre_loaded_infos = deque([info for info in infos if not info.offloaded]) + pre_loaded_experts = deque([self.main_modules[info.index] for info in pre_loaded_infos]) + + # begin loading experts into free buffers in background (via non-blocking copy) + infos_to_load = deque([info for info in infos if info.offloaded]) + infos_in_loading = deque([]) + experts_in_loading = deque([]) + window_size = min(len(self.device_expert_buffers) - 1, + len(eviction_group.main_infos), + len(infos_to_load)) + for _ in range(window_size): + info_to_load = infos_to_load.popleft() + infos_in_loading.append(info_to_load) + experts_in_loading.append( + self._swap(info_to_load, eviction_group.choose_expert_to_evict())) + + for info in infos: + if len(pre_loaded_infos) > 0 and info is pre_loaded_infos[0]: + pre_loaded_infos.popleft() + yield (info.uid, pre_loaded_experts.popleft()) + elif len(infos_in_loading) > 0 and info is infos_in_loading[0]: + infos_in_loading.popleft() + yield (info.uid, experts_in_loading.popleft()) + if len(infos_to_load) > 0: + info_to_load = infos_to_load.popleft() + infos_in_loading.append(info_to_load) + experts_in_loading.append( + self._swap(info_to_load, eviction_group.choose_expert_to_evict())) + else: + raise RuntimeError("internal error: caching algorithm failed") + finally: + self.active = False + + def _swap(self, info_to_load: ExpertInfo, info_to_evict: ExpertInfo) -> nn.Module: + """Swap an offloaded expert (info_to_load) with an on-device expert (info_to_evict) return the loaded expert""" + assert info_to_load.offloaded and not info_to_evict.offloaded + assert info_to_load.eviction_group == info_to_evict.eviction_group + # swap a single on-device expert with a single offloaded expert using buffers for parallelism + offloaded_storage_buffer = self.offloaded_storage_buffers.popleft() + device_expert_buffer = self.device_expert_buffers.popleft() + device_expert_buffer.storage.copy_(self.offloaded_storages[info_to_load.index], non_blocking=True) + offloaded_storage_buffer.copy_(self.main_modules[info_to_evict.index].storage, non_blocking=True) + + self.device_expert_buffers.append(self.main_modules[info_to_evict.index]) + self.main_modules[info_to_evict.index] = device_expert_buffer + self.offloaded_storage_buffers.append(self.offloaded_storages[info_to_load.index]) + self.offloaded_storages[info_to_load.index] = offloaded_storage_buffer + + self.main_infos[info_to_evict.index] = info_to_load + self.offloaded_infos[info_to_load.index] = info_to_evict + info_to_evict.offloaded, info_to_load.offloaded = info_to_load.offloaded, info_to_evict.offloaded + info_to_evict.index, info_to_load.index = info_to_load.index, info_to_evict.index + self.group_infos[info_to_load.eviction_group].swap(info_to_load, info_to_evict) + return device_expert_buffer \ No newline at end of file diff --git 
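The eviction policy behind `EvictionGroupInfo` is plain LRU: on-device experts sit in an OrderedDict from least to most recently used, `mark_used` moves an entry to the back, and the front entry is the eviction candidate. A simplified stand-in that keeps only that ordering behavior:

```
from collections import OrderedDict

# Simplified sketch of the LRU bookkeeping in EvictionGroupInfo.
main = OrderedDict((uid, f"expert-{uid}") for uid in ["A", "B", "C"])

def mark_used(uid):
    main.move_to_end(uid, last=True)   # most recently used goes to the back

def choose_to_evict():
    return next(iter(main))            # front of the dict = least recently used

mark_used("A")            # order becomes B, C, A
print(choose_to_evict())  # B
```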
a/text2text/mixtral/expert_wrapper.py b/text2text/mixtral/expert_wrapper.py new file mode 100644 index 0000000..a37fdd3 --- /dev/null +++ b/text2text/mixtral/expert_wrapper.py @@ -0,0 +1,107 @@ +# MIT License +# +# Copyright (c) 2023 Artyom Eliseev, Denis Mazur +# +# Permission is hereby granted, free of charge, to any person obtaining a copy +# of this software and associated documentation files (the "Software"), to deal +# in the Software without restriction, including without limitation the rights +# to use, copy, modify, merge, publish, distribute, sublicense, and/or sell +# copies of the Software, and to permit persons to whom the Software is +# furnished to do so, subject to the following conditions: + +# The above copyright notice and this permission notice shall be included in all +# copies or substantial portions of the Software. + +# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR +# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, +# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE +# AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER +# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, +# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE +# SOFTWARE. + +import typing as tp + +import torch +from torch import nn + +from .utils import nested_flatten, nested_pack + + +class MixtralExpertWrapper(nn.Module): + def __init__( + self, + expert_module: tp.Any, + device: torch.device, + ): + super().__init__() + + expert_module, self.storage = self.replace_layer_storage(expert_module, device) + self.expert_module = lambda *args, **kwargs: expert_module(*args, **kwargs) + + self._register_state_dict_hook(self._add_storage_to_state_dict_hook) + self._register_load_state_dict_pre_hook(self._load_storage_from_state_dict_hook) + + @staticmethod + def _add_storage_to_state_dict_hook(self, state_dict, prefix, local_metadata): + state_dict[prefix + 'storage'] = torch.as_tensor(self.storage, dtype=torch.uint8) + return state_dict + + def _load_storage_from_state_dict_hook(self, state_dict, prefix, local_metadata, strict, missing_keys, unexpected_keys, error_msgs): + self.storage.copy_(state_dict[prefix + 'storage'].storage().untyped()) + del state_dict[prefix + 'storage'] + + def forward(self, *args, **kwargs): + return self.expert_module(*args, **kwargs) + + + @staticmethod + def replace_layer_storage( + layer: tp.Any, + device: torch.device, + ): + state_dict = { + f"w{i}": { + "W_q": getattr(layer, f"w{i}").W_q, + "meta": getattr(layer, f"w{i}").meta, + "bias": getattr(layer, f"w{i}").bias, + } + for i in range(1, 4) + } + + storage_size = 0 + offsets = [0] + + for x in nested_flatten(state_dict): + if not isinstance(x, torch.Tensor): + continue + storage_size += x.nbytes + offsets.append(storage_size) + + storage = torch.UntypedStorage(storage_size, device=device) + + i = 0 + new_flattened_states = list() + for x in nested_flatten(state_dict): + if not isinstance(x, torch.Tensor): + new_flattened_states.append(x) + continue + + start = offsets[i] + end = offsets[i + 1] + a_view = torch.as_tensor(storage[start:end], dtype=x.dtype, device=device).view(x.shape) + a_view[...] 
= x + assert a_view.data_ptr() == storage.data_ptr() + start + i += 1 + new_flattened_states.append(a_view) + + state_dict = nested_pack(new_flattened_states, state_dict) + + for layer_id, states in state_dict.items(): + patched = getattr(layer, layer_id) + patched.W_q = states["W_q"] + patched.meta = states["meta"] + patched.bias = states["bias"] + setattr(layer, layer_id, patched) + + return layer, storage \ No newline at end of file diff --git a/text2text/mixtral/packing.py b/text2text/mixtral/packing.py new file mode 100644 index 0000000..3e1d6ef --- /dev/null +++ b/text2text/mixtral/packing.py @@ -0,0 +1,135 @@ +# MIT License +# +# Copyright (c) 2023 Artyom Eliseev, Denis Mazur +# +# Permission is hereby granted, free of charge, to any person obtaining a copy +# of this software and associated documentation files (the "Software"), to deal +# in the Software without restriction, including without limitation the rights +# to use, copy, modify, merge, publish, distribute, sublicense, and/or sell +# copies of the Software, and to permit persons to whom the Software is +# furnished to do so, subject to the following conditions: + +# The above copyright notice and this permission notice shall be included in all +# copies or substantial portions of the Software. + +# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR +# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, +# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE +# AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER +# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, +# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE +# SOFTWARE. + +import torch +from hqq.core.quantize import Quantizer +from hqq.core.bitpack import BitPack + +class PackedTensor(torch.Tensor): + def __init__(self, t: torch.Tensor): + self = t + +# 4 bit to uint8 +def pack_4bit_u8_common(W_q: torch.Tensor): + height = W_q.size(0) + assert height % 2 == 0 + + W_q = W_q.to(torch.uint8) + p = (W_q[::2, ...] << 4) | (W_q[1::2, ...]) + + return PackedTensor(p.to(torch.uint8)) + +def unpack_4bit_u8_common(W_q: torch.Tensor): + height = W_q.size(0) + W_q = W_q.to(torch.uint8) + result = torch.empty([2 * height] + list(W_q.shape[1:]), + dtype=torch.uint8, device=W_q.device) + result[::2, ...] = (W_q >> 4) + result[1::2, ...] = (W_q & 0b1111) + + return result + +def unpack_4bit_u8_universal(W_q: torch.Tensor): + if isinstance(W_q, PackedTensor): + return unpack_4bit_u8_common(W_q) + else: + return BitPack.unpack_4bit_u8(W_q) + +# 2 bit to uin8 +def pack_2bit_u8_common(W_q: torch.Tensor): + W_q = W_q.to(torch.uint8) + height = W_q.size(0) + p = (W_q[::4, ...] << 6) | (W_q[1::4, ...] << 4) | (W_q[2::4, ...] << 2) | (W_q[3::4, ...]) + + return PackedTensor(p) + +def unpack_2bit_u8_common(W_q: torch.Tensor): + W_q = W_q.to(torch.uint8) + height = W_q.size(0) + result = torch.empty([4 * height] + list(W_q.shape[1:]), + dtype=torch.uint8, device=W_q.device) + result[::4, ...] = (W_q >> 6) & 0b11 + result[1::4, ...] = (W_q >> 4) & 0b11 + result[2::4, ...] = (W_q >> 2) & 0b11 + result[3::4, ...] 
= W_q & 0b11 + + return result + +def unpack_2bit_u8_universal(W_q: torch.Tensor): + if isinstance(W_q, PackedTensor): + return unpack_2bit_u8_common(W_q) + else: + return BitPack.unpack_2bit_u8(W_q) + +# 3 bit to int32 +def pack_3bit_i32_common(W_q: torch.Tensor): + height = W_q.size(0) + + # rounding height to nearest 10, because i32 can fit 10 3-bit integers + rem = height % 10 + if rem == 0: + rem = 10 + + new_height = (height + 10 - 1) // 10 + p = torch.zeros((new_height,) + W_q.shape[1:], device=W_q.device, dtype=torch.int32) + + for i in range(10): + if i < rem: + p |= W_q[i::10, ...].to(torch.int32) << (3 * (9 - i)) + else: + p[:new_height - 1, ...] |= W_q[i::10, ...].to(torch.int32) << (3 * (9 - i)) + + assert p.dtype == torch.int32 + + return PackedTensor(p) + +def unpack_3bit_i32_common(W_q: torch.Tensor): + """ + There may be spare rows after unpacking (height is rounded to nearest multiple of 10) + """ + + assert W_q.dtype == torch.int32 + height = W_q.size(0) + + result = torch.empty([10 * height] + list(W_q.shape[1:]), + dtype=torch.uint8, device=W_q.device) + + for i in range(10): + result[i::10, ...] = (W_q >> (3 * (9 - i))) & 0b111 + + return result + +def unpack_3bit_i32_universal(W_q: torch.Tensor): + if isinstance(W_q, PackedTensor): + return unpack_3bit_i32_common(W_q) + else: + return BitPack.unpack_3bit_32(W_q) + +def patch_packing(): + Quantizer.pack['4bit_u8'] = pack_4bit_u8_common + Quantizer.unpack['4bit_u8'] = unpack_4bit_u8_universal + Quantizer.pack['2bit_u8'] = pack_2bit_u8_common + Quantizer.unpack['2bit_u8'] = unpack_2bit_u8_universal + Quantizer.pack['3bit_32'] = pack_3bit_i32_common + Quantizer.unpack['3bit_32'] = unpack_3bit_i32_universal + +patch_packing() \ No newline at end of file diff --git a/text2text/mixtral/triton_kernels.py b/text2text/mixtral/triton_kernels.py new file mode 100644 index 0000000..2fc6626 --- /dev/null +++ b/text2text/mixtral/triton_kernels.py @@ -0,0 +1,586 @@ +# MIT License +# +# Copyright (c) 2023 Artyom Eliseev, Denis Mazur +# +# Permission is hereby granted, free of charge, to any person obtaining a copy +# of this software and associated documentation files (the "Software"), to deal +# in the Software without restriction, including without limitation the rights +# to use, copy, modify, merge, publish, distribute, sublicense, and/or sell +# copies of the Software, and to permit persons to whom the Software is +# furnished to do so, subject to the following conditions: + +# The above copyright notice and this permission notice shall be included in all +# copies or substantial portions of the Software. + +# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR +# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, +# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE +# AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER +# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, +# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE +# SOFTWARE. 
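As a quick illustration of the packing scheme patched in above, the snippet below mirrors the arithmetic of `pack_4bit_u8_common` / `unpack_4bit_u8_common` in standalone form (it deliberately does not import the module, so it can be run in isolation):

```
import torch

# Two 4-bit values share one uint8: even rows go to the high nibble,
# odd rows to the low nibble, halving the height of the tensor.
w = torch.randint(0, 16, (8, 5), dtype=torch.uint8)
packed = (w[::2] << 4) | w[1::2]          # shape (4, 5), as in pack_4bit_u8_common

unpacked = torch.empty_like(w)
unpacked[::2] = packed >> 4
unpacked[1::2] = packed & 0b1111
assert torch.equal(unpacked, w)           # lossless round trip for values in [0, 16)
```

The 2-bit and 3-bit variants follow the same pattern with four values per uint8 and ten values per int32 word; as the docstring notes, `unpack_3bit_i32_common` may return spare rows because the height is rounded up to a multiple of 10.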
+ +import triton +import triton.language as tl +import torch +from typing import Optional + +@triton.autotune( + configs=[ + triton.Config({'BLOCK_SIZE_M': 16, 'BLOCK_SIZE_N': N, + 'BLOCK_SIZE_K': K, 'GROUP_SIZE_M': 1}, + num_stages=S, num_warps=W) for N, K, S, W in + [ +# (32, 16, 1, 2), + (32, 32, 4, 4), +# (32, 32, 5, 2), +# (32, 32, 5, 8), +# (32, 128, 2, 4), +# (64, 32, 2, 4), +# (64, 32, 3, 4), +# (64, 32, 4, 4), +# (64, 32, 4, 8), +# (64, 32, 5, 2), +# (64, 32, 5, 8), +# (64, 64, 3, 8), +# (128, 32, 2, 8), +# (128, 32, 3, 4), +# (128, 32, 3, 8), +# (128, 32, 4, 4), +# (128, 32, 4, 8), +# (256, 32, 3, 8), +# (256, 32, 4, 4), +# (256, 64, 3, 8), + ] + + ], + key=['M', 'N', 'K'], +) +@triton.jit +def matmul4_kernel_transpose( + a_ptr, b_ptr, c_ptr, + scales_ptr, zeros_ptr, + M, N, K, + stride_am, stride_ak, + stride_bn, stride_bk, + stride_cm, stride_cn, + stride_scales_g, stride_scales_n, + stride_zeros_g, stride_zeros_n, + groupsize, NO_GROUPS: tl.constexpr, + BLOCK_SIZE_M: tl.constexpr, BLOCK_SIZE_N: tl.constexpr, BLOCK_SIZE_K: tl.constexpr, + GROUP_SIZE_M: tl.constexpr, +): + """ + Compute the matrix multiplication C = A x B. + A is of shape (M, K) float16 + B is of shape (N//2, K) int32 + C is of shape (M, N) float16 + scales is of shape (G, K) float16 + zeros is of shape (G, K) int32 + groupsize is an int specifying the size of groups for scales and zeros. + G is N // groupsize. + Set NO_GROUPS to groupsize == N, in which case G = 1 and the kernel is more efficient. + + WARNING: This kernel assumes that K is a multiple of BLOCK_SIZE_K. + WARNING: This kernel assumes that N is a multiple of BLOCK_SIZE_N. + WARNING: This kernel assumes that groupsize is a multiple of BLOCK_SIZE_K. + """ + pid = tl.program_id(axis=0) + num_pid_m = tl.cdiv(M, BLOCK_SIZE_M) + num_pid_n = tl.cdiv(N, BLOCK_SIZE_N) + num_pid_k = tl.cdiv(K, BLOCK_SIZE_K) + + num_pid_in_group = GROUP_SIZE_M * num_pid_n + group_id = pid // num_pid_in_group # + first_pid_m = group_id * GROUP_SIZE_M + group_size_m = min(num_pid_m - first_pid_m, GROUP_SIZE_M) + pid_m = first_pid_m + (pid % group_size_m) + pid_n = (pid % num_pid_in_group) // group_size_m + + offs_am = pid_m * BLOCK_SIZE_M + tl.arange(0, BLOCK_SIZE_M) + offs_bn = pid_n * BLOCK_SIZE_N + tl.arange(0, BLOCK_SIZE_N) + offs_k = tl.arange(0, BLOCK_SIZE_K) + a_ptrs = a_ptr + (offs_am[:, None] * stride_am + offs_k[None, :] * stride_ak) # (BLOCK_SIZE_M, BLOCK_SIZE_K) + a_mask = (offs_am[:, None] < M) + # b_ptrs is set up such that it repeats elements along the N axis 2 times + b_ptrs = b_ptr + (offs_k[:, None] * stride_bk + (offs_bn[None, :] // 2) * stride_bn) # (BLOCK_SIZE_K, BLOCK_SIZE_N) + + G = N // groupsize + scales_ptrs = scales_ptr + (offs_bn[None, :] % G) * stride_scales_g # (1, BLOCK_SIZE_N) + zeros_ptrs = zeros_ptr + (offs_bn[None, :] % G) * stride_zeros_g # (1, BLOCK_SIZE_N) + + # shifter is used to extract the 4 bits of each element in the 8-bit word from B + shifter = ((offs_bn + 1) % 2) * 4 + + # If G == 1, scales and zeros are the same for all N, so we can load them once + if NO_GROUPS: + # Fetch scales and zeros; these are per-outfeature and thus reused in the inner loop + scales = tl.load(scales_ptrs) # (BLOCK_SIZE_N,) + zeros = tl.load(zeros_ptrs) # (BLOCK_SIZE_N,), each element is repeated 8 times, int32 + + # Now calculate a block of output of shape (BLOCK_SIZE_M, BLOCK_SIZE_N) + # M is along the batch dimension, N is along the outfeatures dimension, K is along the infeatures dimension + # So this loop is along the infeatures dimension (K) + # It's 
calculating BLOCK_SIZE_M batches in parallel, and for each batch, BLOCK_SIZE_N outfeatures in parallel + accumulator = tl.zeros((BLOCK_SIZE_M, BLOCK_SIZE_N), dtype=tl.float32) + for k in range(0, num_pid_k): + a = tl.load(a_ptrs, mask=a_mask, other=0.) # (BLOCK_SIZE_M, BLOCK_SIZE_K) + b = tl.load(b_ptrs) # (BLOCK_SIZE_K, BLOCK_SIZE_N), but repeated + + if not NO_GROUPS: + offs_k_scale = BLOCK_SIZE_K * k + offs_k + ptr = scales_ptrs + offs_k_scale[:, None] * stride_scales_n # (BLOCK_SIZE_K, BLOCK_SIZE_N,) + scales = tl.load(ptr) # (BLOCK_SIZE_K, BLOCK_SIZE_N,) + ptr = zeros_ptrs + offs_k_scale[:, None] * stride_zeros_n # (BLOCK_SIZE_K, BLOCK_SIZE_N,) + zeros = tl.load(ptr) # (BLOCK_SIZE_K, BLOCK_SIZE_N,) + + # Now we need to unpack b (which is 4-bit values) into 8-bit values + b = (b >> shifter[None, :]) & 0xF # Extract the 4-bit values + b = b.to(tl.float16) + b = (b - zeros) * scales # Scale and shift + + accumulator += tl.dot(a, b) + a_ptrs += BLOCK_SIZE_K * stride_ak + b_ptrs += BLOCK_SIZE_K * stride_bk + + c = accumulator.to(tl.float16) + + # Store the result + offs_cm = pid_m * BLOCK_SIZE_M + tl.arange(0, BLOCK_SIZE_M) + offs_cn = pid_n * BLOCK_SIZE_N + tl.arange(0, BLOCK_SIZE_N) + c_ptrs = c_ptr + stride_cm * offs_cm[:, None] + stride_cn * offs_cn[None, :] + c_mask = (offs_cm[:, None] < M) & (offs_cn[None, :] < N) + tl.store(c_ptrs, accumulator, mask=c_mask) + +def triton_matmul4_transpose(groupsize: int, a: torch.FloatTensor, qweight: torch.IntTensor, scales: torch.FloatTensor, zeros: torch.FloatTensor, bias: Optional[torch.FloatTensor] = None) -> torch.FloatTensor: + """ + Compute the matrix multiplication C = A x B + bias. + Where B is quantized using GPTQ and groupsize = -1 into 4-bit values. + + A is of shape (M, K) float16 + qweight is of shape (N//2, K) int32 + scales is of shape (G, K) float16 + zeros is of shape (G, K) float16 + bias is of shape (1, N) float16 + + groupsize is the number of infeatures in each group. 
+ G = N // groupsize + + C = A @ qweight.T + Returns C of shape (..., N) float16 + """ + assert a.shape[-1] == (qweight.shape[1]) + assert a.is_contiguous(), "A must be contiguous" + assert scales.shape[1] == zeros.shape[1] + assert scales.shape[1] == qweight.shape[1] + + # Flatten a into (-1, K) + x = a.view(-1, a.shape[-1]) + + M, K = x.shape + N = qweight.shape[0] * 2 + # This is based on the possible BLOCK_SIZE_Ks +# assert K % 16 == 0 and K % 32 == 0 and K % 64 == 0 and K % 128 == 0, "K must be a multiple of 16, 32, 64, and 128" + # This is based on the possible BLOCK_SIZE_Ns +# assert N % 16 == 0 and N % 32 == 0 and N % 64 == 0 and N % 128 == 0 and N % 256 == 0, "N must be a multiple of 16, 32, 64, 128, and 256" + # This is based on the possible BLOCK_SIZE_Ks +# assert groupsize % 32 == 0 and groupsize % 64 == 0 and groupsize % 128 == 0, "groupsize must be a multiple of 32, 64, and 128" + + c = torch.empty((M, N), device='cuda', dtype=torch.float16) + + grid = lambda META: ( + triton.cdiv(M, META['BLOCK_SIZE_M']) * triton.cdiv(N, META['BLOCK_SIZE_N']), + ) + matmul4_kernel_transpose[grid]( + x, qweight, c, + scales, zeros, + M, N, K, + x.stride(0), x.stride(1), + qweight.stride(0), qweight.stride(1), + c.stride(0), c.stride(1), + scales.stride(0), scales.stride(1), + zeros.stride(0), zeros.stride(1), + groupsize, groupsize == N, + ) + + # Reshape c + c = c.view(a.shape[:-1] + (N,)) # (..., N) + + # Add bias + if bias is not None: + c = c + bias + + return c + + +@triton.autotune( + configs=[ + triton.Config({'BLOCK_SIZE_M': 16, 'BLOCK_SIZE_N': N, + 'BLOCK_SIZE_K': K, 'GROUP_SIZE_M': 1}, + num_stages=S, num_warps=W) for N, K, S, W in + [ +# (32, 16, 1, 2), + (32, 32, 4, 4), # best +# (32, 32, 5, 2), +# (32, 32, 5, 8), +# (32, 128, 2, 4), +# (64, 32, 2, 4), +# (64, 32, 3, 4), +# (64, 32, 4, 4), +# (64, 32, 4, 8), +# (64, 32, 5, 2), +# (64, 32, 5, 8), +# (64, 64, 3, 8), +# (128, 32, 2, 8), +# (128, 32, 3, 4), +# (128, 32, 3, 8), +# (128, 32, 4, 4), +# (128, 32, 4, 8), +# (256, 32, 3, 8), +# (256, 32, 4, 4), +# (256, 64, 3, 8), + ] + + ], + key=['M', 'N', 'K'], +) +@triton.jit +def matmul2_kernel_transpose( + a_ptr, b_ptr, c_ptr, + scales_ptr, zeros_ptr, + M, N, K, + stride_am, stride_ak, + stride_bn, stride_bk, + stride_cm, stride_cn, + stride_scales_g, stride_scales_n, + stride_zeros_g, stride_zeros_n, + groupsize, NO_GROUPS: tl.constexpr, + BLOCK_SIZE_M: tl.constexpr, BLOCK_SIZE_N: tl.constexpr, BLOCK_SIZE_K: tl.constexpr, + GROUP_SIZE_M: tl.constexpr, +): + """ + Compute the matrix multiplication C = A x B. + A is of shape (M, K) float16 + B is of shape (N // 4, K) int8 + C is of shape (M, N) float16 + scales is of shape (G, K) float16 + zeros is of shape (G, K) int32 + groupsize is an int specifying the size of groups for scales and zeros. + G is N // groupsize. + Set NO_GROUPS to groupsize == N, in which case G = 1 and the kernel is more efficient. + + WARNING: This kernel assumes that K is a multiple of BLOCK_SIZE_K. + WARNING: This kernel assumes that N is a multiple of BLOCK_SIZE_N. + WARNING: This kernel assumes that groupsize is a multiple of BLOCK_SIZE_K. 
+ """ + pid = tl.program_id(axis=0) + num_pid_m = tl.cdiv(M, BLOCK_SIZE_M) + num_pid_n = tl.cdiv(N, BLOCK_SIZE_N) + num_pid_k = tl.cdiv(K, BLOCK_SIZE_K) + + num_pid_in_group = GROUP_SIZE_M * num_pid_n + group_id = pid // num_pid_in_group # + first_pid_m = group_id * GROUP_SIZE_M + group_size_m = min(num_pid_m - first_pid_m, GROUP_SIZE_M) + pid_m = first_pid_m + (pid % group_size_m) + pid_n = (pid % num_pid_in_group) // group_size_m + + offs_am = pid_m * BLOCK_SIZE_M + tl.arange(0, BLOCK_SIZE_M) + offs_bn = pid_n * BLOCK_SIZE_N + tl.arange(0, BLOCK_SIZE_N) + offs_k = tl.arange(0, BLOCK_SIZE_K) + a_ptrs = a_ptr + (offs_am[:, None] * stride_am + offs_k[None, :] * stride_ak) # (BLOCK_SIZE_M, BLOCK_SIZE_K) + a_mask = (offs_am[:, None] < M) + # b_ptrs is set up such that it repeats elements along the N axis 4 times + b_ptrs = b_ptr + (offs_k[:, None] * stride_bk + (offs_bn[None, :] // 4) * stride_bn) # (BLOCK_SIZE_K, BLOCK_SIZE_N) + + G = N // groupsize + scales_ptrs = scales_ptr + (offs_bn[None, :] % G) * stride_scales_g # (1, BLOCK_SIZE_N) + zeros_ptrs = zeros_ptr + (offs_bn[None, :] % G) * stride_zeros_g # (1, BLOCK_SIZE_N) + + # shifter is used to extract the 2 bits of each element in the 8-bit word from B + shifter = (3 - (offs_bn % 4)) * 2 + + # If G == 1, scales and zeros are the same for all N, so we can load them once + if NO_GROUPS: + # Fetch scales and zeros; these are per-outfeature and thus reused in the inner loop + scales = tl.load(scales_ptrs) # (BLOCK_SIZE_N,) + zeros = tl.load(zeros_ptrs) # (BLOCK_SIZE_N,) + + # Now calculate a block of output of shape (BLOCK_SIZE_M, BLOCK_SIZE_N) + # M is along the batch dimension, N is along the outfeatures dimension, K is along the infeatures dimension + # So this loop is along the infeatures dimension (K) + # It's calculating BLOCK_SIZE_M batches in parallel, and for each batch, BLOCK_SIZE_N outfeatures in parallel + accumulator = tl.zeros((BLOCK_SIZE_M, BLOCK_SIZE_N), dtype=tl.float32) + for k in range(0, num_pid_k): + a = tl.load(a_ptrs, mask=a_mask, other=0.) # (BLOCK_SIZE_M, BLOCK_SIZE_K) + b = tl.load(b_ptrs) # (BLOCK_SIZE_K, BLOCK_SIZE_N), but repeated + + if not NO_GROUPS: + offs_k_scale = BLOCK_SIZE_K * k + offs_k + ptr = scales_ptrs + offs_k_scale[:, None] * stride_scales_n # (BLOCK_SIZE_K, BLOCK_SIZE_N,) + scales = tl.load(ptr) # (BLOCK_SIZE_K, BLOCK_SIZE_N,) + ptr = zeros_ptrs + offs_k_scale[:, None] * stride_zeros_n # (BLOCK_SIZE_K, BLOCK_SIZE_N,) + zeros = tl.load(ptr) # (BLOCK_SIZE_K, BLOCK_SIZE_N,) + + # Now we need to unpack b (which is 4-bit values) into 8-bit values + b = (b >> shifter[None, :]) & 0b11 # Extract the 2-bit values + b = b.to(tl.float16) + b = (b - zeros) * scales # Scale and shift + + accumulator += tl.dot(a, b) + a_ptrs += BLOCK_SIZE_K * stride_ak + b_ptrs += BLOCK_SIZE_K * stride_bk + + c = accumulator.to(tl.float16) + + # Store the result + offs_cm = pid_m * BLOCK_SIZE_M + tl.arange(0, BLOCK_SIZE_M) + offs_cn = pid_n * BLOCK_SIZE_N + tl.arange(0, BLOCK_SIZE_N) + c_ptrs = c_ptr + stride_cm * offs_cm[:, None] + stride_cn * offs_cn[None, :] + c_mask = (offs_cm[:, None] < M) & (offs_cn[None, :] < N) + tl.store(c_ptrs, accumulator, mask=c_mask) + +def triton_matmul2_transpose(groupsize: int, a: torch.FloatTensor, qweight: torch.IntTensor, scales: torch.FloatTensor, zeros: torch.FloatTensor, bias: Optional[torch.FloatTensor] = None) -> torch.FloatTensor: + """ + Compute the matrix multiplication C = A x B + bias. + Where B is quantized using GPTQ and groupsize = -1 into 4-bit values. 
+ + A is of shape (M, K) float16 + qweight is of shape (N // 4, K) int32 + scales is of shape (G, K) float16 + zeros is of shape (G, K) float16 + bias is of shape (1, N) float16 + + groupsize is the number of infeatures in each group. + G = N // groupsize + + C = A @ qweight.T + Returns C of shape (..., N) float16 + """ + + assert a.shape[-1] == (qweight.shape[1]) + assert a.is_contiguous(), "A must be contiguous" + assert scales.shape[1] == zeros.shape[1] + assert scales.shape[1] == qweight.shape[1] + + # Flatten a into (-1, K) + x = a.view(-1, a.shape[-1]) + + M, K = x.shape + N = qweight.shape[0] * 4 + # This is based on the possible BLOCK_SIZE_Ks +# assert K % 16 == 0 and K % 32 == 0 and K % 64 == 0 and K % 128 == 0, "K must be a multiple of 16, 32, 64, and 128" + # This is based on the possible BLOCK_SIZE_Ns +# assert N % 16 == 0 and N % 32 == 0 and N % 64 == 0 and N % 128 == 0 and N % 256 == 0, "N must be a multiple of 16, 32, 64, 128, and 256" + # This is based on the possible BLOCK_SIZE_Ks +# assert groupsize % 32 == 0 and groupsize % 64 == 0 and groupsize % 128 == 0, "groupsize must be a multiple of 32, 64, and 128" + + c = torch.empty((M, N), device='cuda', dtype=torch.float16) + + grid = lambda META: ( + triton.cdiv(M, META['BLOCK_SIZE_M']) * triton.cdiv(N, META['BLOCK_SIZE_N']), + ) + matmul2_kernel_transpose[grid]( + x, qweight, c, + scales, zeros, + M, N, K, + x.stride(0), x.stride(1), + qweight.stride(0), qweight.stride(1), + c.stride(0), c.stride(1), + scales.stride(0), scales.stride(1), + zeros.stride(0), zeros.stride(1), + groupsize, groupsize == N, + ) + + # Reshape c + c = c.view(a.shape[:-1] + (N,)) # (..., N) + + # Add bias + if bias is not None: + c = c + bias + + return c + + +@triton.autotune( + configs=[ + triton.Config({'BLOCK_SIZE_M': 16, 'BLOCK_SIZE_N': N, + 'BLOCK_SIZE_K': K, 'GROUP_SIZE_M': 1}, + num_stages=S, num_warps=W) for N, K, S, W in + [ +# (32, 16, 1, 2), +# (32, 32, 4, 4), +# (32, 32, 5, 2), + (32, 32, 5, 8), # best +# (32, 128, 2, 4), +# (64, 32, 2, 4), +# (64, 32, 3, 4), +# (64, 32, 4, 4), +# (64, 32, 4, 8), +# (64, 32, 5, 2), +# (64, 32, 5, 8), +# (64, 64, 3, 8), +# (128, 32, 2, 8), +# (128, 32, 3, 4), +# (128, 32, 3, 8), +# (128, 32, 4, 4), +# (128, 32, 4, 8), +# (256, 32, 3, 8), +# (256, 32, 4, 4), +# (256, 64, 3, 8), + ] + + ], + key=['M', 'N', 'K'], +) +@triton.jit +def matmul3_kernel_transpose( + a_ptr, b_ptr, c_ptr, + scales_ptr, zeros_ptr, + M, N, K, + stride_am, stride_ak, + stride_bn, stride_bk, + stride_cm, stride_cn, + stride_scales_g, stride_scales_n, + stride_zeros_g, stride_zeros_n, + groupsize, NO_GROUPS: tl.constexpr, + BLOCK_SIZE_M: tl.constexpr, BLOCK_SIZE_N: tl.constexpr, BLOCK_SIZE_K: tl.constexpr, + GROUP_SIZE_M: tl.constexpr, +): + """ + Compute the matrix multiplication C = A x B. + A is of shape (M, K) float16 + B is of shape (ceil(N / 10), K) int32 + C is of shape (M, N) float16 + scales is of shape (G, K) float16 + zeros is of shape (G, K) int32 + groupsize is an int specifying the size of groups for scales and zeros. + G is N // groupsize. + Set NO_GROUPS to groupsize == N, in which case G = 1 and the kernel is more efficient. + + WARNING: This kernel assumes that K is a multiple of BLOCK_SIZE_K. + WARNING: This kernel assumes that N is a multiple of BLOCK_SIZE_N. + WARNING: This kernel assumes that groupsize is a multiple of BLOCK_SIZE_K. 
+ """ + pid = tl.program_id(axis=0) + num_pid_m = tl.cdiv(M, BLOCK_SIZE_M) + num_pid_n = tl.cdiv(N, BLOCK_SIZE_N) + num_pid_k = tl.cdiv(K, BLOCK_SIZE_K) + + num_pid_in_group = GROUP_SIZE_M * num_pid_n + group_id = pid // num_pid_in_group # + first_pid_m = group_id * GROUP_SIZE_M + group_size_m = min(num_pid_m - first_pid_m, GROUP_SIZE_M) + pid_m = first_pid_m + (pid % group_size_m) + pid_n = (pid % num_pid_in_group) // group_size_m + + offs_am = pid_m * BLOCK_SIZE_M + tl.arange(0, BLOCK_SIZE_M) + offs_bn = pid_n * BLOCK_SIZE_N + tl.arange(0, BLOCK_SIZE_N) + offs_k = tl.arange(0, BLOCK_SIZE_K) + a_ptrs = a_ptr + (offs_am[:, None] * stride_am + offs_k[None, :] * stride_ak) # (BLOCK_SIZE_M, BLOCK_SIZE_K) + a_mask = (offs_am[:, None] < M) + + # b_ptrs is set up such that it repeats elements along the N axis 10 times + b_ptrs = b_ptr + (offs_k[:, None] * stride_bk + (offs_bn[None, :] // 10) * stride_bn) # (BLOCK_SIZE_K, BLOCK_SIZE_N) + + G = N // groupsize + scales_ptrs = scales_ptr + (offs_bn[None, :] % G) * stride_scales_g # (1, BLOCK_SIZE_N) + zeros_ptrs = zeros_ptr + (offs_bn[None, :] % G) * stride_zeros_g # (1, BLOCK_SIZE_N) + + # shifter is used to extract the 3 bits of each element in the 32-bit word from B + shifter = (9 - (offs_bn % 10)) * 3 + + # If G == 1, scales and zeros are the same for all N, so we can load them once + if NO_GROUPS: + # Fetch scales and zeros; these are per-outfeature and thus reused in the inner loop + scales = tl.load(scales_ptrs) # (BLOCK_SIZE_N,) + zeros = tl.load(zeros_ptrs) # (BLOCK_SIZE_N,) + + # Now calculate a block of output of shape (BLOCK_SIZE_M, BLOCK_SIZE_N) + # M is along the batch dimension, N is along the outfeatures dimension, K is along the infeatures dimension + # So this loop is along the infeatures dimension (K) + # It's calculating BLOCK_SIZE_M batches in parallel, and for each batch, BLOCK_SIZE_N outfeatures in parallel + accumulator = tl.zeros((BLOCK_SIZE_M, BLOCK_SIZE_N), dtype=tl.float32) + for k in range(0, num_pid_k): + a = tl.load(a_ptrs, mask=a_mask, other=0.) # (BLOCK_SIZE_M, BLOCK_SIZE_K) + b = tl.load(b_ptrs) # (BLOCK_SIZE_K, BLOCK_SIZE_N), but repeated + + if not NO_GROUPS: + offs_k_scale = BLOCK_SIZE_K * k + offs_k + ptr = scales_ptrs + offs_k_scale[:, None] * stride_scales_n # (BLOCK_SIZE_K, BLOCK_SIZE_N,) + scales = tl.load(ptr) # (BLOCK_SIZE_K, BLOCK_SIZE_N,) + ptr = zeros_ptrs + offs_k_scale[:, None] * stride_zeros_n # (BLOCK_SIZE_K, BLOCK_SIZE_N,) + zeros = tl.load(ptr) # (BLOCK_SIZE_K, BLOCK_SIZE_N,) + + # Now we need to unpack b (which is 3-bit values into 32-bit values) + b = (b >> shifter[None, :]) & 0b111 # Extract the 3-bit values + b = b.to(tl.float16) + b = (b - zeros) * scales # Scale and shift + + accumulator += tl.dot(a, b) + a_ptrs += BLOCK_SIZE_K * stride_ak + b_ptrs += BLOCK_SIZE_K * stride_bk + + c = accumulator.to(tl.float16) + + # Store the result + offs_cm = pid_m * BLOCK_SIZE_M + tl.arange(0, BLOCK_SIZE_M) + offs_cn = pid_n * BLOCK_SIZE_N + tl.arange(0, BLOCK_SIZE_N) + c_ptrs = c_ptr + stride_cm * offs_cm[:, None] + stride_cn * offs_cn[None, :] + c_mask = (offs_cm[:, None] < M) & (offs_cn[None, :] < N) + tl.store(c_ptrs, accumulator, mask=c_mask) + +def triton_matmul3_transpose(groupsize: int, a: torch.FloatTensor, qweight: torch.IntTensor, scales: torch.FloatTensor, zeros: torch.FloatTensor, N: int, bias: Optional[torch.FloatTensor] = None) -> torch.FloatTensor: + """ + Compute the matrix multiplication C = A x B + bias. + Where B is quantized using GPTQ and groupsize = -1 into 4-bit values. 
+ + A is of shape (M, K) float16 + qweight is of shape (ceil(N / 10), K) int32 + scales is of shape (G, K) float16 + zeros is of shape (G, K) float16 + bias is of shape (1, N) float16 + + groupsize is the number of infeatures in each group. + G = N // groupsize + + C = A @ qweight.T + Returns C of shape (..., N) float16 + """ + + assert a.shape[-1] == (qweight.shape[1]) + assert a.is_contiguous(), "A must be contiguous" + assert scales.shape[1] == zeros.shape[1] + assert scales.shape[1] == qweight.shape[1] + + # Flatten a into (-1, K) + x = a.view(-1, a.shape[-1]) + + M, K = x.shape + assert 0 <= (qweight.shape[0] * 10 - N) < 10 + + c = torch.empty((M, N), device='cuda', dtype=torch.float16) + + grid = lambda META: ( + triton.cdiv(M, META['BLOCK_SIZE_M']) * triton.cdiv(N, META['BLOCK_SIZE_N']), + ) + matmul3_kernel_transpose[grid]( + x, qweight, c, + scales, zeros, + M, N, K, + x.stride(0), x.stride(1), + qweight.stride(0), qweight.stride(1), + c.stride(0), c.stride(1), + scales.stride(0), scales.stride(1), + zeros.stride(0), zeros.stride(1), + groupsize, groupsize == N, + ) + + # Reshape c + c = c.view(a.shape[:-1] + (N,)) # (..., N) + + # Add bias + if bias is not None: + c = c + bias + + return c \ No newline at end of file diff --git a/text2text/mixtral/utils.py b/text2text/mixtral/utils.py new file mode 100644 index 0000000..32a2464 --- /dev/null +++ b/text2text/mixtral/utils.py @@ -0,0 +1,123 @@ +# MIT License +# +# Copyright (c) 2023 Artyom Eliseev, Denis Mazur +# +# Permission is hereby granted, free of charge, to any person obtaining a copy +# of this software and associated documentation files (the "Software"), to deal +# in the Software without restriction, including without limitation the rights +# to use, copy, modify, merge, publish, distribute, sublicense, and/or sell +# copies of the Software, and to permit persons to whom the Software is +# furnished to do so, subject to the following conditions: + +# The above copyright notice and this permission notice shall be included in all +# copies or substantial portions of the Software. + +# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR +# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, +# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE +# AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER +# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, +# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE +# SOFTWARE. + +from contextlib import contextmanager +import torch +""" utility functions that help you process nested dicts, tuples, lists and namedtuples """ + + +def nested_compare(t, u): + """ + Return whether nested structure of t1 and t2 matches. + """ + if isinstance(t, (list, tuple)): + if not isinstance(u, type(t)): + return False + if len(t) != len(u): + return False + for a, b in zip(t, u): + if not nested_compare(a, b): + return False + return True + + if isinstance(t, dict): + if not isinstance(u, dict): + return False + if set(t.keys()) != set(u.keys()): + return False + for k in t: + if not nested_compare(t[k], u[k]): + return False + return True + + else: + return True + + +def nested_flatten(t): + """ + Turn nested list/tuple/dict into a flat iterator. 
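For sanity-checking the 4-bit kernel above on small shapes, its unpack-and-dequantize step can be mirrored in eager PyTorch. The following is a rough, untested sketch (not part of the patch) that follows the kernel's grouped-path indexing, where scales and zeros are read as `[n % G, k]`:

```
import torch

def dequant4_transpose_reference(qweight, scales, zeros, groupsize):
    """Eager-mode mirror of the unpack/dequant math in matmul4_kernel_transpose."""
    N, K = qweight.shape[0] * 2, qweight.shape[1]
    G = N // groupsize
    n = torch.arange(N, device=qweight.device)
    shift = ((n + 1) % 2) * 4                    # even n: high nibble, odd n: low nibble
    raw = (qweight[n // 2, :].to(torch.int32) >> shift[:, None]) & 0xF
    return (raw.to(torch.float16) - zeros[n % G, :]) * scales[n % G, :]   # (N, K)

# triton_matmul4_transpose(...) then corresponds to a @ W_deq.T (+ bias), where
# W_deq = dequant4_transpose_reference(qweight, scales, zeros, groupsize).
```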
+ """ + if isinstance(t, (list, tuple)): + for x in t: + yield from nested_flatten(x) + elif isinstance(t, dict): + for k, v in sorted(t.items()): + yield from nested_flatten(v) + else: + yield t + + +def nested_pack(flat, structure): + """ + Restore nested structure from flattened state + :param flat: result of nested_flatten + :param structure: used as example when recovering structure + :returns: nested structure like :structure: filled with elements of :flat: + """ + return _nested_pack(iter(flat), structure) + + +def _nested_pack(flat_iter, structure): + if is_namedtuple(structure): + return type(structure)(*[_nested_pack(flat_iter, x) for x in structure]) + elif isinstance(structure, (list, tuple)): + return type(structure)(_nested_pack(flat_iter, x) for x in structure) + elif isinstance(structure, dict): + return {k: _nested_pack(flat_iter, v) for k, v in sorted(structure.items())} + else: + return next(flat_iter) + + +def is_namedtuple(x): + """Checks if x is a namedtuple instance. Taken from https://stackoverflow.com/a/2166841 .""" + t = type(x) + b = t.__bases__ + if len(b) != 1 or b[0] != tuple: + return False + f = getattr(t, "_fields", None) + if not isinstance(f, tuple): + return False + return all(type(n) == str for n in f) + + +def nested_map(fn, *t): + # Check arguments. + if not t: + raise ValueError("Expected 2+ arguments, got 1") + for i in range(1, len(t)): + if not nested_compare(t[0], t[i]): + msg = "Nested structure of %r and %r differs" + raise ValueError(msg % (t[0], t[i])) + + flat = map(nested_flatten, t) + return nested_pack(map(fn, *flat), t[0]) + +@contextmanager +def with_default_dtype(dtype): + _dtype_original = torch.get_default_dtype() + + try: + torch.set_default_dtype(dtype) + yield + finally: + torch.set_default_dtype(_dtype_original) \ No newline at end of file
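To close, a small hedged example of how the nested helpers and `with_default_dtype` above compose; the dict layout is arbitrary and chosen only for illustration:

```
import torch

# Flatten a nested dict of tensors, transform the leaves, and restore the structure.
state = {"w1": {"W_q": torch.zeros(2), "meta": 1},
         "w2": {"W_q": torch.ones(2), "meta": 2}}
leaves = list(nested_flatten(state))              # depth-first, keys visited in sorted order
doubled = nested_pack((x * 2 if isinstance(x, torch.Tensor) else x for x in leaves), state)
assert torch.equal(doubled["w2"]["W_q"], torch.full((2,), 2.0))

# with_default_dtype temporarily switches torch's default dtype, e.g. when
# instantiating half-precision modules, and restores it afterwards.
with with_default_dtype(torch.float16):
    assert torch.empty(3).dtype == torch.float16
```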