llm-finetuning

Форк
0
/
12_Fine_tuning_Microsoft_Phi_1_5b_on_custom_dataset(dialogstudio).ipynb 
8454 строки · 342.3 Кб
1
{
2
  "cells": [
3
    {
4
      "cell_type": "markdown",
5
      "metadata": {
6
        "id": "view-in-github",
7
        "colab_type": "text"
8
      },
9
      "source": [
10
        "<a href=\"https://colab.research.google.com/github/ashishpatel26/LLM-Finetuning/blob/main/12_Fine_tuning_Microsoft_Phi_1_5b_on_custom_dataset(dialogstudio).ipynb\" target=\"_parent\"><img src=\"https://colab.research.google.com/assets/colab-badge.svg\" alt=\"Open In Colab\"/></a>"
11
      ]
12
    },
13
    {
14
      "cell_type": "code",
15
      "execution_count": 1,
16
      "metadata": {
17
        "colab": {
18
          "base_uri": "https://localhost:8080/"
19
        },
20
        "id": "SwcwXRajHelL",
21
        "outputId": "df5a4f77-5b26-42e9-b04d-7d238c321c41"
22
      },
23
      "outputs": [
24
        {
25
          "output_type": "stream",
26
          "name": "stdout",
27
          "text": [
28
            "Thu Sep 21 11:23:52 2023       \n",
29
            "+-----------------------------------------------------------------------------+\n",
30
            "| NVIDIA-SMI 525.105.17   Driver Version: 525.105.17   CUDA Version: 12.0     |\n",
31
            "|-------------------------------+----------------------+----------------------+\n",
32
            "| GPU  Name        Persistence-M| Bus-Id        Disp.A | Volatile Uncorr. ECC |\n",
33
            "| Fan  Temp  Perf  Pwr:Usage/Cap|         Memory-Usage | GPU-Util  Compute M. |\n",
34
            "|                               |                      |               MIG M. |\n",
35
            "|===============================+======================+======================|\n",
36
            "|   0  Tesla T4            Off  | 00000000:00:04.0 Off |                    0 |\n",
37
            "| N/A   60C    P8    11W /  70W |      0MiB / 15360MiB |      0%      Default |\n",
38
            "|                               |                      |                  N/A |\n",
39
            "+-------------------------------+----------------------+----------------------+\n",
40
            "                                                                               \n",
41
            "+-----------------------------------------------------------------------------+\n",
42
            "| Processes:                                                                  |\n",
43
            "|  GPU   GI   CI        PID   Type   Process name                  GPU Memory |\n",
44
            "|        ID   ID                                                   Usage      |\n",
45
            "|=============================================================================|\n",
46
            "|  No running processes found                                                 |\n",
47
            "+-----------------------------------------------------------------------------+\n"
48
          ]
49
        }
50
      ],
51
      "source": [
52
        "!nvidia-smi"
53
      ]
54
    },
55
    {
56
      "cell_type": "code",
57
      "source": [
58
        "!pip install accelerate transformers einops datasets peft bitsandbytes trl"
59
      ],
60
      "metadata": {
61
        "colab": {
62
          "base_uri": "https://localhost:8080/"
63
        },
64
        "id": "wH8jsePrSGTH",
65
        "outputId": "53bf1128-bbbb-4319-c7bb-21820389d3f6"
66
      },
67
      "execution_count": 2,
68
      "outputs": [
69
        {
70
          "output_type": "stream",
71
          "name": "stdout",
72
          "text": [
73
            "Collecting accelerate\n",
74
            "  Downloading accelerate-0.23.0-py3-none-any.whl (258 kB)\n",
75
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m258.1/258.1 kB\u001b[0m \u001b[31m3.9 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
76
            "\u001b[?25hCollecting transformers\n",
77
            "  Downloading transformers-4.33.2-py3-none-any.whl (7.6 MB)\n",
78
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m7.6/7.6 MB\u001b[0m \u001b[31m18.8 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
79
            "\u001b[?25hCollecting einops\n",
80
            "  Downloading einops-0.6.1-py3-none-any.whl (42 kB)\n",
81
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m42.2/42.2 kB\u001b[0m \u001b[31m5.0 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
82
            "\u001b[?25hCollecting datasets\n",
83
            "  Downloading datasets-2.14.5-py3-none-any.whl (519 kB)\n",
84
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m519.6/519.6 kB\u001b[0m \u001b[31m26.7 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
85
            "\u001b[?25hCollecting peft\n",
86
            "  Downloading peft-0.5.0-py3-none-any.whl (85 kB)\n",
87
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m85.6/85.6 kB\u001b[0m \u001b[31m9.6 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
88
            "\u001b[?25hCollecting bitsandbytes\n",
89
            "  Downloading bitsandbytes-0.41.1-py3-none-any.whl (92.6 MB)\n",
90
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m92.6/92.6 MB\u001b[0m \u001b[31m11.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
91
            "\u001b[?25hCollecting trl\n",
92
            "  Downloading trl-0.7.1-py3-none-any.whl (117 kB)\n",
93
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m118.0/118.0 kB\u001b[0m \u001b[31m16.0 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
94
            "\u001b[?25hRequirement already satisfied: numpy>=1.17 in /usr/local/lib/python3.10/dist-packages (from accelerate) (1.23.5)\n",
95
            "Requirement already satisfied: packaging>=20.0 in /usr/local/lib/python3.10/dist-packages (from accelerate) (23.1)\n",
96
            "Requirement already satisfied: psutil in /usr/local/lib/python3.10/dist-packages (from accelerate) (5.9.5)\n",
97
            "Requirement already satisfied: pyyaml in /usr/local/lib/python3.10/dist-packages (from accelerate) (6.0.1)\n",
98
            "Requirement already satisfied: torch>=1.10.0 in /usr/local/lib/python3.10/dist-packages (from accelerate) (2.0.1+cu118)\n",
99
            "Collecting huggingface-hub (from accelerate)\n",
100
            "  Downloading huggingface_hub-0.17.2-py3-none-any.whl (294 kB)\n",
101
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m294.9/294.9 kB\u001b[0m \u001b[31m33.3 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
102
            "\u001b[?25hRequirement already satisfied: filelock in /usr/local/lib/python3.10/dist-packages (from transformers) (3.12.2)\n",
103
            "Requirement already satisfied: regex!=2019.12.17 in /usr/local/lib/python3.10/dist-packages (from transformers) (2023.6.3)\n",
104
            "Requirement already satisfied: requests in /usr/local/lib/python3.10/dist-packages (from transformers) (2.31.0)\n",
105
            "Collecting tokenizers!=0.11.3,<0.14,>=0.11.1 (from transformers)\n",
106
            "  Downloading tokenizers-0.13.3-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (7.8 MB)\n",
107
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m7.8/7.8 MB\u001b[0m \u001b[31m114.7 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
108
            "\u001b[?25hCollecting safetensors>=0.3.1 (from transformers)\n",
109
            "  Downloading safetensors-0.3.3-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (1.3 MB)\n",
110
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m1.3/1.3 MB\u001b[0m \u001b[31m81.0 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
111
            "\u001b[?25hRequirement already satisfied: tqdm>=4.27 in /usr/local/lib/python3.10/dist-packages (from transformers) (4.66.1)\n",
112
            "Requirement already satisfied: pyarrow>=8.0.0 in /usr/local/lib/python3.10/dist-packages (from datasets) (9.0.0)\n",
113
            "Collecting dill<0.3.8,>=0.3.0 (from datasets)\n",
114
            "  Downloading dill-0.3.7-py3-none-any.whl (115 kB)\n",
115
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m115.3/115.3 kB\u001b[0m \u001b[31m14.4 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
116
            "\u001b[?25hRequirement already satisfied: pandas in /usr/local/lib/python3.10/dist-packages (from datasets) (1.5.3)\n",
117
            "Collecting xxhash (from datasets)\n",
118
            "  Downloading xxhash-3.3.0-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (194 kB)\n",
119
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m194.1/194.1 kB\u001b[0m \u001b[31m23.7 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
120
            "\u001b[?25hCollecting multiprocess (from datasets)\n",
121
            "  Downloading multiprocess-0.70.15-py310-none-any.whl (134 kB)\n",
122
            "\u001b[2K     \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m134.8/134.8 kB\u001b[0m \u001b[31m17.0 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
123
            "\u001b[?25hRequirement already satisfied: fsspec[http]<2023.9.0,>=2023.1.0 in /usr/local/lib/python3.10/dist-packages (from datasets) (2023.6.0)\n",
124
            "Requirement already satisfied: aiohttp in /usr/local/lib/python3.10/dist-packages (from datasets) (3.8.5)\n",
125
            "Requirement already satisfied: attrs>=17.3.0 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets) (23.1.0)\n",
126
            "Requirement already satisfied: charset-normalizer<4.0,>=2.0 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets) (3.2.0)\n",
127
            "Requirement already satisfied: multidict<7.0,>=4.5 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets) (6.0.4)\n",
128
            "Requirement already satisfied: async-timeout<5.0,>=4.0.0a3 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets) (4.0.3)\n",
129
            "Requirement already satisfied: yarl<2.0,>=1.0 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets) (1.9.2)\n",
130
            "Requirement already satisfied: frozenlist>=1.1.1 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets) (1.4.0)\n",
131
            "Requirement already satisfied: aiosignal>=1.1.2 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets) (1.3.1)\n",
132
            "Requirement already satisfied: typing-extensions>=3.7.4.3 in /usr/local/lib/python3.10/dist-packages (from huggingface-hub->accelerate) (4.5.0)\n",
133
            "Requirement already satisfied: idna<4,>=2.5 in /usr/local/lib/python3.10/dist-packages (from requests->transformers) (3.4)\n",
134
            "Requirement already satisfied: urllib3<3,>=1.21.1 in /usr/local/lib/python3.10/dist-packages (from requests->transformers) (2.0.4)\n",
135
            "Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.10/dist-packages (from requests->transformers) (2023.7.22)\n",
136
            "Requirement already satisfied: sympy in /usr/local/lib/python3.10/dist-packages (from torch>=1.10.0->accelerate) (1.12)\n",
137
            "Requirement already satisfied: networkx in /usr/local/lib/python3.10/dist-packages (from torch>=1.10.0->accelerate) (3.1)\n",
138
            "Requirement already satisfied: jinja2 in /usr/local/lib/python3.10/dist-packages (from torch>=1.10.0->accelerate) (3.1.2)\n",
139
            "Requirement already satisfied: triton==2.0.0 in /usr/local/lib/python3.10/dist-packages (from torch>=1.10.0->accelerate) (2.0.0)\n",
140
            "Requirement already satisfied: cmake in /usr/local/lib/python3.10/dist-packages (from triton==2.0.0->torch>=1.10.0->accelerate) (3.27.4.1)\n",
141
            "Requirement already satisfied: lit in /usr/local/lib/python3.10/dist-packages (from triton==2.0.0->torch>=1.10.0->accelerate) (16.0.6)\n",
142
            "Requirement already satisfied: python-dateutil>=2.8.1 in /usr/local/lib/python3.10/dist-packages (from pandas->datasets) (2.8.2)\n",
143
            "Requirement already satisfied: pytz>=2020.1 in /usr/local/lib/python3.10/dist-packages (from pandas->datasets) (2023.3.post1)\n",
144
            "Requirement already satisfied: six>=1.5 in /usr/local/lib/python3.10/dist-packages (from python-dateutil>=2.8.1->pandas->datasets) (1.16.0)\n",
145
            "Requirement already satisfied: MarkupSafe>=2.0 in /usr/local/lib/python3.10/dist-packages (from jinja2->torch>=1.10.0->accelerate) (2.1.3)\n",
146
            "Requirement already satisfied: mpmath>=0.19 in /usr/local/lib/python3.10/dist-packages (from sympy->torch>=1.10.0->accelerate) (1.3.0)\n",
147
            "Installing collected packages: tokenizers, safetensors, bitsandbytes, xxhash, einops, dill, multiprocess, huggingface-hub, transformers, datasets, accelerate, trl, peft\n",
148
            "Successfully installed accelerate-0.23.0 bitsandbytes-0.41.1 datasets-2.14.5 dill-0.3.7 einops-0.6.1 huggingface-hub-0.17.2 multiprocess-0.70.15 peft-0.5.0 safetensors-0.3.3 tokenizers-0.13.3 transformers-4.33.2 trl-0.7.1 xxhash-3.3.0\n"
149
          ]
150
        }
151
      ]
152
    },
153
    {
154
      "cell_type": "code",
155
      "execution_count": 3,
156
      "metadata": {
157
        "id": "rpf1Z0k4RJM6"
158
      },
159
      "outputs": [],
160
      "source": [
161
        "# !pip install -Uqqq pip --progress-bar off\n",
162
        "# !pip install -qqq torch==2.0.1 --progress-bar off\n",
163
        "# !pip install -qqq transformers==4.32.1 --progress-bar off\n",
164
        "# !pip install -qqq datasets==2.14.4 --progress-bar off\n",
165
        "# !pip install -qqq peft==0.5.0 --progress-bar off\n",
166
        "# !pip install -qqq bitsandbytes==0.41.1 --progress-bar off\n",
167
        "# !pip install -qqq trl==0.7.1 --progress-bar off"
168
      ]
169
    },
170
    {
171
      "cell_type": "code",
172
      "execution_count": 6,
173
      "metadata": {
174
        "id": "P1PG0WSvRqVq"
175
      },
176
      "outputs": [],
177
      "source": [
178
        "import json\n",
179
        "import re\n",
180
        "from pprint import pprint\n",
181
        "import os\n",
182
        "\n",
183
        "import pandas as pd\n",
184
        "import torch\n",
185
        "from datasets import Dataset, load_dataset\n",
186
        "from huggingface_hub import notebook_login\n",
187
        "from peft import LoraConfig, PeftModel, get_peft_model\n",
188
        "from transformers import (\n",
189
        "    AutoModelForCausalLM,\n",
190
        "    AutoTokenizer,\n",
191
        "    BitsAndBytesConfig,\n",
192
        "    TrainingArguments,\n",
193
        "    DataCollatorForLanguageModeling,\n",
194
        "    BitsAndBytesConfig\n",
195
        ")\n",
196
        "from trl import SFTTrainer\n",
197
        "\n",
198
        "DEVICE = \"cuda:0\" if torch.cuda.is_available() else \"cpu\"\n",
199
        "MODEL_NAME = \"microsoft/phi-1_5\""
200
      ]
201
    },
202
    {
203
      "cell_type": "markdown",
204
      "metadata": {
205
        "id": "4ixsX2Y4doEf"
206
      },
207
      "source": [
208
        "## Data"
209
      ]
210
    },
211
    {
212
      "cell_type": "code",
213
      "source": [
214
        "dataset = load_dataset(\"Salesforce/dialogstudio\", \"TweetSumm\")\n",
215
        "dataset"
216
      ],
217
      "metadata": {
218
        "colab": {
219
          "base_uri": "https://localhost:8080/"
220
        },
221
        "id": "Kc0CVTtUkWvl",
222
        "outputId": "b078c12b-4a06-49e1-f101-3fdc40a7f5dd"
223
      },
224
      "execution_count": 7,
225
      "outputs": [
226
        {
227
          "output_type": "execute_result",
228
          "data": {
229
            "text/plain": [
230
              "DatasetDict({\n",
231
              "    train: Dataset({\n",
232
              "        features: ['original dialog id', 'new dialog id', 'dialog index', 'original dialog info', 'log', 'prompt'],\n",
233
              "        num_rows: 879\n",
234
              "    })\n",
235
              "    validation: Dataset({\n",
236
              "        features: ['original dialog id', 'new dialog id', 'dialog index', 'original dialog info', 'log', 'prompt'],\n",
237
              "        num_rows: 110\n",
238
              "    })\n",
239
              "    test: Dataset({\n",
240
              "        features: ['original dialog id', 'new dialog id', 'dialog index', 'original dialog info', 'log', 'prompt'],\n",
241
              "        num_rows: 110\n",
242
              "    })\n",
243
              "})"
244
            ]
245
          },
246
          "metadata": {},
247
          "execution_count": 7
248
        }
249
      ]
250
    },
251
    {
252
      "cell_type": "code",
253
      "source": [
254
        "DEFAULT_SYSTEM_PROMPT = \"\"\"\n",
255
        "Below is a conversation between a human and an AI agent. Write a summary of the conversation.\n",
256
        "\"\"\".strip()\n",
257
        "\n",
258
        "\n",
259
        "def generate_training_prompt(\n",
260
        "    conversation: str, summary: str, system_prompt: str = DEFAULT_SYSTEM_PROMPT\n",
261
        ") -> str:\n",
262
        "    return f\"\"\"### Instruction: {system_prompt}\n",
263
        "\n",
264
        "### Input:\n",
265
        "{conversation.strip()}\n",
266
        "\n",
267
        "### Response:\n",
268
        "{summary}\n",
269
        "\"\"\".strip()"
270
      ],
271
      "metadata": {
272
        "id": "fbx71jhaMGK5"
273
      },
274
      "execution_count": 8,
275
      "outputs": []
276
    },
277
    {
278
      "cell_type": "code",
279
      "source": [
280
        "def clean_text(text):\n",
281
        "    text = re.sub(r\"http\\S+\", \"\", text)\n",
282
        "    text = re.sub(r\"@[^\\s]+\", \"\", text)\n",
283
        "    text = re.sub(r\"\\s+\", \" \", text)\n",
284
        "    return re.sub(r\"\\^[^ ]+\", \"\", text)\n",
285
        "\n",
286
        "\n",
287
        "def create_conversation_text(data_point):\n",
288
        "    text = \"\"\n",
289
        "    for item in data_point[\"log\"]:\n",
290
        "        user = clean_text(item[\"user utterance\"])\n",
291
        "        text += f\"user: {user.strip()}\\n\"\n",
292
        "\n",
293
        "        agent = clean_text(item[\"system response\"])\n",
294
        "        text += f\"agent: {agent.strip()}\\n\"\n",
295
        "\n",
296
        "    return text"
297
      ],
298
      "metadata": {
299
        "id": "gMfzUJVOR9Lr"
300
      },
301
      "execution_count": 9,
302
      "outputs": []
303
    },
304
    {
305
      "cell_type": "code",
306
      "source": [
307
        "def generate_text(data_point):\n",
308
        "    summaries = json.loads(data_point[\"original dialog info\"])[\"summaries\"][\n",
309
        "        \"abstractive_summaries\"\n",
310
        "    ]\n",
311
        "    summary = summaries[0]\n",
312
        "    summary = \" \".join(summary)\n",
313
        "\n",
314
        "    conversation_text = create_conversation_text(data_point)\n",
315
        "    return {\n",
316
        "        \"conversation\": conversation_text,\n",
317
        "        \"summary\": summary,\n",
318
        "        \"text\": generate_training_prompt(conversation_text, summary),\n",
319
        "    }"
320
      ],
321
      "metadata": {
322
        "id": "eRbskn48QNfW"
323
      },
324
      "execution_count": 10,
325
      "outputs": []
326
    },
327
    {
328
      "cell_type": "code",
329
      "source": [
330
        "example = generate_text(dataset[\"train\"][0])"
331
      ],
332
      "metadata": {
333
        "id": "J9VuGHGYSR5q"
334
      },
335
      "execution_count": 11,
336
      "outputs": []
337
    },
338
    {
339
      "cell_type": "code",
340
      "source": [
341
        "print(example[\"summary\"])"
342
      ],
343
      "metadata": {
344
        "colab": {
345
          "base_uri": "https://localhost:8080/"
346
        },
347
        "id": "ycfL7LvHSu2h",
348
        "outputId": "0ed47942-4843-4427-de4d-92f37c84504e"
349
      },
350
      "execution_count": 12,
351
      "outputs": [
352
        {
353
          "output_type": "stream",
354
          "name": "stdout",
355
          "text": [
356
            "Customer enquired about his Iphone and Apple watch which is not showing his any steps/activity and health activities. Agent is asking to move to DM and look into it.\n"
357
          ]
358
        }
359
      ]
360
    },
361
    {
362
      "cell_type": "code",
363
      "source": [
364
        "print(example[\"conversation\"])"
365
      ],
366
      "metadata": {
367
        "colab": {
368
          "base_uri": "https://localhost:8080/"
369
        },
370
        "id": "eL7EDMq_SxlJ",
371
        "outputId": "946ec8e8-58a5-4afb-abfa-49a9239097d0"
372
      },
373
      "execution_count": 13,
374
      "outputs": [
375
        {
376
          "output_type": "stream",
377
          "name": "stdout",
378
          "text": [
379
            "user: So neither my iPhone nor my Apple Watch are recording my steps/activity, and Health doesn’t recognise either source anymore for some reason. Any ideas? please read the above.\n",
380
            "agent: Let’s investigate this together. To start, can you tell us the software versions your iPhone and Apple Watch are running currently?\n",
381
            "user: My iPhone is on 11.1.2, and my watch is on 4.1.\n",
382
            "agent: Thank you. Have you tried restarting both devices since this started happening?\n",
383
            "user: I’ve restarted both, also un-paired then re-paired the watch.\n",
384
            "agent: Got it. When did you first notice that the two devices were not talking to each other. Do the two devices communicate through other apps such as Messages?\n",
385
            "user: Yes, everything seems fine, it’s just Health and activity.\n",
386
            "agent: Let’s move to DM and look into this a bit more. When reaching out in DM, let us know when this first started happening please. For example, did it start after an update or after installing a certain app?\n",
387
            "\n"
388
          ]
389
        }
390
      ]
391
    },
392
    {
393
      "cell_type": "code",
394
      "source": [
395
        "print(example[\"text\"])"
396
      ],
397
      "metadata": {
398
        "colab": {
399
          "base_uri": "https://localhost:8080/"
400
        },
401
        "id": "BbiL_o5dZZhg",
402
        "outputId": "af672c10-5160-4167-ad33-aeeea5b1ebbd"
403
      },
404
      "execution_count": 14,
405
      "outputs": [
406
        {
407
          "output_type": "stream",
408
          "name": "stdout",
409
          "text": [
410
            "### Instruction: Below is a conversation between a human and an AI agent. Write a summary of the conversation.\n",
411
            "\n",
412
            "### Input:\n",
413
            "user: So neither my iPhone nor my Apple Watch are recording my steps/activity, and Health doesn’t recognise either source anymore for some reason. Any ideas? please read the above.\n",
414
            "agent: Let’s investigate this together. To start, can you tell us the software versions your iPhone and Apple Watch are running currently?\n",
415
            "user: My iPhone is on 11.1.2, and my watch is on 4.1.\n",
416
            "agent: Thank you. Have you tried restarting both devices since this started happening?\n",
417
            "user: I’ve restarted both, also un-paired then re-paired the watch.\n",
418
            "agent: Got it. When did you first notice that the two devices were not talking to each other. Do the two devices communicate through other apps such as Messages?\n",
419
            "user: Yes, everything seems fine, it’s just Health and activity.\n",
420
            "agent: Let’s move to DM and look into this a bit more. When reaching out in DM, let us know when this first started happening please. For example, did it start after an update or after installing a certain app?\n",
421
            "\n",
422
            "### Response:\n",
423
            "Customer enquired about his Iphone and Apple watch which is not showing his any steps/activity and health activities. Agent is asking to move to DM and look into it.\n"
424
          ]
425
        }
426
      ]
427
    },
428
    {
429
      "cell_type": "code",
430
      "source": [
431
        "def process_dataset(data: Dataset):\n",
432
        "    return (\n",
433
        "        data.shuffle(seed=42)\n",
434
        "        .map(generate_text)\n",
435
        "        .remove_columns(\n",
436
        "            [\n",
437
        "                \"original dialog id\",\n",
438
        "                \"new dialog id\",\n",
439
        "                \"dialog index\",\n",
440
        "                \"original dialog info\",\n",
441
        "                \"log\",\n",
442
        "                \"prompt\",\n",
443
        "            ]\n",
444
        "        )\n",
445
        "    )"
446
      ],
447
      "metadata": {
448
        "id": "jKidKeUpZkPb"
449
      },
450
      "execution_count": 15,
451
      "outputs": []
452
    },
453
    {
454
      "cell_type": "code",
455
      "source": [
456
        "dataset[\"train\"] = process_dataset(dataset[\"train\"])\n",
457
        "dataset[\"validation\"] = process_dataset(dataset[\"validation\"])\n",
458
        "dataset[\"test\"] = process_dataset(dataset[\"test\"])"
459
      ],
460
      "metadata": {
461
        "id": "XHy1pVjlaLtm"
462
      },
463
      "execution_count": 16,
464
      "outputs": []
465
    },
466
    {
467
      "cell_type": "markdown",
468
      "metadata": {
469
        "id": "usDeQuT2Wssl"
470
      },
471
      "source": [
472
        "## Model"
473
      ]
474
    },
475
    {
476
      "cell_type": "code",
477
      "execution_count": 24,
478
      "metadata": {
479
        "colab": {
480
          "base_uri": "https://localhost:8080/",
481
          "height": 145,
482
          "referenced_widgets": [
483
            "96ef5be98b5c4f2c9945b1a8c0989d7b",
484
            "29aca8e4365b4bee99d5292d8e74cdd6",
485
            "c83294f6ba864858a05d5222d84eb0c3",
486
            "7254587396ba4701835ee666ee3b697b",
487
            "896def48ce8148f18a13b0a46d0919b3",
488
            "5bce118ef58b43b6ab295e6272d84668",
489
            "a68cf26cf964423b8ce413bc6c8c5299",
490
            "ed2f736177914d2abb1c2efb6ecce6bb",
491
            "6c2ff22a40b543b6ac26ccd2b7298a61",
492
            "bb5fc1bf3f4c465e8b0846f22e71a23b",
493
            "42cae2119e5e49b9b7250a6f96f373bc",
494
            "8701e3ece5b04773a157dacc8f793374",
495
            "b3b75ce135e049bbacd598eac3d579ce",
496
            "6bb60bf24297418384b709e106c6c71a",
497
            "4b209751747c4ff98d905702b4ba3ab6",
498
            "ca3fcc5229864c2d8030b8e1bce3680a",
499
            "e43a98b2e5ba41a5a483c9320f982960",
500
            "f18eecc689234406a32b478a88379011",
501
            "dc6a98f4481a4d158ffd66d036d9d391",
502
            "c3e8d37c64af4b1eaed0569fd32c3841",
503
            "2cf7de58a08f4a10a0388fd5284adc61",
504
            "3e55c582114c43d19f9a88819739d9a5",
505
            "cdd259b528bf4cd7b1c2f834cec0372d",
506
            "1440bf6528a844f399aea3997b0348ba",
507
            "60af265316074adab78687ac53070910",
508
            "1c9d8afeb2644c65909f6e689e1af0af",
509
            "06d7ce85d9784f58add0583feda74530",
510
            "bcacfb2e6c464423b5e8bc0aef675fdd",
511
            "88c5cc8d66d8408cbe2bfedb365723f3",
512
            "814bac58a4974f70b17b5e19f88b042f",
513
            "3502bced8abc4cfc87300881857c4e08",
514
            "c726307cdc3c4598ad45879f3f29e60c"
515
          ]
516
        },
517
        "id": "3cLg8cYCdv74",
518
        "outputId": "b602a1eb-af6c-4069-a8f0-ee389e86ea38"
519
      },
520
      "outputs": [
521
        {
522
          "output_type": "display_data",
523
          "data": {
524
            "text/plain": [
525
              "VBox(children=(HTML(value='<center> <img\\nsrc=https://huggingface.co/front/assets/huggingface_logo-noborder.sv…"
526
            ],
527
            "application/vnd.jupyter.widget-view+json": {
528
              "version_major": 2,
529
              "version_minor": 0,
530
              "model_id": "96ef5be98b5c4f2c9945b1a8c0989d7b"
531
            }
532
          },
533
          "metadata": {}
534
        }
535
      ],
536
      "source": [
537
        "notebook_login()"
538
      ]
539
    },
540
    {
541
      "cell_type": "code",
542
      "execution_count": 16,
543
      "metadata": {
544
        "id": "GwxKEVnKWWss"
545
      },
546
      "outputs": [],
547
      "source": [
548
        "def create_model_and_tokenizer():\n",
549
        "    bnb_config = BitsAndBytesConfig(\n",
550
        "        load_in_4bit=True,\n",
551
        "        bnb_4bit_use_double_quant=True,\n",
552
        "        bnb_4bit_quant_type=\"nf4\",\n",
553
        "        bnb_4bit_compute_dtype=torch.float16,\n",
554
        "    )\n",
555
        "\n",
556
        "    model = AutoModelForCausalLM.from_pretrained(\n",
557
        "        MODEL_NAME,\n",
558
        "        device_map={\"\":0},\n",
559
        "        trust_remote_code=True,\n",
560
        "        quantization_config=bnb_config\n",
561
        "    )\n",
562
        "\n",
563
        "    tokenizer = AutoTokenizer.from_pretrained(MODEL_NAME)\n",
564
        "    tokenizer.pad_token = tokenizer.eos_token\n",
565
        "\n",
566
        "    return model, tokenizer"
567
      ]
568
    },
569
    {
570
      "cell_type": "code",
571
      "execution_count": 17,
572
      "metadata": {
573
        "colab": {
574
          "base_uri": "https://localhost:8080/",
575
          "height": 473,
576
          "referenced_widgets": [
577
            "ee3793650a24458c8f1c9da6f6cf7930",
578
            "db88e2bb13fa425aaccc2f7a32f2a946",
579
            "9f1b94961d43444697b621f5f2a80392",
580
            "bfa4594314d6437994f2cb57311d97a6",
581
            "dd13edfc70174149b25a15b0858ba61c",
582
            "2e0685af66bb4e52b72b8e0159df3531",
583
            "0d86661bee2d497fa856892c6b6f3f46",
584
            "94916f236b0d4e8a8733871e84df1147",
585
            "97d6e28ba91e45cd899719bb5bc2b6ab",
586
            "118f1b7073b847ef987036cd82499d0b",
587
            "dd77325d1d8d417eb6544ae0cbc15133",
588
            "794c3466fdc34e549aaefbc106537e16",
589
            "cb4a5c788e9d44818ff61e2551ed750e",
590
            "fec4fa9c00d6429791bceeccc053bc05",
591
            "fef1d4090bcf4d77895d45567bb1ff41",
592
            "06a0a6459ff14187acac58481400bf05",
593
            "6caf5b09e0f44382807c41193a2963d3",
594
            "6c95ad4f7ae24185a3fa9dbf9f8f68a2",
595
            "69b2fdbe3a5e4682963987fb914afec5",
596
            "38e5964aa7a744439c7e5ad26c162ead",
597
            "8f1d717eba6942b8aca16cbc49bc6a6f",
598
            "0168b508956141269412e88990ee3d67",
599
            "e8b48f5b7e2b4d8d9407cb667092a3e8",
600
            "8b1317e6869e439092c1d880137f62fd",
601
            "72a199e2dc1b4d63984493e6bf1bdb8c",
602
            "2296ca45af0c4cec80d01fb7e33f278f",
603
            "3dd72eb426fa4e6e919276bb4e91f60f",
604
            "2d01ed4a650c4bcf9d07f020ae98081d",
605
            "51ac6641cd1441998abadc1993d4ef96",
606
            "520db9e6803d48fca60b1063e10cf260",
607
            "677f54e2735f407088724a38212c0171",
608
            "49fd03a8e4954f5caf410898882324c8",
609
            "63e68a09d85a4afd90d125bc61983d7a",
610
            "3672b47a27d64466995731f7475dff05",
611
            "27905804572740018fa7c00a6de8e82d",
612
            "dd8375f821bd4283b3f906aea5c23d07",
613
            "a9f84e0028e440828def8cee6ae317ee",
614
            "0c068bce19d74f7b835c90221a1cde38",
615
            "f9df8cdf043a4aaab82d55f24c17a3d8",
616
            "4efaf38f2eaa46799c2afecb55ccf14c",
617
            "498424778ff94f7ea6e6f32e8cd95868",
618
            "6b654ce3193745208af00288d6f9d5f9",
619
            "681653beca9b4a6591f7008e0ff5ac3b",
620
            "997bd19e08ff48bc92a83487598be156",
621
            "27e56e4591da430fb5f62b5d49df7e9e",
622
            "b90e6e929c164e3384cb0067555f66a4",
623
            "5fb49e2af10d452c9558f6f2b7551b16",
624
            "a6547c497b5b44b59c1de056965de351",
625
            "8732438e1da948e6a4f74cde7a25eb57",
626
            "cdd90757935f45668a81520522e3f057",
627
            "aa2269ddef7f4e66a42973e5fd3e568f",
628
            "a9d745f127214a4289bf880d65899dd3",
629
            "90884fd8a8d24859b4f94aac4041cfe4",
630
            "0fced73c513242fabd2fc4eb30df1e21",
631
            "22d1d55d6580458fb8fdb4af38ec4690",
632
            "a4acb6dc90144e729a615bb9b6e2db55",
633
            "3bc8f617a46e47fb8676ffee9cc25fba",
634
            "fe82a3b74c5b4f79aa367fe5d8f79345",
635
            "387d62eb068e44619908b006079eacd7",
636
            "e6d16b50198a450c876640e34d17140e",
637
            "b4a34fe788034852876cc1886c28042f",
638
            "265d6ad184a74be9b9e8d7378bb98f8d",
639
            "e25b91678ed246cd997cec87e918c079",
640
            "7bf39b13ce4148ca8fe508c73b63e413",
641
            "b0e8f79bf6b74f08801f385b4c7aadee",
642
            "8a8d6a4614e14aaeb03e4bfa9b8a0741",
643
            "f14e8afa14b74002af2be74b84d8b033",
644
            "17cc56f07af34e588c3d3e0cdba0b458",
645
            "9439477ef5b64c1ba5c517d76c2c460f",
646
            "fc8787cef48c4befae588efa56f99adc",
647
            "fd97aec74a1148b0b94de3f2194a0558",
648
            "cf54b45acb1d40d4a34189e76ffa831c",
649
            "1cbd0d65bcf9496c85e07225be76ffdf",
650
            "4689e3a07503492eb11986bf5e8a864f",
651
            "4d443929f61f4991bc88caeb94adaaa3",
652
            "9f60e630e47841ba91855613da83e295",
653
            "12332fa62a8f4b6f974eb37bf8eddaf2",
654
            "e333b53d363b47648ab6694e25b68ad7",
655
            "5e9ebdfb88fa413b88fdf2dd5bc2a3a1",
656
            "058ff0fedb9545199d11930a9aa1deec",
657
            "6996b093bc5a4ba385dfd134f687e8db",
658
            "e1a107dbb4784261b608c382895e7daf",
659
            "73ef312d625542ccaf7994e9300acb1b",
660
            "541a328e5cb84163a1295eeee4494d3f",
661
            "db228a2b64c148d98f5db9bfbf2ac5af",
662
            "85455342596f4e90b98cc41da60b8cb6",
663
            "22b767cd81db4953959e78d71f604dce",
664
            "9fb8334f33e84dc3a4bb3deaf1e7777c",
665
            "f6ee0db62fe14f1e86c972a4a157e315",
666
            "f57698a07edd4a43b0b1f55e0d6b4a02",
667
            "9adaf92c8acf4b7ea94e5591cfe27707",
668
            "f1d7c8a0a78041b184d64a69f7ed0789",
669
            "f4ca5f16039b4258b9c83768d211e757",
670
            "864288a708f545629900a29fb05f3d8b",
671
            "746c0bfc3d90446ca10a16d7838441aa",
672
            "889a67c857fe40c89d0d8e523a66ae08",
673
            "f66ce8552d5d4355b90e934a1c8c04cd",
674
            "0c3a38f76e6841a38f7a0e545c9c4211",
675
            "e75c5a29c59747dda108212a336c7e2c",
676
            "ce6b953129c945c7a7066d0f07385c92",
677
            "6c5a70913c6542be93085a3eefb2b1ce",
678
            "bd5a93537e9d49ec86233397c0ec2a6f",
679
            "36fad39ecf0347079291103b73c3f6dd",
680
            "14f4fc13863648599cef5b830ab1bd9f",
681
            "4212106d48a34279a45890b62879ec87",
682
            "2bee159b595643619607aa10b45c186f",
683
            "c2502539d4eb413da194fae615d6e6bf",
684
            "95ab78e1349d466d90df3390c0a6ceff",
685
            "9ca4b24b9dbb4b5a9af5897c46069c49",
686
            "5e5449f0eda34f29903b59ca07ac189f",
687
            "cae6be4ca33c48acb53cfcad9cbad985",
688
            "985bd9a745764ceab05a8e665eefe591",
689
            "548672800a5b4e5ca72df6d63e01f9d3",
690
            "62b898efd2ed4810bc8bc7de4e7feebf",
691
            "8de7a61d323e4914901a7cf62a916a07",
692
            "9ee95e5cee6d444588116346f6acedf2",
693
            "9baed57a94ed47e493fa23eb65c2526b",
694
            "1f3a418ebb47456ea041d7b5b3cf85d5",
695
            "fc0ff589460d47e5b97f745b748dd136",
696
            "b55ef28dff8b4b14b5b2cbf0438f8e44",
697
            "8be7a69bd51b448da2111a21822b7482"
698
          ]
699
        },
700
        "id": "qDVlGrUmdzdh",
701
        "outputId": "d068211c-3c4f-437e-855e-a4e721997466"
702
      },
703
      "outputs": [
704
        {
705
          "output_type": "display_data",
706
          "data": {
707
            "text/plain": [
708
              "Downloading (…)lve/main/config.json:   0%|          | 0.00/880 [00:00<?, ?B/s]"
709
            ],
710
            "application/vnd.jupyter.widget-view+json": {
711
              "version_major": 2,
712
              "version_minor": 0,
713
              "model_id": "ee3793650a24458c8f1c9da6f6cf7930"
714
            }
715
          },
716
          "metadata": {}
717
        },
718
        {
719
          "output_type": "display_data",
720
          "data": {
721
            "text/plain": [
722
              "Downloading (…)former_sequential.py:   0%|          | 0.00/2.23k [00:00<?, ?B/s]"
723
            ],
724
            "application/vnd.jupyter.widget-view+json": {
725
              "version_major": 2,
726
              "version_minor": 0,
727
              "model_id": "794c3466fdc34e549aaefbc106537e16"
728
            }
729
          },
730
          "metadata": {}
731
        },
732
        {
733
          "output_type": "stream",
734
          "name": "stderr",
735
          "text": [
736
            "A new version of the following files was downloaded from https://huggingface.co/microsoft/phi-1_5:\n",
737
            "- configuration_mixformer_sequential.py\n",
738
            ". Make sure to double-check they do not contain any added malicious code. To avoid downloading new versions of the code file, you can pin a revision.\n"
739
          ]
740
        },
741
        {
742
          "output_type": "display_data",
743
          "data": {
744
            "text/plain": [
745
              "Downloading (…)former_sequential.py:   0%|          | 0.00/32.2k [00:00<?, ?B/s]"
746
            ],
747
            "application/vnd.jupyter.widget-view+json": {
748
              "version_major": 2,
749
              "version_minor": 0,
750
              "model_id": "e8b48f5b7e2b4d8d9407cb667092a3e8"
751
            }
752
          },
753
          "metadata": {}
754
        },
755
        {
756
          "output_type": "stream",
757
          "name": "stderr",
758
          "text": [
759
            "A new version of the following files was downloaded from https://huggingface.co/microsoft/phi-1_5:\n",
760
            "- modeling_mixformer_sequential.py\n",
761
            ". Make sure to double-check they do not contain any added malicious code. To avoid downloading new versions of the code file, you can pin a revision.\n"
762
          ]
763
        },
764
        {
765
          "output_type": "display_data",
766
          "data": {
767
            "text/plain": [
768
              "Downloading pytorch_model.bin:   0%|          | 0.00/2.84G [00:00<?, ?B/s]"
769
            ],
770
            "application/vnd.jupyter.widget-view+json": {
771
              "version_major": 2,
772
              "version_minor": 0,
773
              "model_id": "3672b47a27d64466995731f7475dff05"
774
            }
775
          },
776
          "metadata": {}
777
        },
778
        {
779
          "output_type": "display_data",
780
          "data": {
781
            "text/plain": [
782
              "Downloading (…)neration_config.json:   0%|          | 0.00/69.0 [00:00<?, ?B/s]"
783
            ],
784
            "application/vnd.jupyter.widget-view+json": {
785
              "version_major": 2,
786
              "version_minor": 0,
787
              "model_id": "27e56e4591da430fb5f62b5d49df7e9e"
788
            }
789
          },
790
          "metadata": {}
791
        },
792
        {
793
          "output_type": "display_data",
794
          "data": {
795
            "text/plain": [
796
              "Downloading (…)okenizer_config.json:   0%|          | 0.00/237 [00:00<?, ?B/s]"
797
            ],
798
            "application/vnd.jupyter.widget-view+json": {
799
              "version_major": 2,
800
              "version_minor": 0,
801
              "model_id": "a4acb6dc90144e729a615bb9b6e2db55"
802
            }
803
          },
804
          "metadata": {}
805
        },
806
        {
807
          "output_type": "display_data",
808
          "data": {
809
            "text/plain": [
810
              "Downloading (…)olve/main/vocab.json:   0%|          | 0.00/798k [00:00<?, ?B/s]"
811
            ],
812
            "application/vnd.jupyter.widget-view+json": {
813
              "version_major": 2,
814
              "version_minor": 0,
815
              "model_id": "f14e8afa14b74002af2be74b84d8b033"
816
            }
817
          },
818
          "metadata": {}
819
        },
820
        {
821
          "output_type": "display_data",
822
          "data": {
823
            "text/plain": [
824
              "Downloading (…)olve/main/merges.txt:   0%|          | 0.00/456k [00:00<?, ?B/s]"
825
            ],
826
            "application/vnd.jupyter.widget-view+json": {
827
              "version_major": 2,
828
              "version_minor": 0,
829
              "model_id": "e333b53d363b47648ab6694e25b68ad7"
830
            }
831
          },
832
          "metadata": {}
833
        },
834
        {
835
          "output_type": "display_data",
836
          "data": {
837
            "text/plain": [
838
              "Downloading (…)/main/tokenizer.json:   0%|          | 0.00/2.11M [00:00<?, ?B/s]"
839
            ],
840
            "application/vnd.jupyter.widget-view+json": {
841
              "version_major": 2,
842
              "version_minor": 0,
843
              "model_id": "f6ee0db62fe14f1e86c972a4a157e315"
844
            }
845
          },
846
          "metadata": {}
847
        },
848
        {
849
          "output_type": "display_data",
850
          "data": {
851
            "text/plain": [
852
              "Downloading (…)in/added_tokens.json:   0%|          | 0.00/1.08k [00:00<?, ?B/s]"
853
            ],
854
            "application/vnd.jupyter.widget-view+json": {
855
              "version_major": 2,
856
              "version_minor": 0,
857
              "model_id": "ce6b953129c945c7a7066d0f07385c92"
858
            }
859
          },
860
          "metadata": {}
861
        },
862
        {
863
          "output_type": "display_data",
864
          "data": {
865
            "text/plain": [
866
              "Downloading (…)cial_tokens_map.json:   0%|          | 0.00/99.0 [00:00<?, ?B/s]"
867
            ],
868
            "application/vnd.jupyter.widget-view+json": {
869
              "version_major": 2,
870
              "version_minor": 0,
871
              "model_id": "cae6be4ca33c48acb53cfcad9cbad985"
872
            }
873
          },
874
          "metadata": {}
875
        }
876
      ],
877
      "source": [
878
        "model, tokenizer = create_model_and_tokenizer()\n",
879
        "model.config.use_cache = False"
880
      ]
881
    },
882
    {
883
      "cell_type": "code",
884
      "execution_count": 18,
885
      "metadata": {
886
        "colab": {
887
          "base_uri": "https://localhost:8080/"
888
        },
889
        "id": "DRubXChbe7pL",
890
        "outputId": "41c5c6ca-e714-4cdb-fb33-42be895eb19d"
891
      },
892
      "outputs": [
893
        {
894
          "output_type": "execute_result",
895
          "data": {
896
            "text/plain": [
897
              "{'quant_method': <QuantizationMethod.BITS_AND_BYTES: 'bitsandbytes'>,\n",
898
              " 'load_in_8bit': False,\n",
899
              " 'load_in_4bit': True,\n",
900
              " 'llm_int8_threshold': 6.0,\n",
901
              " 'llm_int8_skip_modules': None,\n",
902
              " 'llm_int8_enable_fp32_cpu_offload': False,\n",
903
              " 'llm_int8_has_fp16_weight': False,\n",
904
              " 'bnb_4bit_quant_type': 'nf4',\n",
905
              " 'bnb_4bit_use_double_quant': True,\n",
906
              " 'bnb_4bit_compute_dtype': 'float16'}"
907
            ]
908
          },
909
          "metadata": {},
910
          "execution_count": 18
911
        }
912
      ],
913
      "source": [
914
        "model.config.quantization_config.to_dict()"
915
      ]
916
    },
917
    {
918
      "cell_type": "code",
919
      "execution_count": 19,
920
      "metadata": {
921
        "id": "1Sj65mDxNeJv"
922
      },
923
      "outputs": [],
924
      "source": [
925
        "peft_config = LoraConfig(\n",
926
        "    r=16,\n",
927
        "    lora_alpha=16,\n",
928
        "    target_modules=[\"Wqkv\", \"out_proj\"],\n",
929
        "    lora_dropout=0.05,\n",
930
        "    bias=\"none\",\n",
931
        "    task_type=\"CAUSAL_LM\"\n",
932
        ")"
933
      ]
934
    },
935
    {
936
      "cell_type": "code",
937
      "source": [
938
        "model = get_peft_model(model, peft_config)\n",
939
        "model.print_trainable_parameters()"
940
      ],
941
      "metadata": {
942
        "colab": {
943
          "base_uri": "https://localhost:8080/"
944
        },
945
        "id": "Vv11jEAJT9Pp",
946
        "outputId": "83cb3d0e-df99-4dad-f46a-cd19fe571130"
947
      },
948
      "execution_count": 20,
949
      "outputs": [
950
        {
951
          "output_type": "stream",
952
          "name": "stdout",
953
          "text": [
954
            "trainable params: 4,718,592 || all params: 1,422,989,312 || trainable%: 0.3315971497613047\n"
955
          ]
956
        }
957
      ]
958
    },
959
    {
960
      "cell_type": "markdown",
961
      "metadata": {
962
        "id": "vVSLIcQl8g9h"
963
      },
964
      "source": [
965
        "## Training"
966
      ]
967
    },
968
    {
969
      "cell_type": "code",
970
      "execution_count": 21,
971
      "metadata": {
972
        "colab": {
973
          "base_uri": "https://localhost:8080/",
974
          "height": 821
975
        },
976
        "id": "0FoXB0psS8hN",
977
        "outputId": "10d07019-3644-4b3f-8eff-230c7dba6af0"
978
      },
979
      "outputs": [
980
        {
981
          "output_type": "display_data",
982
          "data": {
983
            "text/plain": [
984
              "<IPython.core.display.Javascript object>"
985
            ],
986
            "application/javascript": [
987
              "\n",
988
              "        (async () => {\n",
989
              "            const url = new URL(await google.colab.kernel.proxyPort(6006, {'cache': true}));\n",
990
              "            url.searchParams.set('tensorboardColab', 'true');\n",
991
              "            const iframe = document.createElement('iframe');\n",
992
              "            iframe.src = url;\n",
993
              "            iframe.setAttribute('width', '100%');\n",
994
              "            iframe.setAttribute('height', '800');\n",
995
              "            iframe.setAttribute('frameborder', 0);\n",
996
              "            document.body.appendChild(iframe);\n",
997
              "        })();\n",
998
              "    "
999
            ]
1000
          },
1001
          "metadata": {}
1002
        }
1003
      ],
1004
      "source": [
1005
        "OUTPUT_DIR = \"experiments\"\n",
1006
        "\n",
1007
        "%load_ext tensorboard\n",
1008
        "%tensorboard --logdir experiments/runs"
1009
      ]
1010
    },
1011
    {
1012
      "cell_type": "code",
1013
      "execution_count": 22,
1014
      "metadata": {
1015
        "id": "gIoe9TqOof-V"
1016
      },
1017
      "outputs": [],
1018
      "source": [
1019
        "training_arguments = TrainingArguments(\n",
1020
        "        output_dir=\"phi-1_5-finetuned-dialogstudio\",\n",
1021
        "        per_device_train_batch_size=4,\n",
1022
        "        gradient_accumulation_steps=1,\n",
1023
        "        learning_rate=2e-4,\n",
1024
        "        lr_scheduler_type=\"cosine\",\n",
1025
        "        save_strategy=\"epoch\",\n",
1026
        "        logging_steps=1,\n",
1027
        "        max_steps=3,\n",
1028
        "        num_train_epochs=1,\n",
1029
        "        push_to_hub=True\n",
1030
        "    )"
1031
      ]
1032
    },
1033
    {
1034
      "cell_type": "code",
1035
      "execution_count": 25,
1036
      "metadata": {
1037
        "colab": {
1038
          "base_uri": "https://localhost:8080/"
1039
        },
1040
        "id": "ZL4Qa_cypL1f",
1041
        "outputId": "7d3c3821-8395-407c-8f95-1dbd1d479efb"
1042
      },
1043
      "outputs": [
1044
        {
1045
          "output_type": "stream",
1046
          "name": "stderr",
1047
          "text": [
1048
            "/usr/local/lib/python3.10/dist-packages/trl/trainer/sft_trainer.py:166: UserWarning: You didn't pass a `max_seq_length` argument to the SFTTrainer, this will default to 1024\n",
1049
            "  warnings.warn(\n"
1050
          ]
1051
        }
1052
      ],
1053
      "source": [
1054
        "trainer = SFTTrainer(\n",
1055
        "    model=model,\n",
1056
        "    train_dataset=dataset[\"train\"],\n",
1057
        "    eval_dataset=dataset[\"validation\"],\n",
1058
        "    peft_config=peft_config,\n",
1059
        "    dataset_text_field=\"text\",\n",
1060
        "    tokenizer=tokenizer,\n",
1061
        "    args=training_arguments,\n",
1062
        ")"
1063
      ]
1064
    },
1065
    {
1066
      "cell_type": "code",
1067
      "source": [
1068
        "trainer.train()"
1069
      ],
1070
      "metadata": {
1071
        "colab": {
1072
          "base_uri": "https://localhost:8080/",
1073
          "height": 241
1074
        },
1075
        "id": "y7LDwR6kJdkO",
1076
        "outputId": "e22ee88f-7c55-4251-8a3e-22bf75e5c777"
1077
      },
1078
      "execution_count": 26,
1079
      "outputs": [
1080
        {
1081
          "output_type": "stream",
1082
          "name": "stderr",
1083
          "text": [
1084
            "You're using a CodeGenTokenizerFast tokenizer. Please note that with a fast tokenizer, using the `__call__` method is faster than using a method to encode the text followed by a call to the `pad` method to get a padded encoding.\n"
1085
          ]
1086
        },
1087
        {
1088
          "output_type": "display_data",
1089
          "data": {
1090
            "text/plain": [
1091
              "<IPython.core.display.HTML object>"
1092
            ],
1093
            "text/html": [
1094
              "\n",
1095
              "    <div>\n",
1096
              "      \n",
1097
              "      <progress value='3' max='3' style='width:300px; height:20px; vertical-align: middle;'></progress>\n",
1098
              "      [3/3 00:02, Epoch 0/1]\n",
1099
              "    </div>\n",
1100
              "    <table border=\"1\" class=\"dataframe\">\n",
1101
              "  <thead>\n",
1102
              " <tr style=\"text-align: left;\">\n",
1103
              "      <th>Step</th>\n",
1104
              "      <th>Training Loss</th>\n",
1105
              "    </tr>\n",
1106
              "  </thead>\n",
1107
              "  <tbody>\n",
1108
              "    <tr>\n",
1109
              "      <td>1</td>\n",
1110
              "      <td>3.080800</td>\n",
1111
              "    </tr>\n",
1112
              "    <tr>\n",
1113
              "      <td>2</td>\n",
1114
              "      <td>2.887100</td>\n",
1115
              "    </tr>\n",
1116
              "    <tr>\n",
1117
              "      <td>3</td>\n",
1118
              "      <td>3.302700</td>\n",
1119
              "    </tr>\n",
1120
              "  </tbody>\n",
1121
              "</table><p>"
1122
            ]
1123
          },
1124
          "metadata": {}
1125
        },
1126
        {
1127
          "output_type": "execute_result",
1128
          "data": {
1129
            "text/plain": [
1130
              "TrainOutput(global_step=3, training_loss=3.090197483698527, metrics={'train_runtime': 7.7717, 'train_samples_per_second': 1.544, 'train_steps_per_second': 0.386, 'total_flos': 22418657574912.0, 'train_loss': 3.090197483698527, 'epoch': 0.01})"
1131
            ]
1132
          },
1133
          "metadata": {},
1134
          "execution_count": 26
1135
        }
1136
      ]
1137
    },
1138
    {
1139
      "cell_type": "code",
1140
      "source": [
1141
        "trainer.evaluate()"
1142
      ],
1143
      "metadata": {
1144
        "colab": {
1145
          "base_uri": "https://localhost:8080/",
1146
          "height": 124
1147
        },
1148
        "id": "IRiQABpzeom6",
1149
        "outputId": "4e1c2f58-5f5f-4322-86a7-6df3a779223a"
1150
      },
1151
      "execution_count": 27,
1152
      "outputs": [
1153
        {
1154
          "output_type": "display_data",
1155
          "data": {
1156
            "text/plain": [
1157
              "<IPython.core.display.HTML object>"
1158
            ],
1159
            "text/html": [
1160
              "\n",
1161
              "    <div>\n",
1162
              "      \n",
1163
              "      <progress value='14' max='14' style='width:300px; height:20px; vertical-align: middle;'></progress>\n",
1164
              "      [14/14 00:11]\n",
1165
              "    </div>\n",
1166
              "    "
1167
            ]
1168
          },
1169
          "metadata": {}
1170
        },
1171
        {
1172
          "output_type": "execute_result",
1173
          "data": {
1174
            "text/plain": [
1175
              "{'eval_loss': 3.243016242980957,\n",
1176
              " 'eval_runtime': 12.0781,\n",
1177
              " 'eval_samples_per_second': 9.107,\n",
1178
              " 'eval_steps_per_second': 1.159,\n",
1179
              " 'epoch': 0.01}"
1180
            ]
1181
          },
1182
          "metadata": {},
1183
          "execution_count": 27
1184
        }
1185
      ]
1186
    },
1187
    {
1188
      "cell_type": "code",
1189
      "source": [
1190
        "trainer.push_to_hub()"
1191
      ],
1192
      "metadata": {
1193
        "colab": {
1194
          "base_uri": "https://localhost:8080/",
1195
          "height": 35
1196
        },
1197
        "id": "ZCBJa6mZaSv7",
1198
        "outputId": "7111feef-c4e3-4330-b291-437c19c41c33"
1199
      },
1200
      "execution_count": 28,
1201
      "outputs": [
1202
        {
1203
          "output_type": "execute_result",
1204
          "data": {
1205
            "text/plain": [
1206
              "'https://huggingface.co/ashishpatel26/phi-1_5-finetuned-dialogstudio/tree/main/'"
1207
            ],
1208
            "application/vnd.google.colaboratory.intrinsic+json": {
1209
              "type": "string"
1210
            }
1211
          },
1212
          "metadata": {},
1213
          "execution_count": 28
1214
        }
1215
      ]
1216
    },
1217
    {
1218
      "cell_type": "code",
1219
      "source": [
1220
        "trainer.save_model(\"phi-1_5-finetuned-dialogstudio\")"
1221
      ],
1222
      "metadata": {
1223
        "id": "jJdkDvxKOq8P"
1224
      },
1225
      "execution_count": 30,
1226
      "outputs": []
1227
    },
1228
    {
1229
      "cell_type": "code",
1230
      "execution_count": 30,
1231
      "metadata": {
1232
        "colab": {
1233
          "base_uri": "https://localhost:8080/"
1234
        },
1235
        "id": "WywDQRmGEVOJ",
1236
        "outputId": "acdd8465-32e1-4fc1-ad75-06831edf8d85"
1237
      },
1238
      "outputs": [
1239
        {
1240
          "output_type": "execute_result",
1241
          "data": {
1242
            "text/plain": [
1243
              "PeftModelForCausalLM(\n",
1244
              "  (base_model): LoraModel(\n",
1245
              "    (model): MixFormerSequentialForCausalLM(\n",
1246
              "      (layers): Sequential(\n",
1247
              "        (0): Embedding(\n",
1248
              "          (wte): Embedding(51200, 2048)\n",
1249
              "          (drop): Dropout(p=0.0, inplace=False)\n",
1250
              "        )\n",
1251
              "        (1): ParallelBlock(\n",
1252
              "          (ln): LayerNorm((2048,), eps=1e-05, elementwise_affine=True)\n",
1253
              "          (resid_dropout): Dropout(p=0.0, inplace=False)\n",
1254
              "          (mixer): MHA(\n",
1255
              "            (rotary_emb): RotaryEmbedding()\n",
1256
              "            (Wqkv): Linear4bit(\n",
1257
              "              in_features=2048, out_features=6144, bias=True\n",
1258
              "              (lora_dropout): ModuleDict(\n",
1259
              "                (default): Dropout(p=0.05, inplace=False)\n",
1260
              "              )\n",
1261
              "              (lora_A): ModuleDict(\n",
1262
              "                (default): Linear(in_features=2048, out_features=16, bias=False)\n",
1263
              "              )\n",
1264
              "              (lora_B): ModuleDict(\n",
1265
              "                (default): Linear(in_features=16, out_features=6144, bias=False)\n",
1266
              "              )\n",
1267
              "              (lora_embedding_A): ParameterDict()\n",
1268
              "              (lora_embedding_B): ParameterDict()\n",
1269
              "            )\n",
1270
              "            (out_proj): Linear4bit(\n",
1271
              "              in_features=2048, out_features=2048, bias=True\n",
1272
              "              (lora_dropout): ModuleDict(\n",
1273
              "                (default): Dropout(p=0.05, inplace=False)\n",
1274
              "              )\n",
1275
              "              (lora_A): ModuleDict(\n",
1276
              "                (default): Linear(in_features=2048, out_features=16, bias=False)\n",
1277
              "              )\n",
1278
              "              (lora_B): ModuleDict(\n",
1279
              "                (default): Linear(in_features=16, out_features=2048, bias=False)\n",
1280
              "              )\n",
1281
              "              (lora_embedding_A): ParameterDict()\n",
1282
              "              (lora_embedding_B): ParameterDict()\n",
1283
              "            )\n",
1284
              "            (inner_attn): SelfAttention(\n",
1285
              "              (drop): Dropout(p=0.0, inplace=False)\n",
1286
              "            )\n",
1287
              "            (inner_cross_attn): CrossAttention(\n",
1288
              "              (drop): Dropout(p=0.0, inplace=False)\n",
1289
              "            )\n",
1290
              "          )\n",
1291
              "          (mlp): MLP(\n",
1292
              "            (fc1): Linear4bit(in_features=2048, out_features=8192, bias=True)\n",
1293
              "            (fc2): Linear4bit(in_features=8192, out_features=2048, bias=True)\n",
1294
              "            (act): NewGELUActivation()\n",
1295
              "          )\n",
1296
              "        )\n",
1297
              "        (2): ParallelBlock(\n",
1298
              "          (ln): LayerNorm((2048,), eps=1e-05, elementwise_affine=True)\n",
1299
              "          (resid_dropout): Dropout(p=0.0, inplace=False)\n",
1300
              "          (mixer): MHA(\n",
1301
              "            (rotary_emb): RotaryEmbedding()\n",
1302
              "            (Wqkv): Linear4bit(\n",
1303
              "              in_features=2048, out_features=6144, bias=True\n",
1304
              "              (lora_dropout): ModuleDict(\n",
1305
              "                (default): Dropout(p=0.05, inplace=False)\n",
1306
              "              )\n",
1307
              "              (lora_A): ModuleDict(\n",
1308
              "                (default): Linear(in_features=2048, out_features=16, bias=False)\n",
1309
              "              )\n",
1310
              "              (lora_B): ModuleDict(\n",
1311
              "                (default): Linear(in_features=16, out_features=6144, bias=False)\n",
1312
              "              )\n",
1313
              "              (lora_embedding_A): ParameterDict()\n",
1314
              "              (lora_embedding_B): ParameterDict()\n",
1315
              "            )\n",
1316
              "            (out_proj): Linear4bit(\n",
1317
              "              in_features=2048, out_features=2048, bias=True\n",
1318
              "              (lora_dropout): ModuleDict(\n",
1319
              "                (default): Dropout(p=0.05, inplace=False)\n",
1320
              "              )\n",
1321
              "              (lora_A): ModuleDict(\n",
1322
              "                (default): Linear(in_features=2048, out_features=16, bias=False)\n",
1323
              "              )\n",
1324
              "              (lora_B): ModuleDict(\n",
1325
              "                (default): Linear(in_features=16, out_features=2048, bias=False)\n",
1326
              "              )\n",
1327
              "              (lora_embedding_A): ParameterDict()\n",
1328
              "              (lora_embedding_B): ParameterDict()\n",
1329
              "            )\n",
1330
              "            (inner_attn): SelfAttention(\n",
1331
              "              (drop): Dropout(p=0.0, inplace=False)\n",
1332
              "            )\n",
1333
              "            (inner_cross_attn): CrossAttention(\n",
1334
              "              (drop): Dropout(p=0.0, inplace=False)\n",
1335
              "            )\n",
1336
              "          )\n",
1337
              "          (mlp): MLP(\n",
1338
              "            (fc1): Linear4bit(in_features=2048, out_features=8192, bias=True)\n",
1339
              "            (fc2): Linear4bit(in_features=8192, out_features=2048, bias=True)\n",
1340
              "            (act): NewGELUActivation()\n",
1341
              "          )\n",
1342
              "        )\n",
1343
              "        (3): ParallelBlock(\n",
1344
              "          (ln): LayerNorm((2048,), eps=1e-05, elementwise_affine=True)\n",
1345
              "          (resid_dropout): Dropout(p=0.0, inplace=False)\n",
1346
              "          (mixer): MHA(\n",
1347
              "            (rotary_emb): RotaryEmbedding()\n",
1348
              "            (Wqkv): Linear4bit(\n",
1349
              "              in_features=2048, out_features=6144, bias=True\n",
1350
              "              (lora_dropout): ModuleDict(\n",
1351
              "                (default): Dropout(p=0.05, inplace=False)\n",
1352
              "              )\n",
1353
              "              (lora_A): ModuleDict(\n",
1354
              "                (default): Linear(in_features=2048, out_features=16, bias=False)\n",
1355
              "              )\n",
1356
              "              (lora_B): ModuleDict(\n",
1357
              "                (default): Linear(in_features=16, out_features=6144, bias=False)\n",
1358
              "              )\n",
1359
              "              (lora_embedding_A): ParameterDict()\n",
1360
              "              (lora_embedding_B): ParameterDict()\n",
1361
              "            )\n",
1362
              "            (out_proj): Linear4bit(\n",
1363
              "              in_features=2048, out_features=2048, bias=True\n",
1364
              "              (lora_dropout): ModuleDict(\n",
1365
              "                (default): Dropout(p=0.05, inplace=False)\n",
1366
              "              )\n",
1367
              "              (lora_A): ModuleDict(\n",
1368
              "                (default): Linear(in_features=2048, out_features=16, bias=False)\n",
1369
              "              )\n",
1370
              "              (lora_B): ModuleDict(\n",
1371
              "                (default): Linear(in_features=16, out_features=2048, bias=False)\n",
1372
              "              )\n",
1373
              "              (lora_embedding_A): ParameterDict()\n",
1374
              "              (lora_embedding_B): ParameterDict()\n",
1375
              "            )\n",
1376
              "            (inner_attn): SelfAttention(\n",
1377
              "              (drop): Dropout(p=0.0, inplace=False)\n",
1378
              "            )\n",
1379
              "            (inner_cross_attn): CrossAttention(\n",
1380
              "              (drop): Dropout(p=0.0, inplace=False)\n",
1381
              "            )\n",
1382
              "          )\n",
1383
              "          (mlp): MLP(\n",
1384
              "            (fc1): Linear4bit(in_features=2048, out_features=8192, bias=True)\n",
1385
              "            (fc2): Linear4bit(in_features=8192, out_features=2048, bias=True)\n",
1386
              "            (act): NewGELUActivation()\n",
1387
              "          )\n",
1388
              "        )\n",
1389
              "        (4): ParallelBlock(\n",
1390
              "          (ln): LayerNorm((2048,), eps=1e-05, elementwise_affine=True)\n",
1391
              "          (resid_dropout): Dropout(p=0.0, inplace=False)\n",
1392
              "          (mixer): MHA(\n",
1393
              "            (rotary_emb): RotaryEmbedding()\n",
1394
              "            (Wqkv): Linear4bit(\n",
1395
              "              in_features=2048, out_features=6144, bias=True\n",
1396
              "              (lora_dropout): ModuleDict(\n",
1397
              "                (default): Dropout(p=0.05, inplace=False)\n",
1398
              "              )\n",
1399
              "              (lora_A): ModuleDict(\n",
1400
              "                (default): Linear(in_features=2048, out_features=16, bias=False)\n",
1401
              "              )\n",
1402
              "              (lora_B): ModuleDict(\n",
1403
              "                (default): Linear(in_features=16, out_features=6144, bias=False)\n",
1404
              "              )\n",
1405
              "              (lora_embedding_A): ParameterDict()\n",
1406
              "              (lora_embedding_B): ParameterDict()\n",
1407
              "            )\n",
1408
              "            (out_proj): Linear4bit(\n",
1409
              "              in_features=2048, out_features=2048, bias=True\n",
1410
              "              (lora_dropout): ModuleDict(\n",
1411
              "                (default): Dropout(p=0.05, inplace=False)\n",
1412
              "              )\n",
1413
              "              (lora_A): ModuleDict(\n",
1414
              "                (default): Linear(in_features=2048, out_features=16, bias=False)\n",
1415
              "              )\n",
1416
              "              (lora_B): ModuleDict(\n",
1417
              "                (default): Linear(in_features=16, out_features=2048, bias=False)\n",
1418
              "              )\n",
1419
              "              (lora_embedding_A): ParameterDict()\n",
1420
              "              (lora_embedding_B): ParameterDict()\n",
1421
              "            )\n",
1422
              "            (inner_attn): SelfAttention(\n",
1423
              "              (drop): Dropout(p=0.0, inplace=False)\n",
1424
              "            )\n",
1425
              "            (inner_cross_attn): CrossAttention(\n",
1426
              "              (drop): Dropout(p=0.0, inplace=False)\n",
1427
              "            )\n",
1428
              "          )\n",
1429
              "          (mlp): MLP(\n",
1430
              "            (fc1): Linear4bit(in_features=2048, out_features=8192, bias=True)\n",
1431
              "            (fc2): Linear4bit(in_features=8192, out_features=2048, bias=True)\n",
1432
              "            (act): NewGELUActivation()\n",
1433
              "          )\n",
1434
              "        )\n",
1435
              "        (5): ParallelBlock(\n",
1436
              "          (ln): LayerNorm((2048,), eps=1e-05, elementwise_affine=True)\n",
1437
              "          (resid_dropout): Dropout(p=0.0, inplace=False)\n",
1438
              "          (mixer): MHA(\n",
1439
              "            (rotary_emb): RotaryEmbedding()\n",
1440
              "            (Wqkv): Linear4bit(\n",
1441
              "              in_features=2048, out_features=6144, bias=True\n",
1442
              "              (lora_dropout): ModuleDict(\n",
1443
              "                (default): Dropout(p=0.05, inplace=False)\n",
1444
              "              )\n",
1445
              "              (lora_A): ModuleDict(\n",
1446
              "                (default): Linear(in_features=2048, out_features=16, bias=False)\n",
1447
              "              )\n",
1448
              "              (lora_B): ModuleDict(\n",
1449
              "                (default): Linear(in_features=16, out_features=6144, bias=False)\n",
1450
              "              )\n",
1451
              "              (lora_embedding_A): ParameterDict()\n",
1452
              "              (lora_embedding_B): ParameterDict()\n",
1453
              "            )\n",
1454
              "            (out_proj): Linear4bit(\n",
1455
              "              in_features=2048, out_features=2048, bias=True\n",
1456
              "              (lora_dropout): ModuleDict(\n",
1457
              "                (default): Dropout(p=0.05, inplace=False)\n",
1458
              "              )\n",
1459
              "              (lora_A): ModuleDict(\n",
1460
              "                (default): Linear(in_features=2048, out_features=16, bias=False)\n",
1461
              "              )\n",
1462
              "              (lora_B): ModuleDict(\n",
1463
              "                (default): Linear(in_features=16, out_features=2048, bias=False)\n",
1464
              "              )\n",
1465
              "              (lora_embedding_A): ParameterDict()\n",
1466
              "              (lora_embedding_B): ParameterDict()\n",
1467
              "            )\n",
1468
              "            (inner_attn): SelfAttention(\n",
1469
              "              (drop): Dropout(p=0.0, inplace=False)\n",
1470
              "            )\n",
1471
              "            (inner_cross_attn): CrossAttention(\n",
1472
              "              (drop): Dropout(p=0.0, inplace=False)\n",
1473
              "            )\n",
1474
              "          )\n",
1475
              "          (mlp): MLP(\n",
1476
              "            (fc1): Linear4bit(in_features=2048, out_features=8192, bias=True)\n",
1477
              "            (fc2): Linear4bit(in_features=8192, out_features=2048, bias=True)\n",
1478
              "            (act): NewGELUActivation()\n",
1479
              "          )\n",
1480
              "        )\n",
1481
              "        (6): ParallelBlock(\n",
1482
              "          (ln): LayerNorm((2048,), eps=1e-05, elementwise_affine=True)\n",
1483
              "          (resid_dropout): Dropout(p=0.0, inplace=False)\n",
1484
              "          (mixer): MHA(\n",
1485
              "            (rotary_emb): RotaryEmbedding()\n",
1486
              "            (Wqkv): Linear4bit(\n",
1487
              "              in_features=2048, out_features=6144, bias=True\n",
1488
              "              (lora_dropout): ModuleDict(\n",
1489
              "                (default): Dropout(p=0.05, inplace=False)\n",
1490
              "              )\n",
1491
              "              (lora_A): ModuleDict(\n",
1492
              "                (default): Linear(in_features=2048, out_features=16, bias=False)\n",
1493
              "              )\n",
1494
              "              (lora_B): ModuleDict(\n",
1495
              "                (default): Linear(in_features=16, out_features=6144, bias=False)\n",
1496
              "              )\n",
1497
              "              (lora_embedding_A): ParameterDict()\n",
1498
              "              (lora_embedding_B): ParameterDict()\n",
1499
              "            )\n",
1500
              "            (out_proj): Linear4bit(\n",
1501
              "              in_features=2048, out_features=2048, bias=True\n",
1502
              "              (lora_dropout): ModuleDict(\n",
1503
              "                (default): Dropout(p=0.05, inplace=False)\n",
1504
              "              )\n",
1505
              "              (lora_A): ModuleDict(\n",
1506
              "                (default): Linear(in_features=2048, out_features=16, bias=False)\n",
1507
              "              )\n",
1508
              "              (lora_B): ModuleDict(\n",
1509
              "                (default): Linear(in_features=16, out_features=2048, bias=False)\n",
1510
              "              )\n",
1511
              "              (lora_embedding_A): ParameterDict()\n",
1512
              "              (lora_embedding_B): ParameterDict()\n",
1513
              "            )\n",
1514
              "            (inner_attn): SelfAttention(\n",
1515
              "              (drop): Dropout(p=0.0, inplace=False)\n",
1516
              "            )\n",
1517
              "            (inner_cross_attn): CrossAttention(\n",
1518
              "              (drop): Dropout(p=0.0, inplace=False)\n",
1519
              "            )\n",
1520
              "          )\n",
1521
              "          (mlp): MLP(\n",
1522
              "            (fc1): Linear4bit(in_features=2048, out_features=8192, bias=True)\n",
1523
              "            (fc2): Linear4bit(in_features=8192, out_features=2048, bias=True)\n",
1524
              "            (act): NewGELUActivation()\n",
1525
              "          )\n",
1526
              "        )\n",
1527
              "        (7): ParallelBlock(\n",
1528
              "          (ln): LayerNorm((2048,), eps=1e-05, elementwise_affine=True)\n",
1529
              "          (resid_dropout): Dropout(p=0.0, inplace=False)\n",
1530
              "          (mixer): MHA(\n",
1531
              "            (rotary_emb): RotaryEmbedding()\n",
1532
              "            (Wqkv): Linear4bit(\n",
1533
              "              in_features=2048, out_features=6144, bias=True\n",
1534
              "              (lora_dropout): ModuleDict(\n",
1535
              "                (default): Dropout(p=0.05, inplace=False)\n",
1536
              "              )\n",
1537
              "              (lora_A): ModuleDict(\n",
1538
              "                (default): Linear(in_features=2048, out_features=16, bias=False)\n",
1539
              "              )\n",
1540
              "              (lora_B): ModuleDict(\n",
1541
              "                (default): Linear(in_features=16, out_features=6144, bias=False)\n",
1542
              "              )\n",
1543
              "              (lora_embedding_A): ParameterDict()\n",
1544
              "              (lora_embedding_B): ParameterDict()\n",
1545
              "            )\n",
1546
              "            (out_proj): Linear4bit(\n",
1547
              "              in_features=2048, out_features=2048, bias=True\n",
1548
              "              (lora_dropout): ModuleDict(\n",
1549
              "                (default): Dropout(p=0.05, inplace=False)\n",
1550
              "              )\n",
1551
              "              (lora_A): ModuleDict(\n",
1552
              "                (default): Linear(in_features=2048, out_features=16, bias=False)\n",
1553
              "              )\n",
1554
              "              (lora_B): ModuleDict(\n",
1555
              "                (default): Linear(in_features=16, out_features=2048, bias=False)\n",
1556
              "              )\n",
1557
              "              (lora_embedding_A): ParameterDict()\n",
1558
              "              (lora_embedding_B): ParameterDict()\n",
1559
              "            )\n",
1560
              "            (inner_attn): SelfAttention(\n",
1561
              "              (drop): Dropout(p=0.0, inplace=False)\n",
1562
              "            )\n",
1563
              "            (inner_cross_attn): CrossAttention(\n",
1564
              "              (drop): Dropout(p=0.0, inplace=False)\n",
1565
              "            )\n",
1566
              "          )\n",
1567
              "          (mlp): MLP(\n",
1568
              "            (fc1): Linear4bit(in_features=2048, out_features=8192, bias=True)\n",
1569
              "            (fc2): Linear4bit(in_features=8192, out_features=2048, bias=True)\n",
1570
              "            (act): NewGELUActivation()\n",
1571
              "          )\n",
1572
              "        )\n",
1573
              "        (8): ParallelBlock(\n",
1574
              "          (ln): LayerNorm((2048,), eps=1e-05, elementwise_affine=True)\n",
1575
              "          (resid_dropout): Dropout(p=0.0, inplace=False)\n",
1576
              "          (mixer): MHA(\n",
1577
              "            (rotary_emb): RotaryEmbedding()\n",
1578
              "            (Wqkv): Linear4bit(\n",
1579
              "              in_features=2048, out_features=6144, bias=True\n",
1580
              "              (lora_dropout): ModuleDict(\n",
1581
              "                (default): Dropout(p=0.05, inplace=False)\n",
1582
              "              )\n",
1583
              "              (lora_A): ModuleDict(\n",
1584
              "                (default): Linear(in_features=2048, out_features=16, bias=False)\n",
1585
              "              )\n",
1586
              "              (lora_B): ModuleDict(\n",
1587
              "                (default): Linear(in_features=16, out_features=6144, bias=False)\n",
1588
              "              )\n",
1589
              "              (lora_embedding_A): ParameterDict()\n",
1590
              "              (lora_embedding_B): ParameterDict()\n",
1591
              "            )\n",
1592
              "            (out_proj): Linear4bit(\n",
1593
              "              in_features=2048, out_features=2048, bias=True\n",
1594
              "              (lora_dropout): ModuleDict(\n",
1595
              "                (default): Dropout(p=0.05, inplace=False)\n",
1596
              "              )\n",
1597
              "              (lora_A): ModuleDict(\n",
1598
              "                (default): Linear(in_features=2048, out_features=16, bias=False)\n",
1599
              "              )\n",
1600
              "              (lora_B): ModuleDict(\n",
1601
              "                (default): Linear(in_features=16, out_features=2048, bias=False)\n",
1602
              "              )\n",
1603
              "              (lora_embedding_A): ParameterDict()\n",
1604
              "              (lora_embedding_B): ParameterDict()\n",
1605
              "            )\n",
1606
              "            (inner_attn): SelfAttention(\n",
1607
              "              (drop): Dropout(p=0.0, inplace=False)\n",
1608
              "            )\n",
1609
              "            (inner_cross_attn): CrossAttention(\n",
1610
              "              (drop): Dropout(p=0.0, inplace=False)\n",
1611
              "            )\n",
1612
              "          )\n",
1613
              "          (mlp): MLP(\n",
1614
              "            (fc1): Linear4bit(in_features=2048, out_features=8192, bias=True)\n",
1615
              "            (fc2): Linear4bit(in_features=8192, out_features=2048, bias=True)\n",
1616
              "            (act): NewGELUActivation()\n",
1617
              "          )\n",
1618
              "        )\n",
1619
              "        (9): ParallelBlock(\n",
1620
              "          (ln): LayerNorm((2048,), eps=1e-05, elementwise_affine=True)\n",
1621
              "          (resid_dropout): Dropout(p=0.0, inplace=False)\n",
1622
              "          (mixer): MHA(\n",
1623
              "            (rotary_emb): RotaryEmbedding()\n",
1624
              "            (Wqkv): Linear4bit(\n",
1625
              "              in_features=2048, out_features=6144, bias=True\n",
1626
              "              (lora_dropout): ModuleDict(\n",
1627
              "                (default): Dropout(p=0.05, inplace=False)\n",
1628
              "              )\n",
1629
              "              (lora_A): ModuleDict(\n",
1630
              "                (default): Linear(in_features=2048, out_features=16, bias=False)\n",
1631
              "              )\n",
1632
              "              (lora_B): ModuleDict(\n",
1633
              "                (default): Linear(in_features=16, out_features=6144, bias=False)\n",
1634
              "              )\n",
1635
              "              (lora_embedding_A): ParameterDict()\n",
1636
              "              (lora_embedding_B): ParameterDict()\n",
1637
              "            )\n",
1638
              "            (out_proj): Linear4bit(\n",
1639
              "              in_features=2048, out_features=2048, bias=True\n",
1640
              "              (lora_dropout): ModuleDict(\n",
1641
              "                (default): Dropout(p=0.05, inplace=False)\n",
1642
              "              )\n",
1643
              "              (lora_A): ModuleDict(\n",
1644
              "                (default): Linear(in_features=2048, out_features=16, bias=False)\n",
1645
              "              )\n",
1646
              "              (lora_B): ModuleDict(\n",
1647
              "                (default): Linear(in_features=16, out_features=2048, bias=False)\n",
1648
              "              )\n",
1649
              "              (lora_embedding_A): ParameterDict()\n",
1650
              "              (lora_embedding_B): ParameterDict()\n",
1651
              "            )\n",
1652
              "            (inner_attn): SelfAttention(\n",
1653
              "              (drop): Dropout(p=0.0, inplace=False)\n",
1654
              "            )\n",
1655
              "            (inner_cross_attn): CrossAttention(\n",
1656
              "              (drop): Dropout(p=0.0, inplace=False)\n",
1657
              "            )\n",
1658
              "          )\n",
1659
              "          (mlp): MLP(\n",
1660
              "            (fc1): Linear4bit(in_features=2048, out_features=8192, bias=True)\n",
1661
              "            (fc2): Linear4bit(in_features=8192, out_features=2048, bias=True)\n",
1662
              "            (act): NewGELUActivation()\n",
1663
              "          )\n",
1664
              "        )\n",
1665
              "        (10): ParallelBlock(\n",
1666
              "          (ln): LayerNorm((2048,), eps=1e-05, elementwise_affine=True)\n",
1667
              "          (resid_dropout): Dropout(p=0.0, inplace=False)\n",
1668
              "          (mixer): MHA(\n",
1669
              "            (rotary_emb): RotaryEmbedding()\n",
1670
              "            (Wqkv): Linear4bit(\n",
1671
              "              in_features=2048, out_features=6144, bias=True\n",
1672
              "              (lora_dropout): ModuleDict(\n",
1673
              "                (default): Dropout(p=0.05, inplace=False)\n",
1674
              "              )\n",
1675
              "              (lora_A): ModuleDict(\n",
1676
              "                (default): Linear(in_features=2048, out_features=16, bias=False)\n",
1677
              "              )\n",
1678
              "              (lora_B): ModuleDict(\n",
1679
              "                (default): Linear(in_features=16, out_features=6144, bias=False)\n",
1680
              "              )\n",
1681
              "              (lora_embedding_A): ParameterDict()\n",
1682
              "              (lora_embedding_B): ParameterDict()\n",
1683
              "            )\n",
1684
              "            (out_proj): Linear4bit(\n",
1685
              "              in_features=2048, out_features=2048, bias=True\n",
1686
              "              (lora_dropout): ModuleDict(\n",
1687
              "                (default): Dropout(p=0.05, inplace=False)\n",
1688
              "              )\n",
1689
              "              (lora_A): ModuleDict(\n",
1690
              "                (default): Linear(in_features=2048, out_features=16, bias=False)\n",
1691
              "              )\n",
1692
              "              (lora_B): ModuleDict(\n",
1693
              "                (default): Linear(in_features=16, out_features=2048, bias=False)\n",
1694
              "              )\n",
1695
              "              (lora_embedding_A): ParameterDict()\n",
1696
              "              (lora_embedding_B): ParameterDict()\n",
1697
              "            )\n",
1698
              "            (inner_attn): SelfAttention(\n",
1699
              "              (drop): Dropout(p=0.0, inplace=False)\n",
1700
              "            )\n",
1701
              "            (inner_cross_attn): CrossAttention(\n",
1702
              "              (drop): Dropout(p=0.0, inplace=False)\n",
1703
              "            )\n",
1704
              "          )\n",
1705
              "          (mlp): MLP(\n",
1706
              "            (fc1): Linear4bit(in_features=2048, out_features=8192, bias=True)\n",
1707
              "            (fc2): Linear4bit(in_features=8192, out_features=2048, bias=True)\n",
1708
              "            (act): NewGELUActivation()\n",
1709
              "          )\n",
1710
              "        )\n",
1711
              "        (11): ParallelBlock(\n",
1712
              "          (ln): LayerNorm((2048,), eps=1e-05, elementwise_affine=True)\n",
1713
              "          (resid_dropout): Dropout(p=0.0, inplace=False)\n",
1714
              "          (mixer): MHA(\n",
1715
              "            (rotary_emb): RotaryEmbedding()\n",
1716
              "            (Wqkv): Linear4bit(\n",
1717
              "              in_features=2048, out_features=6144, bias=True\n",
1718
              "              (lora_dropout): ModuleDict(\n",
1719
              "                (default): Dropout(p=0.05, inplace=False)\n",
1720
              "              )\n",
1721
              "              (lora_A): ModuleDict(\n",
1722
              "                (default): Linear(in_features=2048, out_features=16, bias=False)\n",
1723
              "              )\n",
1724
              "              (lora_B): ModuleDict(\n",
1725
              "                (default): Linear(in_features=16, out_features=6144, bias=False)\n",
1726
              "              )\n",
1727
              "              (lora_embedding_A): ParameterDict()\n",
1728
              "              (lora_embedding_B): ParameterDict()\n",
1729
              "            )\n",
1730
              "            (out_proj): Linear4bit(\n",
1731
              "              in_features=2048, out_features=2048, bias=True\n",
1732
              "              (lora_dropout): ModuleDict(\n",
1733
              "                (default): Dropout(p=0.05, inplace=False)\n",
1734
              "              )\n",
1735
              "              (lora_A): ModuleDict(\n",
1736
              "                (default): Linear(in_features=2048, out_features=16, bias=False)\n",
1737
              "              )\n",
1738
              "              (lora_B): ModuleDict(\n",
1739
              "                (default): Linear(in_features=16, out_features=2048, bias=False)\n",
1740
              "              )\n",
1741
              "              (lora_embedding_A): ParameterDict()\n",
1742
              "              (lora_embedding_B): ParameterDict()\n",
1743
              "            )\n",
1744
              "            (inner_attn): SelfAttention(\n",
1745
              "              (drop): Dropout(p=0.0, inplace=False)\n",
1746
              "            )\n",
1747
              "            (inner_cross_attn): CrossAttention(\n",
1748
              "              (drop): Dropout(p=0.0, inplace=False)\n",
1749
              "            )\n",
1750
              "          )\n",
1751
              "          (mlp): MLP(\n",
1752
              "            (fc1): Linear4bit(in_features=2048, out_features=8192, bias=True)\n",
1753
              "            (fc2): Linear4bit(in_features=8192, out_features=2048, bias=True)\n",
1754
              "            (act): NewGELUActivation()\n",
1755
              "          )\n",
1756
              "        )\n",
1757
              "        (12): ParallelBlock(\n",
1758
              "          (ln): LayerNorm((2048,), eps=1e-05, elementwise_affine=True)\n",
1759
              "          (resid_dropout): Dropout(p=0.0, inplace=False)\n",
1760
              "          (mixer): MHA(\n",
1761
              "            (rotary_emb): RotaryEmbedding()\n",
1762
              "            (Wqkv): Linear4bit(\n",
1763
              "              in_features=2048, out_features=6144, bias=True\n",
1764
              "              (lora_dropout): ModuleDict(\n",
1765
              "                (default): Dropout(p=0.05, inplace=False)\n",
1766
              "              )\n",
1767
              "              (lora_A): ModuleDict(\n",
1768
              "                (default): Linear(in_features=2048, out_features=16, bias=False)\n",
1769
              "              )\n",
1770
              "              (lora_B): ModuleDict(\n",
1771
              "                (default): Linear(in_features=16, out_features=6144, bias=False)\n",
1772
              "              )\n",
1773
              "              (lora_embedding_A): ParameterDict()\n",
1774
              "              (lora_embedding_B): ParameterDict()\n",
1775
              "            )\n",
1776
              "            (out_proj): Linear4bit(\n",
1777
              "              in_features=2048, out_features=2048, bias=True\n",
1778
              "              (lora_dropout): ModuleDict(\n",
1779
              "                (default): Dropout(p=0.05, inplace=False)\n",
1780
              "              )\n",
1781
              "              (lora_A): ModuleDict(\n",
1782
              "                (default): Linear(in_features=2048, out_features=16, bias=False)\n",
1783
              "              )\n",
1784
              "              (lora_B): ModuleDict(\n",
1785
              "                (default): Linear(in_features=16, out_features=2048, bias=False)\n",
1786
              "              )\n",
1787
              "              (lora_embedding_A): ParameterDict()\n",
1788
              "              (lora_embedding_B): ParameterDict()\n",
1789
              "            )\n",
1790
              "            (inner_attn): SelfAttention(\n",
1791
              "              (drop): Dropout(p=0.0, inplace=False)\n",
1792
              "            )\n",
1793
              "            (inner_cross_attn): CrossAttention(\n",
1794
              "              (drop): Dropout(p=0.0, inplace=False)\n",
1795
              "            )\n",
1796
              "          )\n",
1797
              "          (mlp): MLP(\n",
1798
              "            (fc1): Linear4bit(in_features=2048, out_features=8192, bias=True)\n",
1799
              "            (fc2): Linear4bit(in_features=8192, out_features=2048, bias=True)\n",
1800
              "            (act): NewGELUActivation()\n",
1801
              "          )\n",
1802
              "        )\n",
1803
              "        (13): ParallelBlock(\n",
1804
              "          (ln): LayerNorm((2048,), eps=1e-05, elementwise_affine=True)\n",
1805
              "          (resid_dropout): Dropout(p=0.0, inplace=False)\n",
1806
              "          (mixer): MHA(\n",
1807
              "            (rotary_emb): RotaryEmbedding()\n",
1808
              "            (Wqkv): Linear4bit(\n",
1809
              "              in_features=2048, out_features=6144, bias=True\n",
1810
              "              (lora_dropout): ModuleDict(\n",
1811
              "                (default): Dropout(p=0.05, inplace=False)\n",
1812
              "              )\n",
1813
              "              (lora_A): ModuleDict(\n",
1814
              "                (default): Linear(in_features=2048, out_features=16, bias=False)\n",
1815
              "              )\n",
1816
              "              (lora_B): ModuleDict(\n",
1817
              "                (default): Linear(in_features=16, out_features=6144, bias=False)\n",
1818
              "              )\n",
1819
              "              (lora_embedding_A): ParameterDict()\n",
1820
              "              (lora_embedding_B): ParameterDict()\n",
1821
              "            )\n",
1822
              "            (out_proj): Linear4bit(\n",
1823
              "              in_features=2048, out_features=2048, bias=True\n",
1824
              "              (lora_dropout): ModuleDict(\n",
1825
              "                (default): Dropout(p=0.05, inplace=False)\n",
1826
              "              )\n",
1827
              "              (lora_A): ModuleDict(\n",
1828
              "                (default): Linear(in_features=2048, out_features=16, bias=False)\n",
1829
              "              )\n",
1830
              "              (lora_B): ModuleDict(\n",
1831
              "                (default): Linear(in_features=16, out_features=2048, bias=False)\n",
1832
              "              )\n",
1833
              "              (lora_embedding_A): ParameterDict()\n",
1834
              "              (lora_embedding_B): ParameterDict()\n",
1835
              "            )\n",
1836
              "            (inner_attn): SelfAttention(\n",
1837
              "              (drop): Dropout(p=0.0, inplace=False)\n",
1838
              "            )\n",
1839
              "            (inner_cross_attn): CrossAttention(\n",
1840
              "              (drop): Dropout(p=0.0, inplace=False)\n",
1841
              "            )\n",
1842
              "          )\n",
1843
              "          (mlp): MLP(\n",
1844
              "            (fc1): Linear4bit(in_features=2048, out_features=8192, bias=True)\n",
1845
              "            (fc2): Linear4bit(in_features=8192, out_features=2048, bias=True)\n",
1846
              "            (act): NewGELUActivation()\n",
1847
              "          )\n",
1848
              "        )\n",
1849
              "        (14): ParallelBlock(\n",
1850
              "          (ln): LayerNorm((2048,), eps=1e-05, elementwise_affine=True)\n",
1851
              "          (resid_dropout): Dropout(p=0.0, inplace=False)\n",
1852
              "          (mixer): MHA(\n",
1853
              "            (rotary_emb): RotaryEmbedding()\n",
1854
              "            (Wqkv): Linear4bit(\n",
1855
              "              in_features=2048, out_features=6144, bias=True\n",
1856
              "              (lora_dropout): ModuleDict(\n",
1857
              "                (default): Dropout(p=0.05, inplace=False)\n",
1858
              "              )\n",
1859
              "              (lora_A): ModuleDict(\n",
1860
              "                (default): Linear(in_features=2048, out_features=16, bias=False)\n",
1861
              "              )\n",
1862
              "              (lora_B): ModuleDict(\n",
1863
              "                (default): Linear(in_features=16, out_features=6144, bias=False)\n",
1864
              "              )\n",
1865
              "              (lora_embedding_A): ParameterDict()\n",
1866
              "              (lora_embedding_B): ParameterDict()\n",
1867
              "            )\n",
1868
              "            (out_proj): Linear4bit(\n",
1869
              "              in_features=2048, out_features=2048, bias=True\n",
1870
              "              (lora_dropout): ModuleDict(\n",
1871
              "                (default): Dropout(p=0.05, inplace=False)\n",
1872
              "              )\n",
1873
              "              (lora_A): ModuleDict(\n",
1874
              "                (default): Linear(in_features=2048, out_features=16, bias=False)\n",
1875
              "              )\n",
1876
              "              (lora_B): ModuleDict(\n",
1877
              "                (default): Linear(in_features=16, out_features=2048, bias=False)\n",
1878
              "              )\n",
1879
              "              (lora_embedding_A): ParameterDict()\n",
1880
              "              (lora_embedding_B): ParameterDict()\n",
1881
              "            )\n",
1882
              "            (inner_attn): SelfAttention(\n",
1883
              "              (drop): Dropout(p=0.0, inplace=False)\n",
1884
              "            )\n",
1885
              "            (inner_cross_attn): CrossAttention(\n",
1886
              "              (drop): Dropout(p=0.0, inplace=False)\n",
1887
              "            )\n",
1888
              "          )\n",
1889
              "          (mlp): MLP(\n",
1890
              "            (fc1): Linear4bit(in_features=2048, out_features=8192, bias=True)\n",
1891
              "            (fc2): Linear4bit(in_features=8192, out_features=2048, bias=True)\n",
1892
              "            (act): NewGELUActivation()\n",
1893
              "          )\n",
1894
              "        )\n",
1895
              "        (15): ParallelBlock(\n",
1896
              "          (ln): LayerNorm((2048,), eps=1e-05, elementwise_affine=True)\n",
1897
              "          (resid_dropout): Dropout(p=0.0, inplace=False)\n",
1898
              "          (mixer): MHA(\n",
1899
              "            (rotary_emb): RotaryEmbedding()\n",
1900
              "            (Wqkv): Linear4bit(\n",
1901
              "              in_features=2048, out_features=6144, bias=True\n",
1902
              "              (lora_dropout): ModuleDict(\n",
1903
              "                (default): Dropout(p=0.05, inplace=False)\n",
1904
              "              )\n",
1905
              "              (lora_A): ModuleDict(\n",
1906
              "                (default): Linear(in_features=2048, out_features=16, bias=False)\n",
1907
              "              )\n",
1908
              "              (lora_B): ModuleDict(\n",
1909
              "                (default): Linear(in_features=16, out_features=6144, bias=False)\n",
1910
              "              )\n",
1911
              "              (lora_embedding_A): ParameterDict()\n",
1912
              "              (lora_embedding_B): ParameterDict()\n",
1913
              "            )\n",
1914
              "            (out_proj): Linear4bit(\n",
1915
              "              in_features=2048, out_features=2048, bias=True\n",
1916
              "              (lora_dropout): ModuleDict(\n",
1917
              "                (default): Dropout(p=0.05, inplace=False)\n",
1918
              "              )\n",
1919
              "              (lora_A): ModuleDict(\n",
1920
              "                (default): Linear(in_features=2048, out_features=16, bias=False)\n",
1921
              "              )\n",
1922
              "              (lora_B): ModuleDict(\n",
1923
              "                (default): Linear(in_features=16, out_features=2048, bias=False)\n",
1924
              "              )\n",
1925
              "              (lora_embedding_A): ParameterDict()\n",
1926
              "              (lora_embedding_B): ParameterDict()\n",
1927
              "            )\n",
1928
              "            (inner_attn): SelfAttention(\n",
1929
              "              (drop): Dropout(p=0.0, inplace=False)\n",
1930
              "            )\n",
1931
              "            (inner_cross_attn): CrossAttention(\n",
1932
              "              (drop): Dropout(p=0.0, inplace=False)\n",
1933
              "            )\n",
1934
              "          )\n",
1935
              "          (mlp): MLP(\n",
1936
              "            (fc1): Linear4bit(in_features=2048, out_features=8192, bias=True)\n",
1937
              "            (fc2): Linear4bit(in_features=8192, out_features=2048, bias=True)\n",
1938
              "            (act): NewGELUActivation()\n",
1939
              "          )\n",
1940
              "        )\n",
1941
              "        (16): ParallelBlock(\n",
1942
              "          (ln): LayerNorm((2048,), eps=1e-05, elementwise_affine=True)\n",
1943
              "          (resid_dropout): Dropout(p=0.0, inplace=False)\n",
1944
              "          (mixer): MHA(\n",
1945
              "            (rotary_emb): RotaryEmbedding()\n",
1946
              "            (Wqkv): Linear4bit(\n",
1947
              "              in_features=2048, out_features=6144, bias=True\n",
1948
              "              (lora_dropout): ModuleDict(\n",
1949
              "                (default): Dropout(p=0.05, inplace=False)\n",
1950
              "              )\n",
1951
              "              (lora_A): ModuleDict(\n",
1952
              "                (default): Linear(in_features=2048, out_features=16, bias=False)\n",
1953
              "              )\n",
1954
              "              (lora_B): ModuleDict(\n",
1955
              "                (default): Linear(in_features=16, out_features=6144, bias=False)\n",
1956
              "              )\n",
1957
              "              (lora_embedding_A): ParameterDict()\n",
1958
              "              (lora_embedding_B): ParameterDict()\n",
1959
              "            )\n",
1960
              "            (out_proj): Linear4bit(\n",
1961
              "              in_features=2048, out_features=2048, bias=True\n",
1962
              "              (lora_dropout): ModuleDict(\n",
1963
              "                (default): Dropout(p=0.05, inplace=False)\n",
1964
              "              )\n",
1965
              "              (lora_A): ModuleDict(\n",
1966
              "                (default): Linear(in_features=2048, out_features=16, bias=False)\n",
1967
              "              )\n",
1968
              "              (lora_B): ModuleDict(\n",
1969
              "                (default): Linear(in_features=16, out_features=2048, bias=False)\n",
1970
              "              )\n",
1971
              "              (lora_embedding_A): ParameterDict()\n",
1972
              "              (lora_embedding_B): ParameterDict()\n",
1973
              "            )\n",
1974
              "            (inner_attn): SelfAttention(\n",
1975
              "              (drop): Dropout(p=0.0, inplace=False)\n",
1976
              "            )\n",
1977
              "            (inner_cross_attn): CrossAttention(\n",
1978
              "              (drop): Dropout(p=0.0, inplace=False)\n",
1979
              "            )\n",
1980
              "          )\n",
1981
              "          (mlp): MLP(\n",
1982
              "            (fc1): Linear4bit(in_features=2048, out_features=8192, bias=True)\n",
1983
              "            (fc2): Linear4bit(in_features=8192, out_features=2048, bias=True)\n",
1984
              "            (act): NewGELUActivation()\n",
1985
              "          )\n",
1986
              "        )\n",
1987
              "        (17): ParallelBlock(\n",
1988
              "          (ln): LayerNorm((2048,), eps=1e-05, elementwise_affine=True)\n",
1989
              "          (resid_dropout): Dropout(p=0.0, inplace=False)\n",
1990
              "          (mixer): MHA(\n",
1991
              "            (rotary_emb): RotaryEmbedding()\n",
1992
              "            (Wqkv): Linear4bit(\n",
1993
              "              in_features=2048, out_features=6144, bias=True\n",
1994
              "              (lora_dropout): ModuleDict(\n",
1995
              "                (default): Dropout(p=0.05, inplace=False)\n",
1996
              "              )\n",
1997
              "              (lora_A): ModuleDict(\n",
1998
              "                (default): Linear(in_features=2048, out_features=16, bias=False)\n",
1999
              "              )\n",
2000
              "              (lora_B): ModuleDict(\n",
2001
              "                (default): Linear(in_features=16, out_features=6144, bias=False)\n",
2002
              "              )\n",
2003
              "              (lora_embedding_A): ParameterDict()\n",
2004
              "              (lora_embedding_B): ParameterDict()\n",
2005
              "            )\n",
2006
              "            (out_proj): Linear4bit(\n",
2007
              "              in_features=2048, out_features=2048, bias=True\n",
2008
              "              (lora_dropout): ModuleDict(\n",
2009
              "                (default): Dropout(p=0.05, inplace=False)\n",
2010
              "              )\n",
2011
              "              (lora_A): ModuleDict(\n",
2012
              "                (default): Linear(in_features=2048, out_features=16, bias=False)\n",
2013
              "              )\n",
2014
              "              (lora_B): ModuleDict(\n",
2015
              "                (default): Linear(in_features=16, out_features=2048, bias=False)\n",
2016
              "              )\n",
2017
              "              (lora_embedding_A): ParameterDict()\n",
2018
              "              (lora_embedding_B): ParameterDict()\n",
2019
              "            )\n",
2020
              "            (inner_attn): SelfAttention(\n",
2021
              "              (drop): Dropout(p=0.0, inplace=False)\n",
2022
              "            )\n",
2023
              "            (inner_cross_attn): CrossAttention(\n",
2024
              "              (drop): Dropout(p=0.0, inplace=False)\n",
2025
              "            )\n",
2026
              "          )\n",
2027
              "          (mlp): MLP(\n",
2028
              "            (fc1): Linear4bit(in_features=2048, out_features=8192, bias=True)\n",
2029
              "            (fc2): Linear4bit(in_features=8192, out_features=2048, bias=True)\n",
2030
              "            (act): NewGELUActivation()\n",
2031
              "          )\n",
2032
              "        )\n",
2033
              "        (18): ParallelBlock(\n",
2034
              "          (ln): LayerNorm((2048,), eps=1e-05, elementwise_affine=True)\n",
2035
              "          (resid_dropout): Dropout(p=0.0, inplace=False)\n",
2036
              "          (mixer): MHA(\n",
2037
              "            (rotary_emb): RotaryEmbedding()\n",
2038
              "            (Wqkv): Linear4bit(\n",
2039
              "              in_features=2048, out_features=6144, bias=True\n",
2040
              "              (lora_dropout): ModuleDict(\n",
2041
              "                (default): Dropout(p=0.05, inplace=False)\n",
2042
              "              )\n",
2043
              "              (lora_A): ModuleDict(\n",
2044
              "                (default): Linear(in_features=2048, out_features=16, bias=False)\n",
2045
              "              )\n",
2046
              "              (lora_B): ModuleDict(\n",
2047
              "                (default): Linear(in_features=16, out_features=6144, bias=False)\n",
2048
              "              )\n",
2049
              "              (lora_embedding_A): ParameterDict()\n",
2050
              "              (lora_embedding_B): ParameterDict()\n",
2051
              "            )\n",
2052
              "            (out_proj): Linear4bit(\n",
2053
              "              in_features=2048, out_features=2048, bias=True\n",
2054
              "              (lora_dropout): ModuleDict(\n",
2055
              "                (default): Dropout(p=0.05, inplace=False)\n",
2056
              "              )\n",
2057
              "              (lora_A): ModuleDict(\n",
2058
              "                (default): Linear(in_features=2048, out_features=16, bias=False)\n",
2059
              "              )\n",
2060
              "              (lora_B): ModuleDict(\n",
2061
              "                (default): Linear(in_features=16, out_features=2048, bias=False)\n",
2062
              "              )\n",
2063
              "              (lora_embedding_A): ParameterDict()\n",
2064
              "              (lora_embedding_B): ParameterDict()\n",
2065
              "            )\n",
2066
              "            (inner_attn): SelfAttention(\n",
2067
              "              (drop): Dropout(p=0.0, inplace=False)\n",
2068
              "            )\n",
2069
              "            (inner_cross_attn): CrossAttention(\n",
2070
              "              (drop): Dropout(p=0.0, inplace=False)\n",
2071
              "            )\n",
2072
              "          )\n",
2073
              "          (mlp): MLP(\n",
2074
              "            (fc1): Linear4bit(in_features=2048, out_features=8192, bias=True)\n",
2075
              "            (fc2): Linear4bit(in_features=8192, out_features=2048, bias=True)\n",
2076
              "            (act): NewGELUActivation()\n",
2077
              "          )\n",
2078
              "        )\n",
2079
              "        (19): ParallelBlock(\n",
2080
              "          (ln): LayerNorm((2048,), eps=1e-05, elementwise_affine=True)\n",
2081
              "          (resid_dropout): Dropout(p=0.0, inplace=False)\n",
2082
              "          (mixer): MHA(\n",
2083
              "            (rotary_emb): RotaryEmbedding()\n",
2084
              "            (Wqkv): Linear4bit(\n",
2085
              "              in_features=2048, out_features=6144, bias=True\n",
2086
              "              (lora_dropout): ModuleDict(\n",
2087
              "                (default): Dropout(p=0.05, inplace=False)\n",
2088
              "              )\n",
2089
              "              (lora_A): ModuleDict(\n",
2090
              "                (default): Linear(in_features=2048, out_features=16, bias=False)\n",
2091
              "              )\n",
2092
              "              (lora_B): ModuleDict(\n",
2093
              "                (default): Linear(in_features=16, out_features=6144, bias=False)\n",
2094
              "              )\n",
2095
              "              (lora_embedding_A): ParameterDict()\n",
2096
              "              (lora_embedding_B): ParameterDict()\n",
2097
              "            )\n",
2098
              "            (out_proj): Linear4bit(\n",
2099
              "              in_features=2048, out_features=2048, bias=True\n",
2100
              "              (lora_dropout): ModuleDict(\n",
2101
              "                (default): Dropout(p=0.05, inplace=False)\n",
2102
              "              )\n",
2103
              "              (lora_A): ModuleDict(\n",
2104
              "                (default): Linear(in_features=2048, out_features=16, bias=False)\n",
2105
              "              )\n",
2106
              "              (lora_B): ModuleDict(\n",
2107
              "                (default): Linear(in_features=16, out_features=2048, bias=False)\n",
2108
              "              )\n",
2109
              "              (lora_embedding_A): ParameterDict()\n",
2110
              "              (lora_embedding_B): ParameterDict()\n",
2111
              "            )\n",
2112
              "            (inner_attn): SelfAttention(\n",
2113
              "              (drop): Dropout(p=0.0, inplace=False)\n",
2114
              "            )\n",
2115
              "            (inner_cross_attn): CrossAttention(\n",
2116
              "              (drop): Dropout(p=0.0, inplace=False)\n",
2117
              "            )\n",
2118
              "          )\n",
2119
              "          (mlp): MLP(\n",
2120
              "            (fc1): Linear4bit(in_features=2048, out_features=8192, bias=True)\n",
2121
              "            (fc2): Linear4bit(in_features=8192, out_features=2048, bias=True)\n",
2122
              "            (act): NewGELUActivation()\n",
2123
              "          )\n",
2124
              "        )\n",
2125
              "        (20): ParallelBlock(\n",
2126
              "          (ln): LayerNorm((2048,), eps=1e-05, elementwise_affine=True)\n",
2127
              "          (resid_dropout): Dropout(p=0.0, inplace=False)\n",
2128
              "          (mixer): MHA(\n",
2129
              "            (rotary_emb): RotaryEmbedding()\n",
2130
              "            (Wqkv): Linear4bit(\n",
2131
              "              in_features=2048, out_features=6144, bias=True\n",
2132
              "              (lora_dropout): ModuleDict(\n",
2133
              "                (default): Dropout(p=0.05, inplace=False)\n",
2134
              "              )\n",
2135
              "              (lora_A): ModuleDict(\n",
2136
              "                (default): Linear(in_features=2048, out_features=16, bias=False)\n",
2137
              "              )\n",
2138
              "              (lora_B): ModuleDict(\n",
2139
              "                (default): Linear(in_features=16, out_features=6144, bias=False)\n",
2140
              "              )\n",
2141
              "              (lora_embedding_A): ParameterDict()\n",
2142
              "              (lora_embedding_B): ParameterDict()\n",
2143
              "            )\n",
2144
              "            (out_proj): Linear4bit(\n",
2145
              "              in_features=2048, out_features=2048, bias=True\n",
2146
              "              (lora_dropout): ModuleDict(\n",
2147
              "                (default): Dropout(p=0.05, inplace=False)\n",
2148
              "              )\n",
2149
              "              (lora_A): ModuleDict(\n",
2150
              "                (default): Linear(in_features=2048, out_features=16, bias=False)\n",
2151
              "              )\n",
2152
              "              (lora_B): ModuleDict(\n",
2153
              "                (default): Linear(in_features=16, out_features=2048, bias=False)\n",
2154
              "              )\n",
2155
              "              (lora_embedding_A): ParameterDict()\n",
2156
              "              (lora_embedding_B): ParameterDict()\n",
2157
              "            )\n",
2158
              "            (inner_attn): SelfAttention(\n",
2159
              "              (drop): Dropout(p=0.0, inplace=False)\n",
2160
              "            )\n",
2161
              "            (inner_cross_attn): CrossAttention(\n",
2162
              "              (drop): Dropout(p=0.0, inplace=False)\n",
2163
              "            )\n",
2164
              "          )\n",
2165
              "          (mlp): MLP(\n",
2166
              "            (fc1): Linear4bit(in_features=2048, out_features=8192, bias=True)\n",
2167
              "            (fc2): Linear4bit(in_features=8192, out_features=2048, bias=True)\n",
2168
              "            (act): NewGELUActivation()\n",
2169
              "          )\n",
2170
              "        )\n",
2171
              "        (21): ParallelBlock(\n",
2172
              "          (ln): LayerNorm((2048,), eps=1e-05, elementwise_affine=True)\n",
2173
              "          (resid_dropout): Dropout(p=0.0, inplace=False)\n",
2174
              "          (mixer): MHA(\n",
2175
              "            (rotary_emb): RotaryEmbedding()\n",
2176
              "            (Wqkv): Linear4bit(\n",
2177
              "              in_features=2048, out_features=6144, bias=True\n",
2178
              "              (lora_dropout): ModuleDict(\n",
2179
              "                (default): Dropout(p=0.05, inplace=False)\n",
2180
              "              )\n",
2181
              "              (lora_A): ModuleDict(\n",
2182
              "                (default): Linear(in_features=2048, out_features=16, bias=False)\n",
2183
              "              )\n",
2184
              "              (lora_B): ModuleDict(\n",
2185
              "                (default): Linear(in_features=16, out_features=6144, bias=False)\n",
2186
              "              )\n",
2187
              "              (lora_embedding_A): ParameterDict()\n",
2188
              "              (lora_embedding_B): ParameterDict()\n",
2189
              "            )\n",
2190
              "            (out_proj): Linear4bit(\n",
2191
              "              in_features=2048, out_features=2048, bias=True\n",
2192
              "              (lora_dropout): ModuleDict(\n",
2193
              "                (default): Dropout(p=0.05, inplace=False)\n",
2194
              "              )\n",
2195
              "              (lora_A): ModuleDict(\n",
2196
              "                (default): Linear(in_features=2048, out_features=16, bias=False)\n",
2197
              "              )\n",
2198
              "              (lora_B): ModuleDict(\n",
2199
              "                (default): Linear(in_features=16, out_features=2048, bias=False)\n",
2200
              "              )\n",
2201
              "              (lora_embedding_A): ParameterDict()\n",
2202
              "              (lora_embedding_B): ParameterDict()\n",
2203
              "            )\n",
2204
              "            (inner_attn): SelfAttention(\n",
2205
              "              (drop): Dropout(p=0.0, inplace=False)\n",
2206
              "            )\n",
2207
              "            (inner_cross_attn): CrossAttention(\n",
2208
              "              (drop): Dropout(p=0.0, inplace=False)\n",
2209
              "            )\n",
2210
              "          )\n",
2211
              "          (mlp): MLP(\n",
2212
              "            (fc1): Linear4bit(in_features=2048, out_features=8192, bias=True)\n",
2213
              "            (fc2): Linear4bit(in_features=8192, out_features=2048, bias=True)\n",
2214
              "            (act): NewGELUActivation()\n",
2215
              "          )\n",
2216
              "        )\n",
2217
              "        (22): ParallelBlock(\n",
2218
              "          (ln): LayerNorm((2048,), eps=1e-05, elementwise_affine=True)\n",
2219
              "          (resid_dropout): Dropout(p=0.0, inplace=False)\n",
2220
              "          (mixer): MHA(\n",
2221
              "            (rotary_emb): RotaryEmbedding()\n",
2222
              "            (Wqkv): Linear4bit(\n",
2223
              "              in_features=2048, out_features=6144, bias=True\n",
2224
              "              (lora_dropout): ModuleDict(\n",
2225
              "                (default): Dropout(p=0.05, inplace=False)\n",
2226
              "              )\n",
2227
              "              (lora_A): ModuleDict(\n",
2228
              "                (default): Linear(in_features=2048, out_features=16, bias=False)\n",
2229
              "              )\n",
2230
              "              (lora_B): ModuleDict(\n",
2231
              "                (default): Linear(in_features=16, out_features=6144, bias=False)\n",
2232
              "              )\n",
2233
              "              (lora_embedding_A): ParameterDict()\n",
2234
              "              (lora_embedding_B): ParameterDict()\n",
2235
              "            )\n",
2236
              "            (out_proj): Linear4bit(\n",
2237
              "              in_features=2048, out_features=2048, bias=True\n",
2238
              "              (lora_dropout): ModuleDict(\n",
2239
              "                (default): Dropout(p=0.05, inplace=False)\n",
2240
              "              )\n",
2241
              "              (lora_A): ModuleDict(\n",
2242
              "                (default): Linear(in_features=2048, out_features=16, bias=False)\n",
2243
              "              )\n",
2244
              "              (lora_B): ModuleDict(\n",
2245
              "                (default): Linear(in_features=16, out_features=2048, bias=False)\n",
2246
              "              )\n",
2247
              "              (lora_embedding_A): ParameterDict()\n",
2248
              "              (lora_embedding_B): ParameterDict()\n",
2249
              "            )\n",
2250
              "            (inner_attn): SelfAttention(\n",
2251
              "              (drop): Dropout(p=0.0, inplace=False)\n",
2252
              "            )\n",
2253
              "            (inner_cross_attn): CrossAttention(\n",
2254
              "              (drop): Dropout(p=0.0, inplace=False)\n",
2255
              "            )\n",
2256
              "          )\n",
2257
              "          (mlp): MLP(\n",
2258
              "            (fc1): Linear4bit(in_features=2048, out_features=8192, bias=True)\n",
2259
              "            (fc2): Linear4bit(in_features=8192, out_features=2048, bias=True)\n",
2260
              "            (act): NewGELUActivation()\n",
2261
              "          )\n",
2262
              "        )\n",
2263
              "        (23): ParallelBlock(\n",
2264
              "          (ln): LayerNorm((2048,), eps=1e-05, elementwise_affine=True)\n",
2265
              "          (resid_dropout): Dropout(p=0.0, inplace=False)\n",
2266
              "          (mixer): MHA(\n",
2267
              "            (rotary_emb): RotaryEmbedding()\n",
2268
              "            (Wqkv): Linear4bit(\n",
2269
              "              in_features=2048, out_features=6144, bias=True\n",
2270
              "              (lora_dropout): ModuleDict(\n",
2271
              "                (default): Dropout(p=0.05, inplace=False)\n",
2272
              "              )\n",
2273
              "              (lora_A): ModuleDict(\n",
2274
              "                (default): Linear(in_features=2048, out_features=16, bias=False)\n",
2275
              "              )\n",
2276
              "              (lora_B): ModuleDict(\n",
2277
              "                (default): Linear(in_features=16, out_features=6144, bias=False)\n",
2278
              "              )\n",
2279
              "              (lora_embedding_A): ParameterDict()\n",
2280
              "              (lora_embedding_B): ParameterDict()\n",
2281
              "            )\n",
2282
              "            (out_proj): Linear4bit(\n",
2283
              "              in_features=2048, out_features=2048, bias=True\n",
2284
              "              (lora_dropout): ModuleDict(\n",
2285
              "                (default): Dropout(p=0.05, inplace=False)\n",
2286
              "              )\n",
2287
              "              (lora_A): ModuleDict(\n",
2288
              "                (default): Linear(in_features=2048, out_features=16, bias=False)\n",
2289
              "              )\n",
2290
              "              (lora_B): ModuleDict(\n",
2291
              "                (default): Linear(in_features=16, out_features=2048, bias=False)\n",
2292
              "              )\n",
2293
              "              (lora_embedding_A): ParameterDict()\n",
2294
              "              (lora_embedding_B): ParameterDict()\n",
2295
              "            )\n",
2296
              "            (inner_attn): SelfAttention(\n",
2297
              "              (drop): Dropout(p=0.0, inplace=False)\n",
2298
              "            )\n",
2299
              "            (inner_cross_attn): CrossAttention(\n",
2300
              "              (drop): Dropout(p=0.0, inplace=False)\n",
2301
              "            )\n",
2302
              "          )\n",
2303
              "          (mlp): MLP(\n",
2304
              "            (fc1): Linear4bit(in_features=2048, out_features=8192, bias=True)\n",
2305
              "            (fc2): Linear4bit(in_features=8192, out_features=2048, bias=True)\n",
2306
              "            (act): NewGELUActivation()\n",
2307
              "          )\n",
2308
              "        )\n",
2309
              "        (24): ParallelBlock(\n",
2310
              "          (ln): LayerNorm((2048,), eps=1e-05, elementwise_affine=True)\n",
2311
              "          (resid_dropout): Dropout(p=0.0, inplace=False)\n",
2312
              "          (mixer): MHA(\n",
2313
              "            (rotary_emb): RotaryEmbedding()\n",
2314
              "            (Wqkv): Linear4bit(\n",
2315
              "              in_features=2048, out_features=6144, bias=True\n",
2316
              "              (lora_dropout): ModuleDict(\n",
2317
              "                (default): Dropout(p=0.05, inplace=False)\n",
2318
              "              )\n",
2319
              "              (lora_A): ModuleDict(\n",
2320
              "                (default): Linear(in_features=2048, out_features=16, bias=False)\n",
2321
              "              )\n",
2322
              "              (lora_B): ModuleDict(\n",
2323
              "                (default): Linear(in_features=16, out_features=6144, bias=False)\n",
2324
              "              )\n",
2325
              "              (lora_embedding_A): ParameterDict()\n",
2326
              "              (lora_embedding_B): ParameterDict()\n",
2327
              "            )\n",
2328
              "            (out_proj): Linear4bit(\n",
2329
              "              in_features=2048, out_features=2048, bias=True\n",
2330
              "              (lora_dropout): ModuleDict(\n",
2331
              "                (default): Dropout(p=0.05, inplace=False)\n",
2332
              "              )\n",
2333
              "              (lora_A): ModuleDict(\n",
2334
              "                (default): Linear(in_features=2048, out_features=16, bias=False)\n",
2335
              "              )\n",
2336
              "              (lora_B): ModuleDict(\n",
2337
              "                (default): Linear(in_features=16, out_features=2048, bias=False)\n",
2338
              "              )\n",
2339
              "              (lora_embedding_A): ParameterDict()\n",
2340
              "              (lora_embedding_B): ParameterDict()\n",
2341
              "            )\n",
2342
              "            (inner_attn): SelfAttention(\n",
2343
              "              (drop): Dropout(p=0.0, inplace=False)\n",
2344
              "            )\n",
2345
              "            (inner_cross_attn): CrossAttention(\n",
2346
              "              (drop): Dropout(p=0.0, inplace=False)\n",
2347
              "            )\n",
2348
              "          )\n",
2349
              "          (mlp): MLP(\n",
2350
              "            (fc1): Linear4bit(in_features=2048, out_features=8192, bias=True)\n",
2351
              "            (fc2): Linear4bit(in_features=8192, out_features=2048, bias=True)\n",
2352
              "            (act): NewGELUActivation()\n",
2353
              "          )\n",
2354
              "        )\n",
2355
              "        (25): CausalLMHead(\n",
2356
              "          (ln): LayerNorm((2048,), eps=1e-05, elementwise_affine=True)\n",
2357
              "          (linear): Linear(in_features=2048, out_features=51200, bias=True)\n",
2358
              "        )\n",
2359
              "      )\n",
2360
              "      (loss): CausalLMLoss(\n",
2361
              "        (loss_fct): CrossEntropyLoss()\n",
2362
              "      )\n",
2363
              "    )\n",
2364
              "  )\n",
2365
              ")"
2366
            ]
2367
          },
2368
          "metadata": {},
2369
          "execution_count": 30
2370
        }
2371
      ],
2372
      "source": [
2373
        "trainer.model"
2374
      ]
2375
    },
2376
    {
2377
      "cell_type": "markdown",
2378
      "source": [
2379
        "## Inference"
2380
      ],
2381
      "metadata": {
2382
        "id": "7lSxtsWehGcy"
2383
      }
2384
    },
2385
    {
2386
      "cell_type": "code",
2387
      "source": [
2388
        "from peft import PeftModel\n",
2389
        "from transformers import AutoModelForCausalLM\n",
2390
        "import torch\n",
2391
        "model = AutoModelForCausalLM.from_pretrained(\"microsoft/phi-1_5\", trust_remote_code=True, torch_dtype=torch.float32)\n",
2392
        "peft_model = PeftModel.from_pretrained(model, \"ashishpatel26/phi-1_5-finetuned-dialogstudio\", from_transformers=True)\n",
2393
        "model = peft_model.merge_and_unload()\n",
2394
        "model"
2395
      ],
2396
      "metadata": {
2397
        "colab": {
2398
          "base_uri": "https://localhost:8080/",
2399
          "height": 1000,
2400
          "referenced_widgets": [
2401
            "18d7c57661f54a2f906b86e5b92a356d",
2402
            "e132669f57024ebcadc1f0d3899fbda2",
2403
            "f3e78fd1331b4463a243475e12bd2480",
2404
            "386c7bc116b849aaa2bd4c8b0c27b0e9",
2405
            "4385c5f8fc5d4d179e02ebf65aae4e0f",
2406
            "59032aea122142da8744876e7d561bca",
2407
            "b7bf29e09c554482823942f17fb09217",
2408
            "faf28ec7a6304a1d8e52952aff97c6b4",
2409
            "f5ed4018421f446da4ff34741a166d38",
2410
            "1919c4500c88418dad25ed0801033031",
2411
            "c4a29910b33d4a348ceef13239cf835e",
2412
            "31405710033848009cf8227a7611864f",
2413
            "cc862dc1f8884513b8eefb569ab50424",
2414
            "3cd7c95a507d459f86b9eadd7cfdcb85",
2415
            "683da23b78b54a8eb3c1984cd29bbeb2",
2416
            "f022a8aac72d490fb89495f01c929885",
2417
            "ac31ba38940c445e9305623046dc2473",
2418
            "1880da50605c435da03377a6e535d3a6",
2419
            "d645078ee2094f37a1bfbaa6727474bb",
2420
            "a0c4211bdd9e4857b16fbad1d7b1d3e1",
2421
            "3bee676ed0274dee9160f3260f253acf",
2422
            "93909168ffc24b5ba6c03a2a067b99c1"
2423
          ]
2424
        },
2425
        "id": "e43OUEfYOzFF",
2426
        "outputId": "76eec92a-79aa-41af-de41-63b60483470c"
2427
      },
2428
      "execution_count": 1,
2429
      "outputs": [
2430
        {
2431
          "output_type": "display_data",
2432
          "data": {
2433
            "text/plain": [
2434
              "Downloading (…)/adapter_config.json:   0%|          | 0.00/440 [00:00<?, ?B/s]"
2435
            ],
2436
            "application/vnd.jupyter.widget-view+json": {
2437
              "version_major": 2,
2438
              "version_minor": 0,
2439
              "model_id": "18d7c57661f54a2f906b86e5b92a356d"
2440
            }
2441
          },
2442
          "metadata": {}
2443
        },
2444
        {
2445
          "output_type": "display_data",
2446
          "data": {
2447
            "text/plain": [
2448
              "Downloading adapter_model.bin:   0%|          | 0.00/18.9M [00:00<?, ?B/s]"
2449
            ],
2450
            "application/vnd.jupyter.widget-view+json": {
2451
              "version_major": 2,
2452
              "version_minor": 0,
2453
              "model_id": "31405710033848009cf8227a7611864f"
2454
            }
2455
          },
2456
          "metadata": {}
2457
        },
2458
        {
2459
          "output_type": "execute_result",
2460
          "data": {
2461
            "text/plain": [
2462
              "MixFormerSequentialForCausalLM(\n",
2463
              "  (layers): Sequential(\n",
2464
              "    (0): Embedding(\n",
2465
              "      (wte): Embedding(51200, 2048)\n",
2466
              "      (drop): Dropout(p=0.0, inplace=False)\n",
2467
              "    )\n",
2468
              "    (1): ParallelBlock(\n",
2469
              "      (ln): LayerNorm((2048,), eps=1e-05, elementwise_affine=True)\n",
2470
              "      (resid_dropout): Dropout(p=0.0, inplace=False)\n",
2471
              "      (mixer): MHA(\n",
2472
              "        (rotary_emb): RotaryEmbedding()\n",
2473
              "        (Wqkv): Linear(in_features=2048, out_features=6144, bias=True)\n",
2474
              "        (out_proj): Linear(in_features=2048, out_features=2048, bias=True)\n",
2475
              "        (inner_attn): SelfAttention(\n",
2476
              "          (drop): Dropout(p=0.0, inplace=False)\n",
2477
              "        )\n",
2478
              "        (inner_cross_attn): CrossAttention(\n",
2479
              "          (drop): Dropout(p=0.0, inplace=False)\n",
2480
              "        )\n",
2481
              "      )\n",
2482
              "      (mlp): MLP(\n",
2483
              "        (fc1): Linear(in_features=2048, out_features=8192, bias=True)\n",
2484
              "        (fc2): Linear(in_features=8192, out_features=2048, bias=True)\n",
2485
              "        (act): NewGELUActivation()\n",
2486
              "      )\n",
2487
              "    )\n",
2488
              "    (2): ParallelBlock(\n",
2489
              "      (ln): LayerNorm((2048,), eps=1e-05, elementwise_affine=True)\n",
2490
              "      (resid_dropout): Dropout(p=0.0, inplace=False)\n",
2491
              "      (mixer): MHA(\n",
2492
              "        (rotary_emb): RotaryEmbedding()\n",
2493
              "        (Wqkv): Linear(in_features=2048, out_features=6144, bias=True)\n",
2494
              "        (out_proj): Linear(in_features=2048, out_features=2048, bias=True)\n",
2495
              "        (inner_attn): SelfAttention(\n",
2496
              "          (drop): Dropout(p=0.0, inplace=False)\n",
2497
              "        )\n",
2498
              "        (inner_cross_attn): CrossAttention(\n",
2499
              "          (drop): Dropout(p=0.0, inplace=False)\n",
2500
              "        )\n",
2501
              "      )\n",
2502
              "      (mlp): MLP(\n",
2503
              "        (fc1): Linear(in_features=2048, out_features=8192, bias=True)\n",
2504
              "        (fc2): Linear(in_features=8192, out_features=2048, bias=True)\n",
2505
              "        (act): NewGELUActivation()\n",
2506
              "      )\n",
2507
              "    )\n",
2508
              "    (3): ParallelBlock(\n",
2509
              "      (ln): LayerNorm((2048,), eps=1e-05, elementwise_affine=True)\n",
2510
              "      (resid_dropout): Dropout(p=0.0, inplace=False)\n",
2511
              "      (mixer): MHA(\n",
2512
              "        (rotary_emb): RotaryEmbedding()\n",
2513
              "        (Wqkv): Linear(in_features=2048, out_features=6144, bias=True)\n",
2514
              "        (out_proj): Linear(in_features=2048, out_features=2048, bias=True)\n",
2515
              "        (inner_attn): SelfAttention(\n",
2516
              "          (drop): Dropout(p=0.0, inplace=False)\n",
2517
              "        )\n",
2518
              "        (inner_cross_attn): CrossAttention(\n",
2519
              "          (drop): Dropout(p=0.0, inplace=False)\n",
2520
              "        )\n",
2521
              "      )\n",
2522
              "      (mlp): MLP(\n",
2523
              "        (fc1): Linear(in_features=2048, out_features=8192, bias=True)\n",
2524
              "        (fc2): Linear(in_features=8192, out_features=2048, bias=True)\n",
2525
              "        (act): NewGELUActivation()\n",
2526
              "      )\n",
2527
              "    )\n",
2528
              "    (4): ParallelBlock(\n",
2529
              "      (ln): LayerNorm((2048,), eps=1e-05, elementwise_affine=True)\n",
2530
              "      (resid_dropout): Dropout(p=0.0, inplace=False)\n",
2531
              "      (mixer): MHA(\n",
2532
              "        (rotary_emb): RotaryEmbedding()\n",
2533
              "        (Wqkv): Linear(in_features=2048, out_features=6144, bias=True)\n",
2534
              "        (out_proj): Linear(in_features=2048, out_features=2048, bias=True)\n",
2535
              "        (inner_attn): SelfAttention(\n",
2536
              "          (drop): Dropout(p=0.0, inplace=False)\n",
2537
              "        )\n",
2538
              "        (inner_cross_attn): CrossAttention(\n",
2539
              "          (drop): Dropout(p=0.0, inplace=False)\n",
2540
              "        )\n",
2541
              "      )\n",
2542
              "      (mlp): MLP(\n",
2543
              "        (fc1): Linear(in_features=2048, out_features=8192, bias=True)\n",
2544
              "        (fc2): Linear(in_features=8192, out_features=2048, bias=True)\n",
2545
              "        (act): NewGELUActivation()\n",
2546
              "      )\n",
2547
              "    )\n",
2548
              "    (5): ParallelBlock(\n",
2549
              "      (ln): LayerNorm((2048,), eps=1e-05, elementwise_affine=True)\n",
2550
              "      (resid_dropout): Dropout(p=0.0, inplace=False)\n",
2551
              "      (mixer): MHA(\n",
2552
              "        (rotary_emb): RotaryEmbedding()\n",
2553
              "        (Wqkv): Linear(in_features=2048, out_features=6144, bias=True)\n",
2554
              "        (out_proj): Linear(in_features=2048, out_features=2048, bias=True)\n",
2555
              "        (inner_attn): SelfAttention(\n",
2556
              "          (drop): Dropout(p=0.0, inplace=False)\n",
2557
              "        )\n",
2558
              "        (inner_cross_attn): CrossAttention(\n",
2559
              "          (drop): Dropout(p=0.0, inplace=False)\n",
2560
              "        )\n",
2561
              "      )\n",
2562
              "      (mlp): MLP(\n",
2563
              "        (fc1): Linear(in_features=2048, out_features=8192, bias=True)\n",
2564
              "        (fc2): Linear(in_features=8192, out_features=2048, bias=True)\n",
2565
              "        (act): NewGELUActivation()\n",
2566
              "      )\n",
2567
              "    )\n",
2568
              "    (6): ParallelBlock(\n",
2569
              "      (ln): LayerNorm((2048,), eps=1e-05, elementwise_affine=True)\n",
2570
              "      (resid_dropout): Dropout(p=0.0, inplace=False)\n",
2571
              "      (mixer): MHA(\n",
2572
              "        (rotary_emb): RotaryEmbedding()\n",
2573
              "        (Wqkv): Linear(in_features=2048, out_features=6144, bias=True)\n",
2574
              "        (out_proj): Linear(in_features=2048, out_features=2048, bias=True)\n",
2575
              "        (inner_attn): SelfAttention(\n",
2576
              "          (drop): Dropout(p=0.0, inplace=False)\n",
2577
              "        )\n",
2578
              "        (inner_cross_attn): CrossAttention(\n",
2579
              "          (drop): Dropout(p=0.0, inplace=False)\n",
2580
              "        )\n",
2581
              "      )\n",
2582
              "      (mlp): MLP(\n",
2583
              "        (fc1): Linear(in_features=2048, out_features=8192, bias=True)\n",
2584
              "        (fc2): Linear(in_features=8192, out_features=2048, bias=True)\n",
2585
              "        (act): NewGELUActivation()\n",
2586
              "      )\n",
2587
              "    )\n",
2588
              "    (7): ParallelBlock(\n",
2589
              "      (ln): LayerNorm((2048,), eps=1e-05, elementwise_affine=True)\n",
2590
              "      (resid_dropout): Dropout(p=0.0, inplace=False)\n",
2591
              "      (mixer): MHA(\n",
2592
              "        (rotary_emb): RotaryEmbedding()\n",
2593
              "        (Wqkv): Linear(in_features=2048, out_features=6144, bias=True)\n",
2594
              "        (out_proj): Linear(in_features=2048, out_features=2048, bias=True)\n",
2595
              "        (inner_attn): SelfAttention(\n",
2596
              "          (drop): Dropout(p=0.0, inplace=False)\n",
2597
              "        )\n",
2598
              "        (inner_cross_attn): CrossAttention(\n",
2599
              "          (drop): Dropout(p=0.0, inplace=False)\n",
2600
              "        )\n",
2601
              "      )\n",
2602
              "      (mlp): MLP(\n",
2603
              "        (fc1): Linear(in_features=2048, out_features=8192, bias=True)\n",
2604
              "        (fc2): Linear(in_features=8192, out_features=2048, bias=True)\n",
2605
              "        (act): NewGELUActivation()\n",
2606
              "      )\n",
2607
              "    )\n",
2608
              "    (8): ParallelBlock(\n",
2609
              "      (ln): LayerNorm((2048,), eps=1e-05, elementwise_affine=True)\n",
2610
              "      (resid_dropout): Dropout(p=0.0, inplace=False)\n",
2611
              "      (mixer): MHA(\n",
2612
              "        (rotary_emb): RotaryEmbedding()\n",
2613
              "        (Wqkv): Linear(in_features=2048, out_features=6144, bias=True)\n",
2614
              "        (out_proj): Linear(in_features=2048, out_features=2048, bias=True)\n",
2615
              "        (inner_attn): SelfAttention(\n",
2616
              "          (drop): Dropout(p=0.0, inplace=False)\n",
2617
              "        )\n",
2618
              "        (inner_cross_attn): CrossAttention(\n",
2619
              "          (drop): Dropout(p=0.0, inplace=False)\n",
2620
              "        )\n",
2621
              "      )\n",
2622
              "      (mlp): MLP(\n",
2623
              "        (fc1): Linear(in_features=2048, out_features=8192, bias=True)\n",
2624
              "        (fc2): Linear(in_features=8192, out_features=2048, bias=True)\n",
2625
              "        (act): NewGELUActivation()\n",
2626
              "      )\n",
2627
              "    )\n",
2628
              "    (9): ParallelBlock(\n",
2629
              "      (ln): LayerNorm((2048,), eps=1e-05, elementwise_affine=True)\n",
2630
              "      (resid_dropout): Dropout(p=0.0, inplace=False)\n",
2631
              "      (mixer): MHA(\n",
2632
              "        (rotary_emb): RotaryEmbedding()\n",
2633
              "        (Wqkv): Linear(in_features=2048, out_features=6144, bias=True)\n",
2634
              "        (out_proj): Linear(in_features=2048, out_features=2048, bias=True)\n",
2635
              "        (inner_attn): SelfAttention(\n",
2636
              "          (drop): Dropout(p=0.0, inplace=False)\n",
2637
              "        )\n",
2638
              "        (inner_cross_attn): CrossAttention(\n",
2639
              "          (drop): Dropout(p=0.0, inplace=False)\n",
2640
              "        )\n",
2641
              "      )\n",
2642
              "      (mlp): MLP(\n",
2643
              "        (fc1): Linear(in_features=2048, out_features=8192, bias=True)\n",
2644
              "        (fc2): Linear(in_features=8192, out_features=2048, bias=True)\n",
2645
              "        (act): NewGELUActivation()\n",
2646
              "      )\n",
2647
              "    )\n",
2648
              "    (10): ParallelBlock(\n",
2649
              "      (ln): LayerNorm((2048,), eps=1e-05, elementwise_affine=True)\n",
2650
              "      (resid_dropout): Dropout(p=0.0, inplace=False)\n",
2651
              "      (mixer): MHA(\n",
2652
              "        (rotary_emb): RotaryEmbedding()\n",
2653
              "        (Wqkv): Linear(in_features=2048, out_features=6144, bias=True)\n",
2654
              "        (out_proj): Linear(in_features=2048, out_features=2048, bias=True)\n",
2655
              "        (inner_attn): SelfAttention(\n",
2656
              "          (drop): Dropout(p=0.0, inplace=False)\n",
2657
              "        )\n",
2658
              "        (inner_cross_attn): CrossAttention(\n",
2659
              "          (drop): Dropout(p=0.0, inplace=False)\n",
2660
              "        )\n",
2661
              "      )\n",
2662
              "      (mlp): MLP(\n",
2663
              "        (fc1): Linear(in_features=2048, out_features=8192, bias=True)\n",
2664
              "        (fc2): Linear(in_features=8192, out_features=2048, bias=True)\n",
2665
              "        (act): NewGELUActivation()\n",
2666
              "      )\n",
2667
              "    )\n",
2668
              "    (11): ParallelBlock(\n",
2669
              "      (ln): LayerNorm((2048,), eps=1e-05, elementwise_affine=True)\n",
2670
              "      (resid_dropout): Dropout(p=0.0, inplace=False)\n",
2671
              "      (mixer): MHA(\n",
2672
              "        (rotary_emb): RotaryEmbedding()\n",
2673
              "        (Wqkv): Linear(in_features=2048, out_features=6144, bias=True)\n",
2674
              "        (out_proj): Linear(in_features=2048, out_features=2048, bias=True)\n",
2675
              "        (inner_attn): SelfAttention(\n",
2676
              "          (drop): Dropout(p=0.0, inplace=False)\n",
2677
              "        )\n",
2678
              "        (inner_cross_attn): CrossAttention(\n",
2679
              "          (drop): Dropout(p=0.0, inplace=False)\n",
2680
              "        )\n",
2681
              "      )\n",
2682
              "      (mlp): MLP(\n",
2683
              "        (fc1): Linear(in_features=2048, out_features=8192, bias=True)\n",
2684
              "        (fc2): Linear(in_features=8192, out_features=2048, bias=True)\n",
2685
              "        (act): NewGELUActivation()\n",
2686
              "      )\n",
2687
              "    )\n",
2688
              "    (12): ParallelBlock(\n",
2689
              "      (ln): LayerNorm((2048,), eps=1e-05, elementwise_affine=True)\n",
2690
              "      (resid_dropout): Dropout(p=0.0, inplace=False)\n",
2691
              "      (mixer): MHA(\n",
2692
              "        (rotary_emb): RotaryEmbedding()\n",
2693
              "        (Wqkv): Linear(in_features=2048, out_features=6144, bias=True)\n",
2694
              "        (out_proj): Linear(in_features=2048, out_features=2048, bias=True)\n",
2695
              "        (inner_attn): SelfAttention(\n",
2696
              "          (drop): Dropout(p=0.0, inplace=False)\n",
2697
              "        )\n",
2698
              "        (inner_cross_attn): CrossAttention(\n",
2699
              "          (drop): Dropout(p=0.0, inplace=False)\n",
2700
              "        )\n",
2701
              "      )\n",
2702
              "      (mlp): MLP(\n",
2703
              "        (fc1): Linear(in_features=2048, out_features=8192, bias=True)\n",
2704
              "        (fc2): Linear(in_features=8192, out_features=2048, bias=True)\n",
2705
              "        (act): NewGELUActivation()\n",
2706
              "      )\n",
2707
              "    )\n",
2708
              "    (13): ParallelBlock(\n",
2709
              "      (ln): LayerNorm((2048,), eps=1e-05, elementwise_affine=True)\n",
2710
              "      (resid_dropout): Dropout(p=0.0, inplace=False)\n",
2711
              "      (mixer): MHA(\n",
2712
              "        (rotary_emb): RotaryEmbedding()\n",
2713
              "        (Wqkv): Linear(in_features=2048, out_features=6144, bias=True)\n",
2714
              "        (out_proj): Linear(in_features=2048, out_features=2048, bias=True)\n",
2715
              "        (inner_attn): SelfAttention(\n",
2716
              "          (drop): Dropout(p=0.0, inplace=False)\n",
2717
              "        )\n",
2718
              "        (inner_cross_attn): CrossAttention(\n",
2719
              "          (drop): Dropout(p=0.0, inplace=False)\n",
2720
              "        )\n",
2721
              "      )\n",
2722
              "      (mlp): MLP(\n",
2723
              "        (fc1): Linear(in_features=2048, out_features=8192, bias=True)\n",
2724
              "        (fc2): Linear(in_features=8192, out_features=2048, bias=True)\n",
2725
              "        (act): NewGELUActivation()\n",
2726
              "      )\n",
2727
              "    )\n",
2728
              "    (14): ParallelBlock(\n",
2729
              "      (ln): LayerNorm((2048,), eps=1e-05, elementwise_affine=True)\n",
2730
              "      (resid_dropout): Dropout(p=0.0, inplace=False)\n",
2731
              "      (mixer): MHA(\n",
2732
              "        (rotary_emb): RotaryEmbedding()\n",
2733
              "        (Wqkv): Linear(in_features=2048, out_features=6144, bias=True)\n",
2734
              "        (out_proj): Linear(in_features=2048, out_features=2048, bias=True)\n",
2735
              "        (inner_attn): SelfAttention(\n",
2736
              "          (drop): Dropout(p=0.0, inplace=False)\n",
2737
              "        )\n",
2738
              "        (inner_cross_attn): CrossAttention(\n",
2739
              "          (drop): Dropout(p=0.0, inplace=False)\n",
2740
              "        )\n",
2741
              "      )\n",
2742
              "      (mlp): MLP(\n",
2743
              "        (fc1): Linear(in_features=2048, out_features=8192, bias=True)\n",
2744
              "        (fc2): Linear(in_features=8192, out_features=2048, bias=True)\n",
2745
              "        (act): NewGELUActivation()\n",
2746
              "      )\n",
2747
              "    )\n",
2748
              "    (15): ParallelBlock(\n",
2749
              "      (ln): LayerNorm((2048,), eps=1e-05, elementwise_affine=True)\n",
2750
              "      (resid_dropout): Dropout(p=0.0, inplace=False)\n",
2751
              "      (mixer): MHA(\n",
2752
              "        (rotary_emb): RotaryEmbedding()\n",
2753
              "        (Wqkv): Linear(in_features=2048, out_features=6144, bias=True)\n",
2754
              "        (out_proj): Linear(in_features=2048, out_features=2048, bias=True)\n",
2755
              "        (inner_attn): SelfAttention(\n",
2756
              "          (drop): Dropout(p=0.0, inplace=False)\n",
2757
              "        )\n",
2758
              "        (inner_cross_attn): CrossAttention(\n",
2759
              "          (drop): Dropout(p=0.0, inplace=False)\n",
2760
              "        )\n",
2761
              "      )\n",
2762
              "      (mlp): MLP(\n",
2763
              "        (fc1): Linear(in_features=2048, out_features=8192, bias=True)\n",
2764
              "        (fc2): Linear(in_features=8192, out_features=2048, bias=True)\n",
2765
              "        (act): NewGELUActivation()\n",
2766
              "      )\n",
2767
              "    )\n",
2768
              "    (16): ParallelBlock(\n",
2769
              "      (ln): LayerNorm((2048,), eps=1e-05, elementwise_affine=True)\n",
2770
              "      (resid_dropout): Dropout(p=0.0, inplace=False)\n",
2771
              "      (mixer): MHA(\n",
2772
              "        (rotary_emb): RotaryEmbedding()\n",
2773
              "        (Wqkv): Linear(in_features=2048, out_features=6144, bias=True)\n",
2774
              "        (out_proj): Linear(in_features=2048, out_features=2048, bias=True)\n",
2775
              "        (inner_attn): SelfAttention(\n",
2776
              "          (drop): Dropout(p=0.0, inplace=False)\n",
2777
              "        )\n",
2778
              "        (inner_cross_attn): CrossAttention(\n",
2779
              "          (drop): Dropout(p=0.0, inplace=False)\n",
2780
              "        )\n",
2781
              "      )\n",
2782
              "      (mlp): MLP(\n",
2783
              "        (fc1): Linear(in_features=2048, out_features=8192, bias=True)\n",
2784
              "        (fc2): Linear(in_features=8192, out_features=2048, bias=True)\n",
2785
              "        (act): NewGELUActivation()\n",
2786
              "      )\n",
2787
              "    )\n",
2788
              "    (17): ParallelBlock(\n",
2789
              "      (ln): LayerNorm((2048,), eps=1e-05, elementwise_affine=True)\n",
2790
              "      (resid_dropout): Dropout(p=0.0, inplace=False)\n",
2791
              "      (mixer): MHA(\n",
2792
              "        (rotary_emb): RotaryEmbedding()\n",
2793
              "        (Wqkv): Linear(in_features=2048, out_features=6144, bias=True)\n",
2794
              "        (out_proj): Linear(in_features=2048, out_features=2048, bias=True)\n",
2795
              "        (inner_attn): SelfAttention(\n",
2796
              "          (drop): Dropout(p=0.0, inplace=False)\n",
2797
              "        )\n",
2798
              "        (inner_cross_attn): CrossAttention(\n",
2799
              "          (drop): Dropout(p=0.0, inplace=False)\n",
2800
              "        )\n",
2801
              "      )\n",
2802
              "      (mlp): MLP(\n",
2803
              "        (fc1): Linear(in_features=2048, out_features=8192, bias=True)\n",
2804
              "        (fc2): Linear(in_features=8192, out_features=2048, bias=True)\n",
2805
              "        (act): NewGELUActivation()\n",
2806
              "      )\n",
2807
              "    )\n",
2808
              "    (18): ParallelBlock(\n",
2809
              "      (ln): LayerNorm((2048,), eps=1e-05, elementwise_affine=True)\n",
2810
              "      (resid_dropout): Dropout(p=0.0, inplace=False)\n",
2811
              "      (mixer): MHA(\n",
2812
              "        (rotary_emb): RotaryEmbedding()\n",
2813
              "        (Wqkv): Linear(in_features=2048, out_features=6144, bias=True)\n",
2814
              "        (out_proj): Linear(in_features=2048, out_features=2048, bias=True)\n",
2815
              "        (inner_attn): SelfAttention(\n",
2816
              "          (drop): Dropout(p=0.0, inplace=False)\n",
2817
              "        )\n",
2818
              "        (inner_cross_attn): CrossAttention(\n",
2819
              "          (drop): Dropout(p=0.0, inplace=False)\n",
2820
              "        )\n",
2821
              "      )\n",
2822
              "      (mlp): MLP(\n",
2823
              "        (fc1): Linear(in_features=2048, out_features=8192, bias=True)\n",
2824
              "        (fc2): Linear(in_features=8192, out_features=2048, bias=True)\n",
2825
              "        (act): NewGELUActivation()\n",
2826
              "      )\n",
2827
              "    )\n",
2828
              "    (19): ParallelBlock(\n",
2829
              "      (ln): LayerNorm((2048,), eps=1e-05, elementwise_affine=True)\n",
2830
              "      (resid_dropout): Dropout(p=0.0, inplace=False)\n",
2831
              "      (mixer): MHA(\n",
2832
              "        (rotary_emb): RotaryEmbedding()\n",
2833
              "        (Wqkv): Linear(in_features=2048, out_features=6144, bias=True)\n",
2834
              "        (out_proj): Linear(in_features=2048, out_features=2048, bias=True)\n",
2835
              "        (inner_attn): SelfAttention(\n",
2836
              "          (drop): Dropout(p=0.0, inplace=False)\n",
2837
              "        )\n",
2838
              "        (inner_cross_attn): CrossAttention(\n",
2839
              "          (drop): Dropout(p=0.0, inplace=False)\n",
2840
              "        )\n",
2841
              "      )\n",
2842
              "      (mlp): MLP(\n",
2843
              "        (fc1): Linear(in_features=2048, out_features=8192, bias=True)\n",
2844
              "        (fc2): Linear(in_features=8192, out_features=2048, bias=True)\n",
2845
              "        (act): NewGELUActivation()\n",
2846
              "      )\n",
2847
              "    )\n",
2848
              "    (20): ParallelBlock(\n",
2849
              "      (ln): LayerNorm((2048,), eps=1e-05, elementwise_affine=True)\n",
2850
              "      (resid_dropout): Dropout(p=0.0, inplace=False)\n",
2851
              "      (mixer): MHA(\n",
2852
              "        (rotary_emb): RotaryEmbedding()\n",
2853
              "        (Wqkv): Linear(in_features=2048, out_features=6144, bias=True)\n",
2854
              "        (out_proj): Linear(in_features=2048, out_features=2048, bias=True)\n",
2855
              "        (inner_attn): SelfAttention(\n",
2856
              "          (drop): Dropout(p=0.0, inplace=False)\n",
2857
              "        )\n",
2858
              "        (inner_cross_attn): CrossAttention(\n",
2859
              "          (drop): Dropout(p=0.0, inplace=False)\n",
2860
              "        )\n",
2861
              "      )\n",
2862
              "      (mlp): MLP(\n",
2863
              "        (fc1): Linear(in_features=2048, out_features=8192, bias=True)\n",
2864
              "        (fc2): Linear(in_features=8192, out_features=2048, bias=True)\n",
2865
              "        (act): NewGELUActivation()\n",
2866
              "      )\n",
2867
              "    )\n",
2868
              "    (21): ParallelBlock(\n",
2869
              "      (ln): LayerNorm((2048,), eps=1e-05, elementwise_affine=True)\n",
2870
              "      (resid_dropout): Dropout(p=0.0, inplace=False)\n",
2871
              "      (mixer): MHA(\n",
2872
              "        (rotary_emb): RotaryEmbedding()\n",
2873
              "        (Wqkv): Linear(in_features=2048, out_features=6144, bias=True)\n",
2874
              "        (out_proj): Linear(in_features=2048, out_features=2048, bias=True)\n",
2875
              "        (inner_attn): SelfAttention(\n",
2876
              "          (drop): Dropout(p=0.0, inplace=False)\n",
2877
              "        )\n",
2878
              "        (inner_cross_attn): CrossAttention(\n",
2879
              "          (drop): Dropout(p=0.0, inplace=False)\n",
2880
              "        )\n",
2881
              "      )\n",
2882
              "      (mlp): MLP(\n",
2883
              "        (fc1): Linear(in_features=2048, out_features=8192, bias=True)\n",
2884
              "        (fc2): Linear(in_features=8192, out_features=2048, bias=True)\n",
2885
              "        (act): NewGELUActivation()\n",
2886
              "      )\n",
2887
              "    )\n",
2888
              "    (22): ParallelBlock(\n",
2889
              "      (ln): LayerNorm((2048,), eps=1e-05, elementwise_affine=True)\n",
2890
              "      (resid_dropout): Dropout(p=0.0, inplace=False)\n",
2891
              "      (mixer): MHA(\n",
2892
              "        (rotary_emb): RotaryEmbedding()\n",
2893
              "        (Wqkv): Linear(in_features=2048, out_features=6144, bias=True)\n",
2894
              "        (out_proj): Linear(in_features=2048, out_features=2048, bias=True)\n",
2895
              "        (inner_attn): SelfAttention(\n",
2896
              "          (drop): Dropout(p=0.0, inplace=False)\n",
2897
              "        )\n",
2898
              "        (inner_cross_attn): CrossAttention(\n",
2899
              "          (drop): Dropout(p=0.0, inplace=False)\n",
2900
              "        )\n",
2901
              "      )\n",
2902
              "      (mlp): MLP(\n",
2903
              "        (fc1): Linear(in_features=2048, out_features=8192, bias=True)\n",
2904
              "        (fc2): Linear(in_features=8192, out_features=2048, bias=True)\n",
2905
              "        (act): NewGELUActivation()\n",
2906
              "      )\n",
2907
              "    )\n",
2908
              "    (23): ParallelBlock(\n",
2909
              "      (ln): LayerNorm((2048,), eps=1e-05, elementwise_affine=True)\n",
2910
              "      (resid_dropout): Dropout(p=0.0, inplace=False)\n",
2911
              "      (mixer): MHA(\n",
2912
              "        (rotary_emb): RotaryEmbedding()\n",
2913
              "        (Wqkv): Linear(in_features=2048, out_features=6144, bias=True)\n",
2914
              "        (out_proj): Linear(in_features=2048, out_features=2048, bias=True)\n",
2915
              "        (inner_attn): SelfAttention(\n",
2916
              "          (drop): Dropout(p=0.0, inplace=False)\n",
2917
              "        )\n",
2918
              "        (inner_cross_attn): CrossAttention(\n",
2919
              "          (drop): Dropout(p=0.0, inplace=False)\n",
2920
              "        )\n",
2921
              "      )\n",
2922
              "      (mlp): MLP(\n",
2923
              "        (fc1): Linear(in_features=2048, out_features=8192, bias=True)\n",
2924
              "        (fc2): Linear(in_features=8192, out_features=2048, bias=True)\n",
2925
              "        (act): NewGELUActivation()\n",
2926
              "      )\n",
2927
              "    )\n",
2928
              "    (24): ParallelBlock(\n",
2929
              "      (ln): LayerNorm((2048,), eps=1e-05, elementwise_affine=True)\n",
2930
              "      (resid_dropout): Dropout(p=0.0, inplace=False)\n",
2931
              "      (mixer): MHA(\n",
2932
              "        (rotary_emb): RotaryEmbedding()\n",
2933
              "        (Wqkv): Linear(in_features=2048, out_features=6144, bias=True)\n",
2934
              "        (out_proj): Linear(in_features=2048, out_features=2048, bias=True)\n",
2935
              "        (inner_attn): SelfAttention(\n",
2936
              "          (drop): Dropout(p=0.0, inplace=False)\n",
2937
              "        )\n",
2938
              "        (inner_cross_attn): CrossAttention(\n",
2939
              "          (drop): Dropout(p=0.0, inplace=False)\n",
2940
              "        )\n",
2941
              "      )\n",
2942
              "      (mlp): MLP(\n",
2943
              "        (fc1): Linear(in_features=2048, out_features=8192, bias=True)\n",
2944
              "        (fc2): Linear(in_features=8192, out_features=2048, bias=True)\n",
2945
              "        (act): NewGELUActivation()\n",
2946
              "      )\n",
2947
              "    )\n",
2948
              "    (25): CausalLMHead(\n",
2949
              "      (ln): LayerNorm((2048,), eps=1e-05, elementwise_affine=True)\n",
2950
              "      (linear): Linear(in_features=2048, out_features=51200, bias=True)\n",
2951
              "    )\n",
2952
              "  )\n",
2953
              "  (loss): CausalLMLoss(\n",
2954
              "    (loss_fct): CrossEntropyLoss()\n",
2955
              "  )\n",
2956
              ")"
2957
            ]
2958
          },
2959
          "metadata": {},
2960
          "execution_count": 1
2961
        }
2962
      ]
2963
    },
2964
    {
2965
      "cell_type": "code",
2966
      "source": [
2967
        "import torch\n",
2968
        "from transformers import AutoModelForCausalLM, AutoTokenizer\n",
2969
        "\n",
2970
        "model = AutoModelForCausalLM.from_pretrained(\"ashishpatel26/phi-1_5-finetuned-dialogstudio\", trust_remote_code=True, torch_dtype=torch.float32)\n",
2971
        "tokenizer = AutoTokenizer.from_pretrained(\"microsoft/phi-1_5\", trust_remote_code=True)\n",
2972
        "inputs = tokenizer(f'''{dataset[\"test\"]['text'][0]}''', return_tensors=\"pt\", return_attention_mask=False)\n",
2973
        "\n",
2974
        "outputs = model.generate(**inputs, max_length=512)\n",
2975
        "text = tokenizer.batch_decode(outputs)[0]\n",
2976
        "print(text)"
2977
      ],
2978
      "metadata": {
2979
        "id": "vpbzxK0zhHk8"
2980
      },
2981
      "execution_count": null,
2982
      "outputs": []
2983
    },
2984
    {
2985
      "cell_type": "code",
2986
      "source": [
2987
        "# dataset[\"test\"]['text'][0]"
2988
      ],
2989
      "metadata": {
2990
        "colab": {
2991
          "base_uri": "https://localhost:8080/",
2992
          "height": 139
2993
        },
2994
        "id": "oU9augJbhm44",
2995
        "outputId": "f85452c7-96a7-47e0-d3e8-52a7b12573aa"
2996
      },
2997
      "execution_count": 19,
2998
      "outputs": [
2999
        {
3000
          "output_type": "execute_result",
3001
          "data": {
3002
            "text/plain": [
3003
              "'### Instruction: Below is a conversation between a human and an AI agent. Write a summary of the conversation.\\n\\n### Input:\\nuser: looking to change my flight Friday, Oct 27. GRMSKV to DL4728 from SLC to ORD. Is that an option and what is the cost? Jess\\nagent: The difference in fare is $185.30. This would include all airport taxes and fees. The ticket is non-refundable changeable with a fee, *ALS and may result in additional fare collection for changes when making a future changes. *ALS\\nuser: I had a first class seat purchased for the original flight, would that be the same with this flight to Chicago?\\nagent: Hello, Jess. That is the fare difference. You will have to call us at 1 800 221 1212 to make any changes. It is in First class. *TAY\\nuser: thx\\nagent: Our pleasure. *ALS\\nuser: Do I have to call or is there a means to do this online?\\nagent: You can call or you can login to your trip on our website to make changes. *TJE\\n\\n### Response:\\nCustomer is looking to change the flight on Friday Oct 27 is that an option and asking about cost. Agent replying that there is an difference in fare and this would include all airport taxes and fees and ticket is non refundable changeable with a fee.'"
3004
            ],
3005
            "application/vnd.google.colaboratory.intrinsic+json": {
3006
              "type": "string"
3007
            }
3008
          },
3009
          "metadata": {},
3010
          "execution_count": 19
3011
        }
3012
      ]
3013
    },
3014
    {
3015
      "cell_type": "markdown",
3016
      "metadata": {
3017
        "id": "pfxoP-IvnheQ"
3018
      },
3019
      "source": [
3020
        "## References\n",
3021
        "\n",
3022
        "- https://huggingface.co/datasets/Salesforce/dialogstudio\n",
3023
        "- https://huggingface.co/meta-llama/Llama-2-7b-hf"
3024
      ]
3025
    }
3026
  ],
3027
  "metadata": {
3028
    "accelerator": "GPU",
3029
    "colab": {
3030
      "provenance": [],
3031
      "gpuType": "T4",
3032
      "include_colab_link": true
3033
    },
3034
    "kernelspec": {
3035
      "display_name": "Python 3",
3036
      "name": "python3"
3037
    },
3038
    "language_info": {
3039
      "name": "python"
3040
    },
3041
    "widgets": {
3042
      "application/vnd.jupyter.widget-state+json": {
3043
        "96ef5be98b5c4f2c9945b1a8c0989d7b": {
3044
          "model_module": "@jupyter-widgets/controls",
3045
          "model_name": "VBoxModel",
3046
          "model_module_version": "1.5.0",
3047
          "state": {
3048
            "_dom_classes": [],
3049
            "_model_module": "@jupyter-widgets/controls",
3050
            "_model_module_version": "1.5.0",
3051
            "_model_name": "VBoxModel",
3052
            "_view_count": null,
3053
            "_view_module": "@jupyter-widgets/controls",
3054
            "_view_module_version": "1.5.0",
3055
            "_view_name": "VBoxView",
3056
            "box_style": "",
3057
            "children": [
3058
              "IPY_MODEL_2cf7de58a08f4a10a0388fd5284adc61",
3059
              "IPY_MODEL_3e55c582114c43d19f9a88819739d9a5",
3060
              "IPY_MODEL_cdd259b528bf4cd7b1c2f834cec0372d",
3061
              "IPY_MODEL_1440bf6528a844f399aea3997b0348ba"
3062
            ],
3063
            "layout": "IPY_MODEL_a68cf26cf964423b8ce413bc6c8c5299"
3064
          }
3065
        },
3066
        "29aca8e4365b4bee99d5292d8e74cdd6": {
3067
          "model_module": "@jupyter-widgets/controls",
3068
          "model_name": "HTMLModel",
3069
          "model_module_version": "1.5.0",
3070
          "state": {
3071
            "_dom_classes": [],
3072
            "_model_module": "@jupyter-widgets/controls",
3073
            "_model_module_version": "1.5.0",
3074
            "_model_name": "HTMLModel",
3075
            "_view_count": null,
3076
            "_view_module": "@jupyter-widgets/controls",
3077
            "_view_module_version": "1.5.0",
3078
            "_view_name": "HTMLView",
3079
            "description": "",
3080
            "description_tooltip": null,
3081
            "layout": "IPY_MODEL_ed2f736177914d2abb1c2efb6ecce6bb",
3082
            "placeholder": "​",
3083
            "style": "IPY_MODEL_6c2ff22a40b543b6ac26ccd2b7298a61",
3084
            "value": "<center> <img\nsrc=https://huggingface.co/front/assets/huggingface_logo-noborder.svg\nalt='Hugging Face'> <br> Copy a token from <a\nhref=\"https://huggingface.co/settings/tokens\" target=\"_blank\">your Hugging Face\ntokens page</a> and paste it below. <br> Immediately click login after copying\nyour token or it might be stored in plain text in this notebook file. </center>"
3085
          }
3086
        },
3087
        "c83294f6ba864858a05d5222d84eb0c3": {
3088
          "model_module": "@jupyter-widgets/controls",
3089
          "model_name": "PasswordModel",
3090
          "model_module_version": "1.5.0",
3091
          "state": {
3092
            "_dom_classes": [],
3093
            "_model_module": "@jupyter-widgets/controls",
3094
            "_model_module_version": "1.5.0",
3095
            "_model_name": "PasswordModel",
3096
            "_view_count": null,
3097
            "_view_module": "@jupyter-widgets/controls",
3098
            "_view_module_version": "1.5.0",
3099
            "_view_name": "PasswordView",
3100
            "continuous_update": true,
3101
            "description": "Token:",
3102
            "description_tooltip": null,
3103
            "disabled": false,
3104
            "layout": "IPY_MODEL_bb5fc1bf3f4c465e8b0846f22e71a23b",
3105
            "placeholder": "​",
3106
            "style": "IPY_MODEL_42cae2119e5e49b9b7250a6f96f373bc",
3107
            "value": ""
3108
          }
3109
        },
3110
        "7254587396ba4701835ee666ee3b697b": {
3111
          "model_module": "@jupyter-widgets/controls",
3112
          "model_name": "CheckboxModel",
3113
          "model_module_version": "1.5.0",
3114
          "state": {
3115
            "_dom_classes": [],
3116
            "_model_module": "@jupyter-widgets/controls",
3117
            "_model_module_version": "1.5.0",
3118
            "_model_name": "CheckboxModel",
3119
            "_view_count": null,
3120
            "_view_module": "@jupyter-widgets/controls",
3121
            "_view_module_version": "1.5.0",
3122
            "_view_name": "CheckboxView",
3123
            "description": "Add token as git credential?",
3124
            "description_tooltip": null,
3125
            "disabled": false,
3126
            "indent": true,
3127
            "layout": "IPY_MODEL_8701e3ece5b04773a157dacc8f793374",
3128
            "style": "IPY_MODEL_b3b75ce135e049bbacd598eac3d579ce",
3129
            "value": true
3130
          }
3131
        },
3132
        "896def48ce8148f18a13b0a46d0919b3": {
3133
          "model_module": "@jupyter-widgets/controls",
3134
          "model_name": "ButtonModel",
3135
          "model_module_version": "1.5.0",
3136
          "state": {
3137
            "_dom_classes": [],
3138
            "_model_module": "@jupyter-widgets/controls",
3139
            "_model_module_version": "1.5.0",
3140
            "_model_name": "ButtonModel",
3141
            "_view_count": null,
3142
            "_view_module": "@jupyter-widgets/controls",
3143
            "_view_module_version": "1.5.0",
3144
            "_view_name": "ButtonView",
3145
            "button_style": "",
3146
            "description": "Login",
3147
            "disabled": false,
3148
            "icon": "",
3149
            "layout": "IPY_MODEL_6bb60bf24297418384b709e106c6c71a",
3150
            "style": "IPY_MODEL_4b209751747c4ff98d905702b4ba3ab6",
3151
            "tooltip": ""
3152
          }
3153
        },
3154
        "5bce118ef58b43b6ab295e6272d84668": {
3155
          "model_module": "@jupyter-widgets/controls",
3156
          "model_name": "HTMLModel",
3157
          "model_module_version": "1.5.0",
3158
          "state": {
3159
            "_dom_classes": [],
3160
            "_model_module": "@jupyter-widgets/controls",
3161
            "_model_module_version": "1.5.0",
3162
            "_model_name": "HTMLModel",
3163
            "_view_count": null,
3164
            "_view_module": "@jupyter-widgets/controls",
3165
            "_view_module_version": "1.5.0",
3166
            "_view_name": "HTMLView",
3167
            "description": "",
3168
            "description_tooltip": null,
3169
            "layout": "IPY_MODEL_ca3fcc5229864c2d8030b8e1bce3680a",
3170
            "placeholder": "​",
3171
            "style": "IPY_MODEL_e43a98b2e5ba41a5a483c9320f982960",
3172
            "value": "\n<b>Pro Tip:</b> If you don't already have one, you can create a dedicated\n'notebooks' token with 'write' access, that you can then easily reuse for all\nnotebooks. </center>"
3173
          }
3174
        },
3175
        "a68cf26cf964423b8ce413bc6c8c5299": {
3176
          "model_module": "@jupyter-widgets/base",
3177
          "model_name": "LayoutModel",
3178
          "model_module_version": "1.2.0",
3179
          "state": {
3180
            "_model_module": "@jupyter-widgets/base",
3181
            "_model_module_version": "1.2.0",
3182
            "_model_name": "LayoutModel",
3183
            "_view_count": null,
3184
            "_view_module": "@jupyter-widgets/base",
3185
            "_view_module_version": "1.2.0",
3186
            "_view_name": "LayoutView",
3187
            "align_content": null,
3188
            "align_items": "center",
3189
            "align_self": null,
3190
            "border": null,
3191
            "bottom": null,
3192
            "display": "flex",
3193
            "flex": null,
3194
            "flex_flow": "column",
3195
            "grid_area": null,
3196
            "grid_auto_columns": null,
3197
            "grid_auto_flow": null,
3198
            "grid_auto_rows": null,
3199
            "grid_column": null,
3200
            "grid_gap": null,
3201
            "grid_row": null,
3202
            "grid_template_areas": null,
3203
            "grid_template_columns": null,
3204
            "grid_template_rows": null,
3205
            "height": null,
3206
            "justify_content": null,
3207
            "justify_items": null,
3208
            "left": null,
3209
            "margin": null,
3210
            "max_height": null,
3211
            "max_width": null,
3212
            "min_height": null,
3213
            "min_width": null,
3214
            "object_fit": null,
3215
            "object_position": null,
3216
            "order": null,
3217
            "overflow": null,
3218
            "overflow_x": null,
3219
            "overflow_y": null,
3220
            "padding": null,
3221
            "right": null,
3222
            "top": null,
3223
            "visibility": null,
3224
            "width": "50%"
3225
          }
3226
        },
3227
        "ed2f736177914d2abb1c2efb6ecce6bb": {
3228
          "model_module": "@jupyter-widgets/base",
3229
          "model_name": "LayoutModel",
3230
          "model_module_version": "1.2.0",
3231
          "state": {
3232
            "_model_module": "@jupyter-widgets/base",
3233
            "_model_module_version": "1.2.0",
3234
            "_model_name": "LayoutModel",
3235
            "_view_count": null,
3236
            "_view_module": "@jupyter-widgets/base",
3237
            "_view_module_version": "1.2.0",
3238
            "_view_name": "LayoutView",
3239
            "align_content": null,
3240
            "align_items": null,
3241
            "align_self": null,
3242
            "border": null,
3243
            "bottom": null,
3244
            "display": null,
3245
            "flex": null,
3246
            "flex_flow": null,
3247
            "grid_area": null,
3248
            "grid_auto_columns": null,
3249
            "grid_auto_flow": null,
3250
            "grid_auto_rows": null,
3251
            "grid_column": null,
3252
            "grid_gap": null,
3253
            "grid_row": null,
3254
            "grid_template_areas": null,
3255
            "grid_template_columns": null,
3256
            "grid_template_rows": null,
3257
            "height": null,
3258
            "justify_content": null,
3259
            "justify_items": null,
3260
            "left": null,
3261
            "margin": null,
3262
            "max_height": null,
3263
            "max_width": null,
3264
            "min_height": null,
3265
            "min_width": null,
3266
            "object_fit": null,
3267
            "object_position": null,
3268
            "order": null,
3269
            "overflow": null,
3270
            "overflow_x": null,
3271
            "overflow_y": null,
3272
            "padding": null,
3273
            "right": null,
3274
            "top": null,
3275
            "visibility": null,
3276
            "width": null
3277
          }
3278
        },
3279
        "6c2ff22a40b543b6ac26ccd2b7298a61": {
3280
          "model_module": "@jupyter-widgets/controls",
3281
          "model_name": "DescriptionStyleModel",
3282
          "model_module_version": "1.5.0",
3283
          "state": {
3284
            "_model_module": "@jupyter-widgets/controls",
3285
            "_model_module_version": "1.5.0",
3286
            "_model_name": "DescriptionStyleModel",
3287
            "_view_count": null,
3288
            "_view_module": "@jupyter-widgets/base",
3289
            "_view_module_version": "1.2.0",
3290
            "_view_name": "StyleView",
3291
            "description_width": ""
3292
          }
3293
        },
3294
        "bb5fc1bf3f4c465e8b0846f22e71a23b": {
3295
          "model_module": "@jupyter-widgets/base",
3296
          "model_name": "LayoutModel",
3297
          "model_module_version": "1.2.0",
3298
          "state": {
3299
            "_model_module": "@jupyter-widgets/base",
3300
            "_model_module_version": "1.2.0",
3301
            "_model_name": "LayoutModel",
3302
            "_view_count": null,
3303
            "_view_module": "@jupyter-widgets/base",
3304
            "_view_module_version": "1.2.0",
3305
            "_view_name": "LayoutView",
3306
            "align_content": null,
3307
            "align_items": null,
3308
            "align_self": null,
3309
            "border": null,
3310
            "bottom": null,
3311
            "display": null,
3312
            "flex": null,
3313
            "flex_flow": null,
3314
            "grid_area": null,
3315
            "grid_auto_columns": null,
3316
            "grid_auto_flow": null,
3317
            "grid_auto_rows": null,
3318
            "grid_column": null,
3319
            "grid_gap": null,
3320
            "grid_row": null,
3321
            "grid_template_areas": null,
3322
            "grid_template_columns": null,
3323
            "grid_template_rows": null,
3324
            "height": null,
3325
            "justify_content": null,
3326
            "justify_items": null,
3327
            "left": null,
3328
            "margin": null,
3329
            "max_height": null,
3330
            "max_width": null,
3331
            "min_height": null,
3332
            "min_width": null,
3333
            "object_fit": null,
3334
            "object_position": null,
3335
            "order": null,
3336
            "overflow": null,
3337
            "overflow_x": null,
3338
            "overflow_y": null,
3339
            "padding": null,
3340
            "right": null,
3341
            "top": null,
3342
            "visibility": null,
3343
            "width": null
3344
          }
3345
        },
3346
        "42cae2119e5e49b9b7250a6f96f373bc": {
3347
          "model_module": "@jupyter-widgets/controls",
3348
          "model_name": "DescriptionStyleModel",
3349
          "model_module_version": "1.5.0",
3350
          "state": {
3351
            "_model_module": "@jupyter-widgets/controls",
3352
            "_model_module_version": "1.5.0",
3353
            "_model_name": "DescriptionStyleModel",
3354
            "_view_count": null,
3355
            "_view_module": "@jupyter-widgets/base",
3356
            "_view_module_version": "1.2.0",
3357
            "_view_name": "StyleView",
3358
            "description_width": ""
3359
          }
3360
        },
3361
        "8701e3ece5b04773a157dacc8f793374": {
3362
          "model_module": "@jupyter-widgets/base",
3363
          "model_name": "LayoutModel",
3364
          "model_module_version": "1.2.0",
3365
          "state": {
3366
            "_model_module": "@jupyter-widgets/base",
3367
            "_model_module_version": "1.2.0",
3368
            "_model_name": "LayoutModel",
3369
            "_view_count": null,
3370
            "_view_module": "@jupyter-widgets/base",
3371
            "_view_module_version": "1.2.0",
3372
            "_view_name": "LayoutView",
3373
            "align_content": null,
3374
            "align_items": null,
3375
            "align_self": null,
3376
            "border": null,
3377
            "bottom": null,
3378
            "display": null,
3379
            "flex": null,
3380
            "flex_flow": null,
3381
            "grid_area": null,
3382
            "grid_auto_columns": null,
3383
            "grid_auto_flow": null,
3384
            "grid_auto_rows": null,
3385
            "grid_column": null,
3386
            "grid_gap": null,
3387
            "grid_row": null,
3388
            "grid_template_areas": null,
3389
            "grid_template_columns": null,
3390
            "grid_template_rows": null,
3391
            "height": null,
3392
            "justify_content": null,
3393
            "justify_items": null,
3394
            "left": null,
3395
            "margin": null,
3396
            "max_height": null,
3397
            "max_width": null,
3398
            "min_height": null,
3399
            "min_width": null,
3400
            "object_fit": null,
3401
            "object_position": null,
3402
            "order": null,
3403
            "overflow": null,
3404
            "overflow_x": null,
3405
            "overflow_y": null,
3406
            "padding": null,
3407
            "right": null,
3408
            "top": null,
3409
            "visibility": null,
3410
            "width": null
3411
          }
3412
        },
3413
        "b3b75ce135e049bbacd598eac3d579ce": {
3414
          "model_module": "@jupyter-widgets/controls",
3415
          "model_name": "DescriptionStyleModel",
3416
          "model_module_version": "1.5.0",
3417
          "state": {
3418
            "_model_module": "@jupyter-widgets/controls",
3419
            "_model_module_version": "1.5.0",
3420
            "_model_name": "DescriptionStyleModel",
3421
            "_view_count": null,
3422
            "_view_module": "@jupyter-widgets/base",
3423
            "_view_module_version": "1.2.0",
3424
            "_view_name": "StyleView",
3425
            "description_width": ""
3426
          }
3427
        },
3428
        "6bb60bf24297418384b709e106c6c71a": {
3429
          "model_module": "@jupyter-widgets/base",
3430
          "model_name": "LayoutModel",
3431
          "model_module_version": "1.2.0",
3432
          "state": {
3433
            "_model_module": "@jupyter-widgets/base",
3434
            "_model_module_version": "1.2.0",
3435
            "_model_name": "LayoutModel",
3436
            "_view_count": null,
3437
            "_view_module": "@jupyter-widgets/base",
3438
            "_view_module_version": "1.2.0",
3439
            "_view_name": "LayoutView",
3440
            "align_content": null,
3441
            "align_items": null,
3442
            "align_self": null,
3443
            "border": null,
3444
            "bottom": null,
3445
            "display": null,
3446
            "flex": null,
3447
            "flex_flow": null,
3448
            "grid_area": null,
3449
            "grid_auto_columns": null,
3450
            "grid_auto_flow": null,
3451
            "grid_auto_rows": null,
3452
            "grid_column": null,
3453
            "grid_gap": null,
3454
            "grid_row": null,
3455
            "grid_template_areas": null,
3456
            "grid_template_columns": null,
3457
            "grid_template_rows": null,
3458
            "height": null,
3459
            "justify_content": null,
3460
            "justify_items": null,
3461
            "left": null,
3462
            "margin": null,
3463
            "max_height": null,
3464
            "max_width": null,
3465
            "min_height": null,
3466
            "min_width": null,
3467
            "object_fit": null,
3468
            "object_position": null,
3469
            "order": null,
3470
            "overflow": null,
3471
            "overflow_x": null,
3472
            "overflow_y": null,
3473
            "padding": null,
3474
            "right": null,
3475
            "top": null,
3476
            "visibility": null,
3477
            "width": null
3478
          }
3479
        },
3480
        "4b209751747c4ff98d905702b4ba3ab6": {
3481
          "model_module": "@jupyter-widgets/controls",
3482
          "model_name": "ButtonStyleModel",
3483
          "model_module_version": "1.5.0",
3484
          "state": {
3485
            "_model_module": "@jupyter-widgets/controls",
3486
            "_model_module_version": "1.5.0",
3487
            "_model_name": "ButtonStyleModel",
3488
            "_view_count": null,
3489
            "_view_module": "@jupyter-widgets/base",
3490
            "_view_module_version": "1.2.0",
3491
            "_view_name": "StyleView",
3492
            "button_color": null,
3493
            "font_weight": ""
3494
          }
3495
        },
3496
        "ca3fcc5229864c2d8030b8e1bce3680a": {
3497
          "model_module": "@jupyter-widgets/base",
3498
          "model_name": "LayoutModel",
3499
          "model_module_version": "1.2.0",
3500
          "state": {
3501
            "_model_module": "@jupyter-widgets/base",
3502
            "_model_module_version": "1.2.0",
3503
            "_model_name": "LayoutModel",
3504
            "_view_count": null,
3505
            "_view_module": "@jupyter-widgets/base",
3506
            "_view_module_version": "1.2.0",
3507
            "_view_name": "LayoutView",
3508
            "align_content": null,
3509
            "align_items": null,
3510
            "align_self": null,
3511
            "border": null,
3512
            "bottom": null,
3513
            "display": null,
3514
            "flex": null,
3515
            "flex_flow": null,
3516
            "grid_area": null,
3517
            "grid_auto_columns": null,
3518
            "grid_auto_flow": null,
3519
            "grid_auto_rows": null,
3520
            "grid_column": null,
3521
            "grid_gap": null,
3522
            "grid_row": null,
3523
            "grid_template_areas": null,
3524
            "grid_template_columns": null,
3525
            "grid_template_rows": null,
3526
            "height": null,
3527
            "justify_content": null,
3528
            "justify_items": null,
3529
            "left": null,
3530
            "margin": null,
3531
            "max_height": null,
3532
            "max_width": null,
3533
            "min_height": null,
3534
            "min_width": null,
3535
            "object_fit": null,
3536
            "object_position": null,
3537
            "order": null,
3538
            "overflow": null,
3539
            "overflow_x": null,
3540
            "overflow_y": null,
3541
            "padding": null,
3542
            "right": null,
3543
            "top": null,
3544
            "visibility": null,
3545
            "width": null
3546
          }
3547
        },
3548
        "e43a98b2e5ba41a5a483c9320f982960": {
3549
          "model_module": "@jupyter-widgets/controls",
3550
          "model_name": "DescriptionStyleModel",
3551
          "model_module_version": "1.5.0",
3552
          "state": {
3553
            "_model_module": "@jupyter-widgets/controls",
3554
            "_model_module_version": "1.5.0",
3555
            "_model_name": "DescriptionStyleModel",
3556
            "_view_count": null,
3557
            "_view_module": "@jupyter-widgets/base",
3558
            "_view_module_version": "1.2.0",
3559
            "_view_name": "StyleView",
3560
            "description_width": ""
3561
          }
3562
        },
3563
        "f18eecc689234406a32b478a88379011": {
3564
          "model_module": "@jupyter-widgets/controls",
3565
          "model_name": "LabelModel",
3566
          "model_module_version": "1.5.0",
3567
          "state": {
3568
            "_dom_classes": [],
3569
            "_model_module": "@jupyter-widgets/controls",
3570
            "_model_module_version": "1.5.0",
3571
            "_model_name": "LabelModel",
3572
            "_view_count": null,
3573
            "_view_module": "@jupyter-widgets/controls",
3574
            "_view_module_version": "1.5.0",
3575
            "_view_name": "LabelView",
3576
            "description": "",
3577
            "description_tooltip": null,
3578
            "layout": "IPY_MODEL_dc6a98f4481a4d158ffd66d036d9d391",
3579
            "placeholder": "​",
3580
            "style": "IPY_MODEL_c3e8d37c64af4b1eaed0569fd32c3841",
3581
            "value": "Connecting..."
3582
          }
3583
        },
3584
        "dc6a98f4481a4d158ffd66d036d9d391": {
3585
          "model_module": "@jupyter-widgets/base",
3586
          "model_name": "LayoutModel",
3587
          "model_module_version": "1.2.0",
3588
          "state": {
3589
            "_model_module": "@jupyter-widgets/base",
3590
            "_model_module_version": "1.2.0",
3591
            "_model_name": "LayoutModel",
3592
            "_view_count": null,
3593
            "_view_module": "@jupyter-widgets/base",
3594
            "_view_module_version": "1.2.0",
3595
            "_view_name": "LayoutView",
3596
            "align_content": null,
3597
            "align_items": null,
3598
            "align_self": null,
3599
            "border": null,
3600
            "bottom": null,
3601
            "display": null,
3602
            "flex": null,
3603
            "flex_flow": null,
3604
            "grid_area": null,
3605
            "grid_auto_columns": null,
3606
            "grid_auto_flow": null,
3607
            "grid_auto_rows": null,
3608
            "grid_column": null,
3609
            "grid_gap": null,
3610
            "grid_row": null,
3611
            "grid_template_areas": null,
3612
            "grid_template_columns": null,
3613
            "grid_template_rows": null,
3614
            "height": null,
3615
            "justify_content": null,
3616
            "justify_items": null,
3617
            "left": null,
3618
            "margin": null,
3619
            "max_height": null,
3620
            "max_width": null,
3621
            "min_height": null,
3622
            "min_width": null,
3623
            "object_fit": null,
3624
            "object_position": null,
3625
            "order": null,
3626
            "overflow": null,
3627
            "overflow_x": null,
3628
            "overflow_y": null,
3629
            "padding": null,
3630
            "right": null,
3631
            "top": null,
3632
            "visibility": null,
3633
            "width": null
3634
          }
3635
        },
3636
        "c3e8d37c64af4b1eaed0569fd32c3841": {
3637
          "model_module": "@jupyter-widgets/controls",
3638
          "model_name": "DescriptionStyleModel",
3639
          "model_module_version": "1.5.0",
3640
          "state": {
3641
            "_model_module": "@jupyter-widgets/controls",
3642
            "_model_module_version": "1.5.0",
3643
            "_model_name": "DescriptionStyleModel",
3644
            "_view_count": null,
3645
            "_view_module": "@jupyter-widgets/base",
3646
            "_view_module_version": "1.2.0",
3647
            "_view_name": "StyleView",
3648
            "description_width": ""
3649
          }
3650
        },
3651
        "2cf7de58a08f4a10a0388fd5284adc61": {
3652
          "model_module": "@jupyter-widgets/controls",
3653
          "model_name": "LabelModel",
3654
          "model_module_version": "1.5.0",
3655
          "state": {
3656
            "_dom_classes": [],
3657
            "_model_module": "@jupyter-widgets/controls",
3658
            "_model_module_version": "1.5.0",
3659
            "_model_name": "LabelModel",
3660
            "_view_count": null,
3661
            "_view_module": "@jupyter-widgets/controls",
3662
            "_view_module_version": "1.5.0",
3663
            "_view_name": "LabelView",
3664
            "description": "",
3665
            "description_tooltip": null,
3666
            "layout": "IPY_MODEL_60af265316074adab78687ac53070910",
3667
            "placeholder": "​",
3668
            "style": "IPY_MODEL_1c9d8afeb2644c65909f6e689e1af0af",
3669
            "value": "Token is valid (permission: write)."
3670
          }
3671
        },
3672
        "3e55c582114c43d19f9a88819739d9a5": {
3673
          "model_module": "@jupyter-widgets/controls",
3674
          "model_name": "LabelModel",
3675
          "model_module_version": "1.5.0",
3676
          "state": {
3677
            "_dom_classes": [],
3678
            "_model_module": "@jupyter-widgets/controls",
3679
            "_model_module_version": "1.5.0",
3680
            "_model_name": "LabelModel",
3681
            "_view_count": null,
3682
            "_view_module": "@jupyter-widgets/controls",
3683
            "_view_module_version": "1.5.0",
3684
            "_view_name": "LabelView",
3685
            "description": "",
3686
            "description_tooltip": null,
3687
            "layout": "IPY_MODEL_06d7ce85d9784f58add0583feda74530",
3688
            "placeholder": "​",
3689
            "style": "IPY_MODEL_bcacfb2e6c464423b5e8bc0aef675fdd",
3690
            "value": "Your token has been saved in your configured git credential helpers (store)."
3691
          }
3692
        },
3693
        "cdd259b528bf4cd7b1c2f834cec0372d": {
3694
          "model_module": "@jupyter-widgets/controls",
3695
          "model_name": "LabelModel",
3696
          "model_module_version": "1.5.0",
3697
          "state": {
3698
            "_dom_classes": [],
3699
            "_model_module": "@jupyter-widgets/controls",
3700
            "_model_module_version": "1.5.0",
3701
            "_model_name": "LabelModel",
3702
            "_view_count": null,
3703
            "_view_module": "@jupyter-widgets/controls",
3704
            "_view_module_version": "1.5.0",
3705
            "_view_name": "LabelView",
3706
            "description": "",
3707
            "description_tooltip": null,
3708
            "layout": "IPY_MODEL_88c5cc8d66d8408cbe2bfedb365723f3",
3709
            "placeholder": "​",
3710
            "style": "IPY_MODEL_814bac58a4974f70b17b5e19f88b042f",
3711
            "value": "Your token has been saved to /root/.cache/huggingface/token"
3712
          }
3713
        },
3714
        "1440bf6528a844f399aea3997b0348ba": {
3715
          "model_module": "@jupyter-widgets/controls",
3716
          "model_name": "LabelModel",
3717
          "model_module_version": "1.5.0",
3718
          "state": {
3719
            "_dom_classes": [],
3720
            "_model_module": "@jupyter-widgets/controls",
3721
            "_model_module_version": "1.5.0",
3722
            "_model_name": "LabelModel",
3723
            "_view_count": null,
3724
            "_view_module": "@jupyter-widgets/controls",
3725
            "_view_module_version": "1.5.0",
3726
            "_view_name": "LabelView",
3727
            "description": "",
3728
            "description_tooltip": null,
3729
            "layout": "IPY_MODEL_3502bced8abc4cfc87300881857c4e08",
3730
            "placeholder": "​",
3731
            "style": "IPY_MODEL_c726307cdc3c4598ad45879f3f29e60c",
3732
            "value": "Login successful"
3733
          }
3734
        },
3735
        "60af265316074adab78687ac53070910": {
3736
          "model_module": "@jupyter-widgets/base",
3737
          "model_name": "LayoutModel",
3738
          "model_module_version": "1.2.0",
3739
          "state": {
3740
            "_model_module": "@jupyter-widgets/base",
3741
            "_model_module_version": "1.2.0",
3742
            "_model_name": "LayoutModel",
3743
            "_view_count": null,
3744
            "_view_module": "@jupyter-widgets/base",
3745
            "_view_module_version": "1.2.0",
3746
            "_view_name": "LayoutView",
3747
            "align_content": null,
3748
            "align_items": null,
3749
            "align_self": null,
3750
            "border": null,
3751
            "bottom": null,
3752
            "display": null,
3753
            "flex": null,
3754
            "flex_flow": null,
3755
            "grid_area": null,
3756
            "grid_auto_columns": null,
3757
            "grid_auto_flow": null,
3758
            "grid_auto_rows": null,
3759
            "grid_column": null,
3760
            "grid_gap": null,
3761
            "grid_row": null,
3762
            "grid_template_areas": null,
3763
            "grid_template_columns": null,
3764
            "grid_template_rows": null,
3765
            "height": null,
3766
            "justify_content": null,
3767
            "justify_items": null,
3768
            "left": null,
3769
            "margin": null,
3770
            "max_height": null,
3771
            "max_width": null,
3772
            "min_height": null,
3773
            "min_width": null,
3774
            "object_fit": null,
3775
            "object_position": null,
3776
            "order": null,
3777
            "overflow": null,
3778
            "overflow_x": null,
3779
            "overflow_y": null,
3780
            "padding": null,
3781
            "right": null,
3782
            "top": null,
3783
            "visibility": null,
3784
            "width": null
3785
          }
3786
        },
3787
        "1c9d8afeb2644c65909f6e689e1af0af": {
3788
          "model_module": "@jupyter-widgets/controls",
3789
          "model_name": "DescriptionStyleModel",
3790
          "model_module_version": "1.5.0",
3791
          "state": {
3792
            "_model_module": "@jupyter-widgets/controls",
3793
            "_model_module_version": "1.5.0",
3794
            "_model_name": "DescriptionStyleModel",
3795
            "_view_count": null,
3796
            "_view_module": "@jupyter-widgets/base",
3797
            "_view_module_version": "1.2.0",
3798
            "_view_name": "StyleView",
3799
            "description_width": ""
3800
          }
3801
        },
3802
        "06d7ce85d9784f58add0583feda74530": {
3803
          "model_module": "@jupyter-widgets/base",
3804
          "model_name": "LayoutModel",
3805
          "model_module_version": "1.2.0",
3806
          "state": {
3807
            "_model_module": "@jupyter-widgets/base",
3808
            "_model_module_version": "1.2.0",
3809
            "_model_name": "LayoutModel",
3810
            "_view_count": null,
3811
            "_view_module": "@jupyter-widgets/base",
3812
            "_view_module_version": "1.2.0",
3813
            "_view_name": "LayoutView",
3814
            "align_content": null,
3815
            "align_items": null,
3816
            "align_self": null,
3817
            "border": null,
3818
            "bottom": null,
3819
            "display": null,
3820
            "flex": null,
3821
            "flex_flow": null,
3822
            "grid_area": null,
3823
            "grid_auto_columns": null,
3824
            "grid_auto_flow": null,
3825
            "grid_auto_rows": null,
3826
            "grid_column": null,
3827
            "grid_gap": null,
3828
            "grid_row": null,
3829
            "grid_template_areas": null,
3830
            "grid_template_columns": null,
3831
            "grid_template_rows": null,
3832
            "height": null,
3833
            "justify_content": null,
3834
            "justify_items": null,
3835
            "left": null,
3836
            "margin": null,
3837
            "max_height": null,
3838
            "max_width": null,
3839
            "min_height": null,
3840
            "min_width": null,
3841
            "object_fit": null,
3842
            "object_position": null,
3843
            "order": null,
3844
            "overflow": null,
3845
            "overflow_x": null,
3846
            "overflow_y": null,
3847
            "padding": null,
3848
            "right": null,
3849
            "top": null,
3850
            "visibility": null,
3851
            "width": null
3852
          }
3853
        },
3854
        "bcacfb2e6c464423b5e8bc0aef675fdd": {
3855
          "model_module": "@jupyter-widgets/controls",
3856
          "model_name": "DescriptionStyleModel",
3857
          "model_module_version": "1.5.0",
3858
          "state": {
3859
            "_model_module": "@jupyter-widgets/controls",
3860
            "_model_module_version": "1.5.0",
3861
            "_model_name": "DescriptionStyleModel",
3862
            "_view_count": null,
3863
            "_view_module": "@jupyter-widgets/base",
3864
            "_view_module_version": "1.2.0",
3865
            "_view_name": "StyleView",
3866
            "description_width": ""
3867
          }
3868
        },
3869
        "88c5cc8d66d8408cbe2bfedb365723f3": {
3870
          "model_module": "@jupyter-widgets/base",
3871
          "model_name": "LayoutModel",
3872
          "model_module_version": "1.2.0",
3873
          "state": {
3874
            "_model_module": "@jupyter-widgets/base",
3875
            "_model_module_version": "1.2.0",
3876
            "_model_name": "LayoutModel",
3877
            "_view_count": null,
3878
            "_view_module": "@jupyter-widgets/base",
3879
            "_view_module_version": "1.2.0",
3880
            "_view_name": "LayoutView",
3881
            "align_content": null,
3882
            "align_items": null,
3883
            "align_self": null,
3884
            "border": null,
3885
            "bottom": null,
3886
            "display": null,
3887
            "flex": null,
3888
            "flex_flow": null,
3889
            "grid_area": null,
3890
            "grid_auto_columns": null,
3891
            "grid_auto_flow": null,
3892
            "grid_auto_rows": null,
3893
            "grid_column": null,
3894
            "grid_gap": null,
3895
            "grid_row": null,
3896
            "grid_template_areas": null,
3897
            "grid_template_columns": null,
3898
            "grid_template_rows": null,
3899
            "height": null,
3900
            "justify_content": null,
3901
            "justify_items": null,
3902
            "left": null,
3903
            "margin": null,
3904
            "max_height": null,
3905
            "max_width": null,
3906
            "min_height": null,
3907
            "min_width": null,
3908
            "object_fit": null,
3909
            "object_position": null,
3910
            "order": null,
3911
            "overflow": null,
3912
            "overflow_x": null,
3913
            "overflow_y": null,
3914
            "padding": null,
3915
            "right": null,
3916
            "top": null,
3917
            "visibility": null,
3918
            "width": null
3919
          }
3920
        },
3921
        "814bac58a4974f70b17b5e19f88b042f": {
3922
          "model_module": "@jupyter-widgets/controls",
3923
          "model_name": "DescriptionStyleModel",
3924
          "model_module_version": "1.5.0",
3925
          "state": {
3926
            "_model_module": "@jupyter-widgets/controls",
3927
            "_model_module_version": "1.5.0",
3928
            "_model_name": "DescriptionStyleModel",
3929
            "_view_count": null,
3930
            "_view_module": "@jupyter-widgets/base",
3931
            "_view_module_version": "1.2.0",
3932
            "_view_name": "StyleView",
3933
            "description_width": ""
3934
          }
3935
        },
3936
        "3502bced8abc4cfc87300881857c4e08": {
3937
          "model_module": "@jupyter-widgets/base",
3938
          "model_name": "LayoutModel",
3939
          "model_module_version": "1.2.0",
3940
          "state": {
3941
            "_model_module": "@jupyter-widgets/base",
3942
            "_model_module_version": "1.2.0",
3943
            "_model_name": "LayoutModel",
3944
            "_view_count": null,
3945
            "_view_module": "@jupyter-widgets/base",
3946
            "_view_module_version": "1.2.0",
3947
            "_view_name": "LayoutView",
3948
            "align_content": null,
3949
            "align_items": null,
3950
            "align_self": null,
3951
            "border": null,
3952
            "bottom": null,
3953
            "display": null,
3954
            "flex": null,
3955
            "flex_flow": null,
3956
            "grid_area": null,
3957
            "grid_auto_columns": null,
3958
            "grid_auto_flow": null,
3959
            "grid_auto_rows": null,
3960
            "grid_column": null,
3961
            "grid_gap": null,
3962
            "grid_row": null,
3963
            "grid_template_areas": null,
3964
            "grid_template_columns": null,
3965
            "grid_template_rows": null,
3966
            "height": null,
3967
            "justify_content": null,
3968
            "justify_items": null,
3969
            "left": null,
3970
            "margin": null,
3971
            "max_height": null,
3972
            "max_width": null,
3973
            "min_height": null,
3974
            "min_width": null,
3975
            "object_fit": null,
3976
            "object_position": null,
3977
            "order": null,
3978
            "overflow": null,
3979
            "overflow_x": null,
3980
            "overflow_y": null,
3981
            "padding": null,
3982
            "right": null,
3983
            "top": null,
3984
            "visibility": null,
3985
            "width": null
3986
          }
3987
        },
3988
        "c726307cdc3c4598ad45879f3f29e60c": {
3989
          "model_module": "@jupyter-widgets/controls",
3990
          "model_name": "DescriptionStyleModel",
3991
          "model_module_version": "1.5.0",
3992
          "state": {
3993
            "_model_module": "@jupyter-widgets/controls",
3994
            "_model_module_version": "1.5.0",
3995
            "_model_name": "DescriptionStyleModel",
3996
            "_view_count": null,
3997
            "_view_module": "@jupyter-widgets/base",
3998
            "_view_module_version": "1.2.0",
3999
            "_view_name": "StyleView",
4000
            "description_width": ""
4001
          }
4002
        },
4003
        "ee3793650a24458c8f1c9da6f6cf7930": {
4004
          "model_module": "@jupyter-widgets/controls",
4005
          "model_name": "HBoxModel",
4006
          "model_module_version": "1.5.0",
4007
          "state": {
4008
            "_dom_classes": [],
4009
            "_model_module": "@jupyter-widgets/controls",
4010
            "_model_module_version": "1.5.0",
4011
            "_model_name": "HBoxModel",
4012
            "_view_count": null,
4013
            "_view_module": "@jupyter-widgets/controls",
4014
            "_view_module_version": "1.5.0",
4015
            "_view_name": "HBoxView",
4016
            "box_style": "",
4017
            "children": [
4018
              "IPY_MODEL_db88e2bb13fa425aaccc2f7a32f2a946",
4019
              "IPY_MODEL_9f1b94961d43444697b621f5f2a80392",
4020
              "IPY_MODEL_bfa4594314d6437994f2cb57311d97a6"
4021
            ],
4022
            "layout": "IPY_MODEL_dd13edfc70174149b25a15b0858ba61c"
4023
          }
4024
        },
4025
        "db88e2bb13fa425aaccc2f7a32f2a946": {
4026
          "model_module": "@jupyter-widgets/controls",
4027
          "model_name": "HTMLModel",
4028
          "model_module_version": "1.5.0",
4029
          "state": {
4030
            "_dom_classes": [],
4031
            "_model_module": "@jupyter-widgets/controls",
4032
            "_model_module_version": "1.5.0",
4033
            "_model_name": "HTMLModel",
4034
            "_view_count": null,
4035
            "_view_module": "@jupyter-widgets/controls",
4036
            "_view_module_version": "1.5.0",
4037
            "_view_name": "HTMLView",
4038
            "description": "",
4039
            "description_tooltip": null,
4040
            "layout": "IPY_MODEL_2e0685af66bb4e52b72b8e0159df3531",
4041
            "placeholder": "​",
4042
            "style": "IPY_MODEL_0d86661bee2d497fa856892c6b6f3f46",
4043
            "value": "Downloading (…)lve/main/config.json: 100%"
4044
          }
4045
        },
4046
        "9f1b94961d43444697b621f5f2a80392": {
4047
          "model_module": "@jupyter-widgets/controls",
4048
          "model_name": "FloatProgressModel",
4049
          "model_module_version": "1.5.0",
4050
          "state": {
4051
            "_dom_classes": [],
4052
            "_model_module": "@jupyter-widgets/controls",
4053
            "_model_module_version": "1.5.0",
4054
            "_model_name": "FloatProgressModel",
4055
            "_view_count": null,
4056
            "_view_module": "@jupyter-widgets/controls",
4057
            "_view_module_version": "1.5.0",
4058
            "_view_name": "ProgressView",
4059
            "bar_style": "success",
4060
            "description": "",
4061
            "description_tooltip": null,
4062
            "layout": "IPY_MODEL_94916f236b0d4e8a8733871e84df1147",
4063
            "max": 880,
4064
            "min": 0,
4065
            "orientation": "horizontal",
4066
            "style": "IPY_MODEL_97d6e28ba91e45cd899719bb5bc2b6ab",
4067
            "value": 880
4068
          }
4069
        },
4070
        "bfa4594314d6437994f2cb57311d97a6": {
4071
          "model_module": "@jupyter-widgets/controls",
4072
          "model_name": "HTMLModel",
4073
          "model_module_version": "1.5.0",
4074
          "state": {
4075
            "_dom_classes": [],
4076
            "_model_module": "@jupyter-widgets/controls",
4077
            "_model_module_version": "1.5.0",
4078
            "_model_name": "HTMLModel",
4079
            "_view_count": null,
4080
            "_view_module": "@jupyter-widgets/controls",
4081
            "_view_module_version": "1.5.0",
4082
            "_view_name": "HTMLView",
4083
            "description": "",
4084
            "description_tooltip": null,
4085
            "layout": "IPY_MODEL_118f1b7073b847ef987036cd82499d0b",
4086
            "placeholder": "​",
4087
            "style": "IPY_MODEL_dd77325d1d8d417eb6544ae0cbc15133",
4088
            "value": " 880/880 [00:00&lt;00:00, 20.8kB/s]"
4089
          }
4090
        },
4091
        "dd13edfc70174149b25a15b0858ba61c": {
4092
          "model_module": "@jupyter-widgets/base",
4093
          "model_name": "LayoutModel",
4094
          "model_module_version": "1.2.0",
4095
          "state": {
4096
            "_model_module": "@jupyter-widgets/base",
4097
            "_model_module_version": "1.2.0",
4098
            "_model_name": "LayoutModel",
4099
            "_view_count": null,
4100
            "_view_module": "@jupyter-widgets/base",
4101
            "_view_module_version": "1.2.0",
4102
            "_view_name": "LayoutView",
4103
            "align_content": null,
4104
            "align_items": null,
4105
            "align_self": null,
4106
            "border": null,
4107
            "bottom": null,
4108
            "display": null,
4109
            "flex": null,
4110
            "flex_flow": null,
4111
            "grid_area": null,
4112
            "grid_auto_columns": null,
4113
            "grid_auto_flow": null,
4114
            "grid_auto_rows": null,
4115
            "grid_column": null,
4116
            "grid_gap": null,
4117
            "grid_row": null,
4118
            "grid_template_areas": null,
4119
            "grid_template_columns": null,
4120
            "grid_template_rows": null,
4121
            "height": null,
4122
            "justify_content": null,
4123
            "justify_items": null,
4124
            "left": null,
4125
            "margin": null,
4126
            "max_height": null,
4127
            "max_width": null,
4128
            "min_height": null,
4129
            "min_width": null,
4130
            "object_fit": null,
4131
            "object_position": null,
4132
            "order": null,
4133
            "overflow": null,
4134
            "overflow_x": null,
4135
            "overflow_y": null,
4136
            "padding": null,
4137
            "right": null,
4138
            "top": null,
4139
            "visibility": null,
4140
            "width": null
4141
          }
4142
        },
4143
        "2e0685af66bb4e52b72b8e0159df3531": {
4144
          "model_module": "@jupyter-widgets/base",
4145
          "model_name": "LayoutModel",
4146
          "model_module_version": "1.2.0",
4147
          "state": {
4148
            "_model_module": "@jupyter-widgets/base",
4149
            "_model_module_version": "1.2.0",
4150
            "_model_name": "LayoutModel",
4151
            "_view_count": null,
4152
            "_view_module": "@jupyter-widgets/base",
4153
            "_view_module_version": "1.2.0",
4154
            "_view_name": "LayoutView",
4155
            "align_content": null,
4156
            "align_items": null,
4157
            "align_self": null,
4158
            "border": null,
4159
            "bottom": null,
4160
            "display": null,
4161
            "flex": null,
4162
            "flex_flow": null,
4163
            "grid_area": null,
4164
            "grid_auto_columns": null,
4165
            "grid_auto_flow": null,
4166
            "grid_auto_rows": null,
4167
            "grid_column": null,
4168
            "grid_gap": null,
4169
            "grid_row": null,
4170
            "grid_template_areas": null,
4171
            "grid_template_columns": null,
4172
            "grid_template_rows": null,
4173
            "height": null,
4174
            "justify_content": null,
4175
            "justify_items": null,
4176
            "left": null,
4177
            "margin": null,
4178
            "max_height": null,
4179
            "max_width": null,
4180
            "min_height": null,
4181
            "min_width": null,
4182
            "object_fit": null,
4183
            "object_position": null,
4184
            "order": null,
4185
            "overflow": null,
4186
            "overflow_x": null,
4187
            "overflow_y": null,
4188
            "padding": null,
4189
            "right": null,
4190
            "top": null,
4191
            "visibility": null,
4192
            "width": null
4193
          }
4194
        },
4195
        "0d86661bee2d497fa856892c6b6f3f46": {
4196
          "model_module": "@jupyter-widgets/controls",
4197
          "model_name": "DescriptionStyleModel",
4198
          "model_module_version": "1.5.0",
4199
          "state": {
4200
            "_model_module": "@jupyter-widgets/controls",
4201
            "_model_module_version": "1.5.0",
4202
            "_model_name": "DescriptionStyleModel",
4203
            "_view_count": null,
4204
            "_view_module": "@jupyter-widgets/base",
4205
            "_view_module_version": "1.2.0",
4206
            "_view_name": "StyleView",
4207
            "description_width": ""
4208
          }
4209
        },
4210
        "94916f236b0d4e8a8733871e84df1147": {
4211
          "model_module": "@jupyter-widgets/base",
4212
          "model_name": "LayoutModel",
4213
          "model_module_version": "1.2.0",
4214
          "state": {
4215
            "_model_module": "@jupyter-widgets/base",
4216
            "_model_module_version": "1.2.0",
4217
            "_model_name": "LayoutModel",
4218
            "_view_count": null,
4219
            "_view_module": "@jupyter-widgets/base",
4220
            "_view_module_version": "1.2.0",
4221
            "_view_name": "LayoutView",
4222
            "align_content": null,
4223
            "align_items": null,
4224
            "align_self": null,
4225
            "border": null,
4226
            "bottom": null,
4227
            "display": null,
4228
            "flex": null,
4229
            "flex_flow": null,
4230
            "grid_area": null,
4231
            "grid_auto_columns": null,
4232
            "grid_auto_flow": null,
4233
            "grid_auto_rows": null,
4234
            "grid_column": null,
4235
            "grid_gap": null,
4236
            "grid_row": null,
4237
            "grid_template_areas": null,
4238
            "grid_template_columns": null,
4239
            "grid_template_rows": null,
4240
            "height": null,
4241
            "justify_content": null,
4242
            "justify_items": null,
4243
            "left": null,
4244
            "margin": null,
4245
            "max_height": null,
4246
            "max_width": null,
4247
            "min_height": null,
4248
            "min_width": null,
4249
            "object_fit": null,
4250
            "object_position": null,
4251
            "order": null,
4252
            "overflow": null,
4253
            "overflow_x": null,
4254
            "overflow_y": null,
4255
            "padding": null,
4256
            "right": null,
4257
            "top": null,
4258
            "visibility": null,
4259
            "width": null
4260
          }
4261
        },
4262
        "97d6e28ba91e45cd899719bb5bc2b6ab": {
4263
          "model_module": "@jupyter-widgets/controls",
4264
          "model_name": "ProgressStyleModel",
4265
          "model_module_version": "1.5.0",
4266
          "state": {
4267
            "_model_module": "@jupyter-widgets/controls",
4268
            "_model_module_version": "1.5.0",
4269
            "_model_name": "ProgressStyleModel",
4270
            "_view_count": null,
4271
            "_view_module": "@jupyter-widgets/base",
4272
            "_view_module_version": "1.2.0",
4273
            "_view_name": "StyleView",
4274
            "bar_color": null,
4275
            "description_width": ""
4276
          }
4277
        },
4278
        "118f1b7073b847ef987036cd82499d0b": {
4279
          "model_module": "@jupyter-widgets/base",
4280
          "model_name": "LayoutModel",
4281
          "model_module_version": "1.2.0",
4282
          "state": {
4283
            "_model_module": "@jupyter-widgets/base",
4284
            "_model_module_version": "1.2.0",
4285
            "_model_name": "LayoutModel",
4286
            "_view_count": null,
4287
            "_view_module": "@jupyter-widgets/base",
4288
            "_view_module_version": "1.2.0",
4289
            "_view_name": "LayoutView",
4290
            "align_content": null,
4291
            "align_items": null,
4292
            "align_self": null,
4293
            "border": null,
4294
            "bottom": null,
4295
            "display": null,
4296
            "flex": null,
4297
            "flex_flow": null,
4298
            "grid_area": null,
4299
            "grid_auto_columns": null,
4300
            "grid_auto_flow": null,
4301
            "grid_auto_rows": null,
4302
            "grid_column": null,
4303
            "grid_gap": null,
4304
            "grid_row": null,
4305
            "grid_template_areas": null,
4306
            "grid_template_columns": null,
4307
            "grid_template_rows": null,
4308
            "height": null,
4309
            "justify_content": null,
4310
            "justify_items": null,
4311
            "left": null,
4312
            "margin": null,
4313
            "max_height": null,
4314
            "max_width": null,
4315
            "min_height": null,
4316
            "min_width": null,
4317
            "object_fit": null,
4318
            "object_position": null,
4319
            "order": null,
4320
            "overflow": null,
4321
            "overflow_x": null,
4322
            "overflow_y": null,
4323
            "padding": null,
4324
            "right": null,
4325
            "top": null,
4326
            "visibility": null,
4327
            "width": null
4328
          }
4329
        },
4330
        "dd77325d1d8d417eb6544ae0cbc15133": {
4331
          "model_module": "@jupyter-widgets/controls",
4332
          "model_name": "DescriptionStyleModel",
4333
          "model_module_version": "1.5.0",
4334
          "state": {
4335
            "_model_module": "@jupyter-widgets/controls",
4336
            "_model_module_version": "1.5.0",
4337
            "_model_name": "DescriptionStyleModel",
4338
            "_view_count": null,
4339
            "_view_module": "@jupyter-widgets/base",
4340
            "_view_module_version": "1.2.0",
4341
            "_view_name": "StyleView",
4342
            "description_width": ""
4343
          }
4344
        },
4345
        "794c3466fdc34e549aaefbc106537e16": {
4346
          "model_module": "@jupyter-widgets/controls",
4347
          "model_name": "HBoxModel",
4348
          "model_module_version": "1.5.0",
4349
          "state": {
4350
            "_dom_classes": [],
4351
            "_model_module": "@jupyter-widgets/controls",
4352
            "_model_module_version": "1.5.0",
4353
            "_model_name": "HBoxModel",
4354
            "_view_count": null,
4355
            "_view_module": "@jupyter-widgets/controls",
4356
            "_view_module_version": "1.5.0",
4357
            "_view_name": "HBoxView",
4358
            "box_style": "",
4359
            "children": [
4360
              "IPY_MODEL_cb4a5c788e9d44818ff61e2551ed750e",
4361
              "IPY_MODEL_fec4fa9c00d6429791bceeccc053bc05",
4362
              "IPY_MODEL_fef1d4090bcf4d77895d45567bb1ff41"
4363
            ],
4364
            "layout": "IPY_MODEL_06a0a6459ff14187acac58481400bf05"
4365
          }
4366
        },
4367
        "cb4a5c788e9d44818ff61e2551ed750e": {
4368
          "model_module": "@jupyter-widgets/controls",
4369
          "model_name": "HTMLModel",
4370
          "model_module_version": "1.5.0",
4371
          "state": {
4372
            "_dom_classes": [],
4373
            "_model_module": "@jupyter-widgets/controls",
4374
            "_model_module_version": "1.5.0",
4375
            "_model_name": "HTMLModel",
4376
            "_view_count": null,
4377
            "_view_module": "@jupyter-widgets/controls",
4378
            "_view_module_version": "1.5.0",
4379
            "_view_name": "HTMLView",
4380
            "description": "",
4381
            "description_tooltip": null,
4382
            "layout": "IPY_MODEL_6caf5b09e0f44382807c41193a2963d3",
4383
            "placeholder": "​",
4384
            "style": "IPY_MODEL_6c95ad4f7ae24185a3fa9dbf9f8f68a2",
4385
            "value": "Downloading (…)former_sequential.py: 100%"
4386
          }
4387
        },
4388
        "fec4fa9c00d6429791bceeccc053bc05": {
4389
          "model_module": "@jupyter-widgets/controls",
4390
          "model_name": "FloatProgressModel",
4391
          "model_module_version": "1.5.0",
4392
          "state": {
4393
            "_dom_classes": [],
4394
            "_model_module": "@jupyter-widgets/controls",
4395
            "_model_module_version": "1.5.0",
4396
            "_model_name": "FloatProgressModel",
4397
            "_view_count": null,
4398
            "_view_module": "@jupyter-widgets/controls",
4399
            "_view_module_version": "1.5.0",
4400
            "_view_name": "ProgressView",
4401
            "bar_style": "success",
4402
            "description": "",
4403
            "description_tooltip": null,
4404
            "layout": "IPY_MODEL_69b2fdbe3a5e4682963987fb914afec5",
4405
            "max": 2235,
4406
            "min": 0,
4407
            "orientation": "horizontal",
4408
            "style": "IPY_MODEL_38e5964aa7a744439c7e5ad26c162ead",
4409
            "value": 2235
4410
          }
4411
        },
4412
        "fef1d4090bcf4d77895d45567bb1ff41": {
4413
          "model_module": "@jupyter-widgets/controls",
4414
          "model_name": "HTMLModel",
4415
          "model_module_version": "1.5.0",
4416
          "state": {
4417
            "_dom_classes": [],
4418
            "_model_module": "@jupyter-widgets/controls",
4419
            "_model_module_version": "1.5.0",
4420
            "_model_name": "HTMLModel",
4421
            "_view_count": null,
4422
            "_view_module": "@jupyter-widgets/controls",
4423
            "_view_module_version": "1.5.0",
4424
            "_view_name": "HTMLView",
4425
            "description": "",
4426
            "description_tooltip": null,
4427
            "layout": "IPY_MODEL_8f1d717eba6942b8aca16cbc49bc6a6f",
4428
            "placeholder": "​",
4429
            "style": "IPY_MODEL_0168b508956141269412e88990ee3d67",
4430
            "value": " 2.23k/2.23k [00:00&lt;00:00, 124kB/s]"
4431
          }
4432
        },
4433
        "06a0a6459ff14187acac58481400bf05": {
4434
          "model_module": "@jupyter-widgets/base",
4435
          "model_name": "LayoutModel",
4436
          "model_module_version": "1.2.0",
4437
          "state": {
4438
            "_model_module": "@jupyter-widgets/base",
4439
            "_model_module_version": "1.2.0",
4440
            "_model_name": "LayoutModel",
4441
            "_view_count": null,
4442
            "_view_module": "@jupyter-widgets/base",
4443
            "_view_module_version": "1.2.0",
4444
            "_view_name": "LayoutView",
4445
            "align_content": null,
4446
            "align_items": null,
4447
            "align_self": null,
4448
            "border": null,
4449
            "bottom": null,
4450
            "display": null,
4451
            "flex": null,
4452
            "flex_flow": null,
4453
            "grid_area": null,
4454
            "grid_auto_columns": null,
4455
            "grid_auto_flow": null,
4456
            "grid_auto_rows": null,
4457
            "grid_column": null,
4458
            "grid_gap": null,
4459
            "grid_row": null,
4460
            "grid_template_areas": null,
4461
            "grid_template_columns": null,
4462
            "grid_template_rows": null,
4463
            "height": null,
4464
            "justify_content": null,
4465
            "justify_items": null,
4466
            "left": null,
4467
            "margin": null,
4468
            "max_height": null,
4469
            "max_width": null,
4470
            "min_height": null,
4471
            "min_width": null,
4472
            "object_fit": null,
4473
            "object_position": null,
4474
            "order": null,
4475
            "overflow": null,
4476
            "overflow_x": null,
4477
            "overflow_y": null,
4478
            "padding": null,
4479
            "right": null,
4480
            "top": null,
4481
            "visibility": null,
4482
            "width": null
4483
          }
4484
        },
4485
        "6caf5b09e0f44382807c41193a2963d3": {
4486
          "model_module": "@jupyter-widgets/base",
4487
          "model_name": "LayoutModel",
4488
          "model_module_version": "1.2.0",
4489
          "state": {
4490
            "_model_module": "@jupyter-widgets/base",
4491
            "_model_module_version": "1.2.0",
4492
            "_model_name": "LayoutModel",
4493
            "_view_count": null,
4494
            "_view_module": "@jupyter-widgets/base",
4495
            "_view_module_version": "1.2.0",
4496
            "_view_name": "LayoutView",
4497
            "align_content": null,
4498
            "align_items": null,
4499
            "align_self": null,
4500
            "border": null,
4501
            "bottom": null,
4502
            "display": null,
4503
            "flex": null,
4504
            "flex_flow": null,
4505
            "grid_area": null,
4506
            "grid_auto_columns": null,
4507
            "grid_auto_flow": null,
4508
            "grid_auto_rows": null,
4509
            "grid_column": null,
4510
            "grid_gap": null,
4511
            "grid_row": null,
4512
            "grid_template_areas": null,
4513
            "grid_template_columns": null,
4514
            "grid_template_rows": null,
4515
            "height": null,
4516
            "justify_content": null,
4517
            "justify_items": null,
4518
            "left": null,
4519
            "margin": null,
4520
            "max_height": null,
4521
            "max_width": null,
4522
            "min_height": null,
4523
            "min_width": null,
4524
            "object_fit": null,
4525
            "object_position": null,
4526
            "order": null,
4527
            "overflow": null,
4528
            "overflow_x": null,
4529
            "overflow_y": null,
4530
            "padding": null,
4531
            "right": null,
4532
            "top": null,
4533
            "visibility": null,
4534
            "width": null
4535
          }
4536
        },
4537
        "6c95ad4f7ae24185a3fa9dbf9f8f68a2": {
4538
          "model_module": "@jupyter-widgets/controls",
4539
          "model_name": "DescriptionStyleModel",
4540
          "model_module_version": "1.5.0",
4541
          "state": {
4542
            "_model_module": "@jupyter-widgets/controls",
4543
            "_model_module_version": "1.5.0",
4544
            "_model_name": "DescriptionStyleModel",
4545
            "_view_count": null,
4546
            "_view_module": "@jupyter-widgets/base",
4547
            "_view_module_version": "1.2.0",
4548
            "_view_name": "StyleView",
4549
            "description_width": ""
4550
          }
4551
        },
4552
        "69b2fdbe3a5e4682963987fb914afec5": {
4553
          "model_module": "@jupyter-widgets/base",
4554
          "model_name": "LayoutModel",
4555
          "model_module_version": "1.2.0",
4556
          "state": {
4557
            "_model_module": "@jupyter-widgets/base",
4558
            "_model_module_version": "1.2.0",
4559
            "_model_name": "LayoutModel",
4560
            "_view_count": null,
4561
            "_view_module": "@jupyter-widgets/base",
4562
            "_view_module_version": "1.2.0",
4563
            "_view_name": "LayoutView",
4564
            "align_content": null,
4565
            "align_items": null,
4566
            "align_self": null,
4567
            "border": null,
4568
            "bottom": null,
4569
            "display": null,
4570
            "flex": null,
4571
            "flex_flow": null,
4572
            "grid_area": null,
4573
            "grid_auto_columns": null,
4574
            "grid_auto_flow": null,
4575
            "grid_auto_rows": null,
4576
            "grid_column": null,
4577
            "grid_gap": null,
4578
            "grid_row": null,
4579
            "grid_template_areas": null,
4580
            "grid_template_columns": null,
4581
            "grid_template_rows": null,
4582
            "height": null,
4583
            "justify_content": null,
4584
            "justify_items": null,
4585
            "left": null,
4586
            "margin": null,
4587
            "max_height": null,
4588
            "max_width": null,
4589
            "min_height": null,
4590
            "min_width": null,
4591
            "object_fit": null,
4592
            "object_position": null,
4593
            "order": null,
4594
            "overflow": null,
4595
            "overflow_x": null,
4596
            "overflow_y": null,
4597
            "padding": null,
4598
            "right": null,
4599
            "top": null,
4600
            "visibility": null,
4601
            "width": null
4602
          }
4603
        },
4604
        "38e5964aa7a744439c7e5ad26c162ead": {
4605
          "model_module": "@jupyter-widgets/controls",
4606
          "model_name": "ProgressStyleModel",
4607
          "model_module_version": "1.5.0",
4608
          "state": {
4609
            "_model_module": "@jupyter-widgets/controls",
4610
            "_model_module_version": "1.5.0",
4611
            "_model_name": "ProgressStyleModel",
4612
            "_view_count": null,
4613
            "_view_module": "@jupyter-widgets/base",
4614
            "_view_module_version": "1.2.0",
4615
            "_view_name": "StyleView",
4616
            "bar_color": null,
4617
            "description_width": ""
4618
          }
4619
        },
4620
        "8f1d717eba6942b8aca16cbc49bc6a6f": {
4621
          "model_module": "@jupyter-widgets/base",
4622
          "model_name": "LayoutModel",
4623
          "model_module_version": "1.2.0",
4624
          "state": {
4625
            "_model_module": "@jupyter-widgets/base",
4626
            "_model_module_version": "1.2.0",
4627
            "_model_name": "LayoutModel",
4628
            "_view_count": null,
4629
            "_view_module": "@jupyter-widgets/base",
4630
            "_view_module_version": "1.2.0",
4631
            "_view_name": "LayoutView",
4632
            "align_content": null,
4633
            "align_items": null,
4634
            "align_self": null,
4635
            "border": null,
4636
            "bottom": null,
4637
            "display": null,
4638
            "flex": null,
4639
            "flex_flow": null,
4640
            "grid_area": null,
4641
            "grid_auto_columns": null,
4642
            "grid_auto_flow": null,
4643
            "grid_auto_rows": null,
4644
            "grid_column": null,
4645
            "grid_gap": null,
4646
            "grid_row": null,
4647
            "grid_template_areas": null,
4648
            "grid_template_columns": null,
4649
            "grid_template_rows": null,
4650
            "height": null,
4651
            "justify_content": null,
4652
            "justify_items": null,
4653
            "left": null,
4654
            "margin": null,
4655
            "max_height": null,
4656
            "max_width": null,
4657
            "min_height": null,
4658
            "min_width": null,
4659
            "object_fit": null,
4660
            "object_position": null,
4661
            "order": null,
4662
            "overflow": null,
4663
            "overflow_x": null,
4664
            "overflow_y": null,
4665
            "padding": null,
4666
            "right": null,
4667
            "top": null,
4668
            "visibility": null,
4669
            "width": null
4670
          }
4671
        },
4672
        "0168b508956141269412e88990ee3d67": {
4673
          "model_module": "@jupyter-widgets/controls",
4674
          "model_name": "DescriptionStyleModel",
4675
          "model_module_version": "1.5.0",
4676
          "state": {
4677
            "_model_module": "@jupyter-widgets/controls",
4678
            "_model_module_version": "1.5.0",
4679
            "_model_name": "DescriptionStyleModel",
4680
            "_view_count": null,
4681
            "_view_module": "@jupyter-widgets/base",
4682
            "_view_module_version": "1.2.0",
4683
            "_view_name": "StyleView",
4684
            "description_width": ""
4685
          }
4686
        },
4687
        "e8b48f5b7e2b4d8d9407cb667092a3e8": {
4688
          "model_module": "@jupyter-widgets/controls",
4689
          "model_name": "HBoxModel",
4690
          "model_module_version": "1.5.0",
4691
          "state": {
4692
            "_dom_classes": [],
4693
            "_model_module": "@jupyter-widgets/controls",
4694
            "_model_module_version": "1.5.0",
4695
            "_model_name": "HBoxModel",
4696
            "_view_count": null,
4697
            "_view_module": "@jupyter-widgets/controls",
4698
            "_view_module_version": "1.5.0",
4699
            "_view_name": "HBoxView",
4700
            "box_style": "",
4701
            "children": [
4702
              "IPY_MODEL_8b1317e6869e439092c1d880137f62fd",
4703
              "IPY_MODEL_72a199e2dc1b4d63984493e6bf1bdb8c",
4704
              "IPY_MODEL_2296ca45af0c4cec80d01fb7e33f278f"
4705
            ],
4706
            "layout": "IPY_MODEL_3dd72eb426fa4e6e919276bb4e91f60f"
4707
          }
4708
        },
4709
        "8b1317e6869e439092c1d880137f62fd": {
4710
          "model_module": "@jupyter-widgets/controls",
4711
          "model_name": "HTMLModel",
4712
          "model_module_version": "1.5.0",
4713
          "state": {
4714
            "_dom_classes": [],
4715
            "_model_module": "@jupyter-widgets/controls",
4716
            "_model_module_version": "1.5.0",
4717
            "_model_name": "HTMLModel",
4718
            "_view_count": null,
4719
            "_view_module": "@jupyter-widgets/controls",
4720
            "_view_module_version": "1.5.0",
4721
            "_view_name": "HTMLView",
4722
            "description": "",
4723
            "description_tooltip": null,
4724
            "layout": "IPY_MODEL_2d01ed4a650c4bcf9d07f020ae98081d",
4725
            "placeholder": "​",
4726
            "style": "IPY_MODEL_51ac6641cd1441998abadc1993d4ef96",
4727
            "value": "Downloading (…)former_sequential.py: 100%"
4728
          }
4729
        },
4730
        "72a199e2dc1b4d63984493e6bf1bdb8c": {
4731
          "model_module": "@jupyter-widgets/controls",
4732
          "model_name": "FloatProgressModel",
4733
          "model_module_version": "1.5.0",
4734
          "state": {
4735
            "_dom_classes": [],
4736
            "_model_module": "@jupyter-widgets/controls",
4737
            "_model_module_version": "1.5.0",
4738
            "_model_name": "FloatProgressModel",
4739
            "_view_count": null,
4740
            "_view_module": "@jupyter-widgets/controls",
4741
            "_view_module_version": "1.5.0",
4742
            "_view_name": "ProgressView",
4743
            "bar_style": "success",
4744
            "description": "",
4745
            "description_tooltip": null,
4746
            "layout": "IPY_MODEL_520db9e6803d48fca60b1063e10cf260",
4747
            "max": 32240,
4748
            "min": 0,
4749
            "orientation": "horizontal",
4750
            "style": "IPY_MODEL_677f54e2735f407088724a38212c0171",
4751
            "value": 32240
4752
          }
4753
        },
4754
        "2296ca45af0c4cec80d01fb7e33f278f": {
4755
          "model_module": "@jupyter-widgets/controls",
4756
          "model_name": "HTMLModel",
4757
          "model_module_version": "1.5.0",
4758
          "state": {
4759
            "_dom_classes": [],
4760
            "_model_module": "@jupyter-widgets/controls",
4761
            "_model_module_version": "1.5.0",
4762
            "_model_name": "HTMLModel",
4763
            "_view_count": null,
4764
            "_view_module": "@jupyter-widgets/controls",
4765
            "_view_module_version": "1.5.0",
4766
            "_view_name": "HTMLView",
4767
            "description": "",
4768
            "description_tooltip": null,
4769
            "layout": "IPY_MODEL_49fd03a8e4954f5caf410898882324c8",
4770
            "placeholder": "​",
4771
            "style": "IPY_MODEL_63e68a09d85a4afd90d125bc61983d7a",
4772
            "value": " 32.2k/32.2k [00:00&lt;00:00, 951kB/s]"
4773
          }
4774
        },
4775
        "3dd72eb426fa4e6e919276bb4e91f60f": {
4776
          "model_module": "@jupyter-widgets/base",
4777
          "model_name": "LayoutModel",
4778
          "model_module_version": "1.2.0",
4779
          "state": {
4780
            "_model_module": "@jupyter-widgets/base",
4781
            "_model_module_version": "1.2.0",
4782
            "_model_name": "LayoutModel",
4783
            "_view_count": null,
4784
            "_view_module": "@jupyter-widgets/base",
4785
            "_view_module_version": "1.2.0",
4786
            "_view_name": "LayoutView",
4787
            "align_content": null,
4788
            "align_items": null,
4789
            "align_self": null,
4790
            "border": null,
4791
            "bottom": null,
4792
            "display": null,
4793
            "flex": null,
4794
            "flex_flow": null,
4795
            "grid_area": null,
4796
            "grid_auto_columns": null,
4797
            "grid_auto_flow": null,
4798
            "grid_auto_rows": null,
4799
            "grid_column": null,
4800
            "grid_gap": null,
4801
            "grid_row": null,
4802
            "grid_template_areas": null,
4803
            "grid_template_columns": null,
4804
            "grid_template_rows": null,
4805
            "height": null,
4806
            "justify_content": null,
4807
            "justify_items": null,
4808
            "left": null,
4809
            "margin": null,
4810
            "max_height": null,
4811
            "max_width": null,
4812
            "min_height": null,
4813
            "min_width": null,
4814
            "object_fit": null,
4815
            "object_position": null,
4816
            "order": null,
4817
            "overflow": null,
4818
            "overflow_x": null,
4819
            "overflow_y": null,
4820
            "padding": null,
4821
            "right": null,
4822
            "top": null,
4823
            "visibility": null,
4824
            "width": null
4825
          }
4826
        },
4827
        "2d01ed4a650c4bcf9d07f020ae98081d": {
4828
          "model_module": "@jupyter-widgets/base",
4829
          "model_name": "LayoutModel",
4830
          "model_module_version": "1.2.0",
4831
          "state": {
4832
            "_model_module": "@jupyter-widgets/base",
4833
            "_model_module_version": "1.2.0",
4834
            "_model_name": "LayoutModel",
4835
            "_view_count": null,
4836
            "_view_module": "@jupyter-widgets/base",
4837
            "_view_module_version": "1.2.0",
4838
            "_view_name": "LayoutView",
4839
            "align_content": null,
4840
            "align_items": null,
4841
            "align_self": null,
4842
            "border": null,
4843
            "bottom": null,
4844
            "display": null,
4845
            "flex": null,
4846
            "flex_flow": null,
4847
            "grid_area": null,
4848
            "grid_auto_columns": null,
4849
            "grid_auto_flow": null,
4850
            "grid_auto_rows": null,
4851
            "grid_column": null,
4852
            "grid_gap": null,
4853
            "grid_row": null,
4854
            "grid_template_areas": null,
4855
            "grid_template_columns": null,
4856
            "grid_template_rows": null,
4857
            "height": null,
4858
            "justify_content": null,
4859
            "justify_items": null,
4860
            "left": null,
4861
            "margin": null,
4862
            "max_height": null,
4863
            "max_width": null,
4864
            "min_height": null,
4865
            "min_width": null,
4866
            "object_fit": null,
4867
            "object_position": null,
4868
            "order": null,
4869
            "overflow": null,
4870
            "overflow_x": null,
4871
            "overflow_y": null,
4872
            "padding": null,
4873
            "right": null,
4874
            "top": null,
4875
            "visibility": null,
4876
            "width": null
4877
          }
4878
        },
4879
        "51ac6641cd1441998abadc1993d4ef96": {
4880
          "model_module": "@jupyter-widgets/controls",
4881
          "model_name": "DescriptionStyleModel",
4882
          "model_module_version": "1.5.0",
4883
          "state": {
4884
            "_model_module": "@jupyter-widgets/controls",
4885
            "_model_module_version": "1.5.0",
4886
            "_model_name": "DescriptionStyleModel",
4887
            "_view_count": null,
4888
            "_view_module": "@jupyter-widgets/base",
4889
            "_view_module_version": "1.2.0",
4890
            "_view_name": "StyleView",
4891
            "description_width": ""
4892
          }
4893
        },
4894
        "520db9e6803d48fca60b1063e10cf260": {
4895
          "model_module": "@jupyter-widgets/base",
4896
          "model_name": "LayoutModel",
4897
          "model_module_version": "1.2.0",
4898
          "state": {
4899
            "_model_module": "@jupyter-widgets/base",
4900
            "_model_module_version": "1.2.0",
4901
            "_model_name": "LayoutModel",
4902
            "_view_count": null,
4903
            "_view_module": "@jupyter-widgets/base",
4904
            "_view_module_version": "1.2.0",
4905
            "_view_name": "LayoutView",
4906
            "align_content": null,
4907
            "align_items": null,
4908
            "align_self": null,
4909
            "border": null,
4910
            "bottom": null,
4911
            "display": null,
4912
            "flex": null,
4913
            "flex_flow": null,
4914
            "grid_area": null,
4915
            "grid_auto_columns": null,
4916
            "grid_auto_flow": null,
4917
            "grid_auto_rows": null,
4918
            "grid_column": null,
4919
            "grid_gap": null,
4920
            "grid_row": null,
4921
            "grid_template_areas": null,
4922
            "grid_template_columns": null,
4923
            "grid_template_rows": null,
4924
            "height": null,
4925
            "justify_content": null,
4926
            "justify_items": null,
4927
            "left": null,
4928
            "margin": null,
4929
            "max_height": null,
4930
            "max_width": null,
4931
            "min_height": null,
4932
            "min_width": null,
4933
            "object_fit": null,
4934
            "object_position": null,
4935
            "order": null,
4936
            "overflow": null,
4937
            "overflow_x": null,
4938
            "overflow_y": null,
4939
            "padding": null,
4940
            "right": null,
4941
            "top": null,
4942
            "visibility": null,
4943
            "width": null
4944
          }
4945
        },
4946
        "677f54e2735f407088724a38212c0171": {
4947
          "model_module": "@jupyter-widgets/controls",
4948
          "model_name": "ProgressStyleModel",
4949
          "model_module_version": "1.5.0",
4950
          "state": {
4951
            "_model_module": "@jupyter-widgets/controls",
4952
            "_model_module_version": "1.5.0",
4953
            "_model_name": "ProgressStyleModel",
4954
            "_view_count": null,
4955
            "_view_module": "@jupyter-widgets/base",
4956
            "_view_module_version": "1.2.0",
4957
            "_view_name": "StyleView",
4958
            "bar_color": null,
4959
            "description_width": ""
4960
          }
4961
        },
4962
        "49fd03a8e4954f5caf410898882324c8": {
4963
          "model_module": "@jupyter-widgets/base",
4964
          "model_name": "LayoutModel",
4965
          "model_module_version": "1.2.0",
4966
          "state": {
4967
            "_model_module": "@jupyter-widgets/base",
4968
            "_model_module_version": "1.2.0",
4969
            "_model_name": "LayoutModel",
4970
            "_view_count": null,
4971
            "_view_module": "@jupyter-widgets/base",
4972
            "_view_module_version": "1.2.0",
4973
            "_view_name": "LayoutView",
4974
            "align_content": null,
4975
            "align_items": null,
4976
            "align_self": null,
4977
            "border": null,
4978
            "bottom": null,
4979
            "display": null,
4980
            "flex": null,
4981
            "flex_flow": null,
4982
            "grid_area": null,
4983
            "grid_auto_columns": null,
4984
            "grid_auto_flow": null,
4985
            "grid_auto_rows": null,
4986
            "grid_column": null,
4987
            "grid_gap": null,
4988
            "grid_row": null,
4989
            "grid_template_areas": null,
4990
            "grid_template_columns": null,
4991
            "grid_template_rows": null,
4992
            "height": null,
4993
            "justify_content": null,
4994
            "justify_items": null,
4995
            "left": null,
4996
            "margin": null,
4997
            "max_height": null,
4998
            "max_width": null,
4999
            "min_height": null,
5000
            "min_width": null,
5001
            "object_fit": null,
5002
            "object_position": null,
5003
            "order": null,
5004
            "overflow": null,
5005
            "overflow_x": null,
5006
            "overflow_y": null,
5007
            "padding": null,
5008
            "right": null,
5009
            "top": null,
5010
            "visibility": null,
5011
            "width": null
5012
          }
5013
        },
5014
        "63e68a09d85a4afd90d125bc61983d7a": {
5015
          "model_module": "@jupyter-widgets/controls",
5016
          "model_name": "DescriptionStyleModel",
5017
          "model_module_version": "1.5.0",
5018
          "state": {
5019
            "_model_module": "@jupyter-widgets/controls",
5020
            "_model_module_version": "1.5.0",
5021
            "_model_name": "DescriptionStyleModel",
5022
            "_view_count": null,
5023
            "_view_module": "@jupyter-widgets/base",
5024
            "_view_module_version": "1.2.0",
5025
            "_view_name": "StyleView",
5026
            "description_width": ""
5027
          }
5028
        },
5029
        "3672b47a27d64466995731f7475dff05": {
5030
          "model_module": "@jupyter-widgets/controls",
5031
          "model_name": "HBoxModel",
5032
          "model_module_version": "1.5.0",
5033
          "state": {
5034
            "_dom_classes": [],
5035
            "_model_module": "@jupyter-widgets/controls",
5036
            "_model_module_version": "1.5.0",
5037
            "_model_name": "HBoxModel",
5038
            "_view_count": null,
5039
            "_view_module": "@jupyter-widgets/controls",
5040
            "_view_module_version": "1.5.0",
5041
            "_view_name": "HBoxView",
5042
            "box_style": "",
5043
            "children": [
5044
              "IPY_MODEL_27905804572740018fa7c00a6de8e82d",
5045
              "IPY_MODEL_dd8375f821bd4283b3f906aea5c23d07",
5046
              "IPY_MODEL_a9f84e0028e440828def8cee6ae317ee"
5047
            ],
5048
            "layout": "IPY_MODEL_0c068bce19d74f7b835c90221a1cde38"
5049
          }
5050
        },
5051
        "27905804572740018fa7c00a6de8e82d": {
5052
          "model_module": "@jupyter-widgets/controls",
5053
          "model_name": "HTMLModel",
5054
          "model_module_version": "1.5.0",
5055
          "state": {
5056
            "_dom_classes": [],
5057
            "_model_module": "@jupyter-widgets/controls",
5058
            "_model_module_version": "1.5.0",
5059
            "_model_name": "HTMLModel",
5060
            "_view_count": null,
5061
            "_view_module": "@jupyter-widgets/controls",
5062
            "_view_module_version": "1.5.0",
5063
            "_view_name": "HTMLView",
5064
            "description": "",
5065
            "description_tooltip": null,
5066
            "layout": "IPY_MODEL_f9df8cdf043a4aaab82d55f24c17a3d8",
5067
            "placeholder": "​",
5068
            "style": "IPY_MODEL_4efaf38f2eaa46799c2afecb55ccf14c",
5069
            "value": "Downloading pytorch_model.bin: 100%"
5070
          }
5071
        },
5072
        "dd8375f821bd4283b3f906aea5c23d07": {
5073
          "model_module": "@jupyter-widgets/controls",
5074
          "model_name": "FloatProgressModel",
5075
          "model_module_version": "1.5.0",
5076
          "state": {
5077
            "_dom_classes": [],
5078
            "_model_module": "@jupyter-widgets/controls",
5079
            "_model_module_version": "1.5.0",
5080
            "_model_name": "FloatProgressModel",
5081
            "_view_count": null,
5082
            "_view_module": "@jupyter-widgets/controls",
5083
            "_view_module_version": "1.5.0",
5084
            "_view_name": "ProgressView",
5085
            "bar_style": "success",
5086
            "description": "",
5087
            "description_tooltip": null,
5088
            "layout": "IPY_MODEL_498424778ff94f7ea6e6f32e8cd95868",
5089
            "max": 2836623617,
5090
            "min": 0,
5091
            "orientation": "horizontal",
5092
            "style": "IPY_MODEL_6b654ce3193745208af00288d6f9d5f9",
5093
            "value": 2836623617
5094
          }
5095
        },
5096
        "a9f84e0028e440828def8cee6ae317ee": {
5097
          "model_module": "@jupyter-widgets/controls",
5098
          "model_name": "HTMLModel",
5099
          "model_module_version": "1.5.0",
5100
          "state": {
5101
            "_dom_classes": [],
5102
            "_model_module": "@jupyter-widgets/controls",
5103
            "_model_module_version": "1.5.0",
5104
            "_model_name": "HTMLModel",
5105
            "_view_count": null,
5106
            "_view_module": "@jupyter-widgets/controls",
5107
            "_view_module_version": "1.5.0",
5108
            "_view_name": "HTMLView",
5109
            "description": "",
5110
            "description_tooltip": null,
5111
            "layout": "IPY_MODEL_681653beca9b4a6591f7008e0ff5ac3b",
5112
            "placeholder": "​",
5113
            "style": "IPY_MODEL_997bd19e08ff48bc92a83487598be156",
5114
            "value": " 2.84G/2.84G [00:28&lt;00:00, 65.3MB/s]"
5115
          }
5116
        },
5117
        "0c068bce19d74f7b835c90221a1cde38": {
5118
          "model_module": "@jupyter-widgets/base",
5119
          "model_name": "LayoutModel",
5120
          "model_module_version": "1.2.0",
5121
          "state": {
5122
            "_model_module": "@jupyter-widgets/base",
5123
            "_model_module_version": "1.2.0",
5124
            "_model_name": "LayoutModel",
5125
            "_view_count": null,
5126
            "_view_module": "@jupyter-widgets/base",
5127
            "_view_module_version": "1.2.0",
5128
            "_view_name": "LayoutView",
5129
            "align_content": null,
5130
            "align_items": null,
5131
            "align_self": null,
5132
            "border": null,
5133
            "bottom": null,
5134
            "display": null,
5135
            "flex": null,
5136
            "flex_flow": null,
5137
            "grid_area": null,
5138
            "grid_auto_columns": null,
5139
            "grid_auto_flow": null,
5140
            "grid_auto_rows": null,
5141
            "grid_column": null,
5142
            "grid_gap": null,
5143
            "grid_row": null,
5144
            "grid_template_areas": null,
5145
            "grid_template_columns": null,
5146
            "grid_template_rows": null,
5147
            "height": null,
5148
            "justify_content": null,
5149
            "justify_items": null,
5150
            "left": null,
5151
            "margin": null,
5152
            "max_height": null,
5153
            "max_width": null,
5154
            "min_height": null,
5155
            "min_width": null,
5156
            "object_fit": null,
5157
            "object_position": null,
5158
            "order": null,
5159
            "overflow": null,
5160
            "overflow_x": null,
5161
            "overflow_y": null,
5162
            "padding": null,
5163
            "right": null,
5164
            "top": null,
5165
            "visibility": null,
5166
            "width": null
5167
          }
5168
        },
5169
        "f9df8cdf043a4aaab82d55f24c17a3d8": {
5170
          "model_module": "@jupyter-widgets/base",
5171
          "model_name": "LayoutModel",
5172
          "model_module_version": "1.2.0",
5173
          "state": {
5174
            "_model_module": "@jupyter-widgets/base",
5175
            "_model_module_version": "1.2.0",
5176
            "_model_name": "LayoutModel",
5177
            "_view_count": null,
5178
            "_view_module": "@jupyter-widgets/base",
5179
            "_view_module_version": "1.2.0",
5180
            "_view_name": "LayoutView",
5181
            "align_content": null,
5182
            "align_items": null,
5183
            "align_self": null,
5184
            "border": null,
5185
            "bottom": null,
5186
            "display": null,
5187
            "flex": null,
5188
            "flex_flow": null,
5189
            "grid_area": null,
5190
            "grid_auto_columns": null,
5191
            "grid_auto_flow": null,
5192
            "grid_auto_rows": null,
5193
            "grid_column": null,
5194
            "grid_gap": null,
5195
            "grid_row": null,
5196
            "grid_template_areas": null,
5197
            "grid_template_columns": null,
5198
            "grid_template_rows": null,
5199
            "height": null,
5200
            "justify_content": null,
5201
            "justify_items": null,
5202
            "left": null,
5203
            "margin": null,
5204
            "max_height": null,
5205
            "max_width": null,
5206
            "min_height": null,
5207
            "min_width": null,
5208
            "object_fit": null,
5209
            "object_position": null,
5210
            "order": null,
5211
            "overflow": null,
5212
            "overflow_x": null,
5213
            "overflow_y": null,
5214
            "padding": null,
5215
            "right": null,
5216
            "top": null,
5217
            "visibility": null,
5218
            "width": null
5219
          }
5220
        },
5221
        "4efaf38f2eaa46799c2afecb55ccf14c": {
5222
          "model_module": "@jupyter-widgets/controls",
5223
          "model_name": "DescriptionStyleModel",
5224
          "model_module_version": "1.5.0",
5225
          "state": {
5226
            "_model_module": "@jupyter-widgets/controls",
5227
            "_model_module_version": "1.5.0",
5228
            "_model_name": "DescriptionStyleModel",
5229
            "_view_count": null,
5230
            "_view_module": "@jupyter-widgets/base",
5231
            "_view_module_version": "1.2.0",
5232
            "_view_name": "StyleView",
5233
            "description_width": ""
5234
          }
5235
        },
5236
        "498424778ff94f7ea6e6f32e8cd95868": {
5237
          "model_module": "@jupyter-widgets/base",
5238
          "model_name": "LayoutModel",
5239
          "model_module_version": "1.2.0",
5240
          "state": {
5241
            "_model_module": "@jupyter-widgets/base",
5242
            "_model_module_version": "1.2.0",
5243
            "_model_name": "LayoutModel",
5244
            "_view_count": null,
5245
            "_view_module": "@jupyter-widgets/base",
5246
            "_view_module_version": "1.2.0",
5247
            "_view_name": "LayoutView",
5248
            "align_content": null,
5249
            "align_items": null,
5250
            "align_self": null,
5251
            "border": null,
5252
            "bottom": null,
5253
            "display": null,
5254
            "flex": null,
5255
            "flex_flow": null,
5256
            "grid_area": null,
5257
            "grid_auto_columns": null,
5258
            "grid_auto_flow": null,
5259
            "grid_auto_rows": null,
5260
            "grid_column": null,
5261
            "grid_gap": null,
5262
            "grid_row": null,
5263
            "grid_template_areas": null,
5264
            "grid_template_columns": null,
5265
            "grid_template_rows": null,
5266
            "height": null,
5267
            "justify_content": null,
5268
            "justify_items": null,
5269
            "left": null,
5270
            "margin": null,
5271
            "max_height": null,
5272
            "max_width": null,
5273
            "min_height": null,
5274
            "min_width": null,
5275
            "object_fit": null,
5276
            "object_position": null,
5277
            "order": null,
5278
            "overflow": null,
5279
            "overflow_x": null,
5280
            "overflow_y": null,
5281
            "padding": null,
5282
            "right": null,
5283
            "top": null,
5284
            "visibility": null,
5285
            "width": null
5286
          }
5287
        },
5288
        "6b654ce3193745208af00288d6f9d5f9": {
5289
          "model_module": "@jupyter-widgets/controls",
5290
          "model_name": "ProgressStyleModel",
5291
          "model_module_version": "1.5.0",
5292
          "state": {
5293
            "_model_module": "@jupyter-widgets/controls",
5294
            "_model_module_version": "1.5.0",
5295
            "_model_name": "ProgressStyleModel",
5296
            "_view_count": null,
5297
            "_view_module": "@jupyter-widgets/base",
5298
            "_view_module_version": "1.2.0",
5299
            "_view_name": "StyleView",
5300
            "bar_color": null,
5301
            "description_width": ""
5302
          }
5303
        },
5304
        "681653beca9b4a6591f7008e0ff5ac3b": {
5305
          "model_module": "@jupyter-widgets/base",
5306
          "model_name": "LayoutModel",
5307
          "model_module_version": "1.2.0",
5308
          "state": {
5309
            "_model_module": "@jupyter-widgets/base",
5310
            "_model_module_version": "1.2.0",
5311
            "_model_name": "LayoutModel",
5312
            "_view_count": null,
5313
            "_view_module": "@jupyter-widgets/base",
5314
            "_view_module_version": "1.2.0",
5315
            "_view_name": "LayoutView",
5316
            "align_content": null,
5317
            "align_items": null,
5318
            "align_self": null,
5319
            "border": null,
5320
            "bottom": null,
5321
            "display": null,
5322
            "flex": null,
5323
            "flex_flow": null,
5324
            "grid_area": null,
5325
            "grid_auto_columns": null,
5326
            "grid_auto_flow": null,
5327
            "grid_auto_rows": null,
5328
            "grid_column": null,
5329
            "grid_gap": null,
5330
            "grid_row": null,
5331
            "grid_template_areas": null,
5332
            "grid_template_columns": null,
5333
            "grid_template_rows": null,
5334
            "height": null,
5335
            "justify_content": null,
5336
            "justify_items": null,
5337
            "left": null,
5338
            "margin": null,
5339
            "max_height": null,
5340
            "max_width": null,
5341
            "min_height": null,
5342
            "min_width": null,
5343
            "object_fit": null,
5344
            "object_position": null,
5345
            "order": null,
5346
            "overflow": null,
5347
            "overflow_x": null,
5348
            "overflow_y": null,
5349
            "padding": null,
5350
            "right": null,
5351
            "top": null,
5352
            "visibility": null,
5353
            "width": null
5354
          }
5355
        },
5356
        "997bd19e08ff48bc92a83487598be156": {
5357
          "model_module": "@jupyter-widgets/controls",
5358
          "model_name": "DescriptionStyleModel",
5359
          "model_module_version": "1.5.0",
5360
          "state": {
5361
            "_model_module": "@jupyter-widgets/controls",
5362
            "_model_module_version": "1.5.0",
5363
            "_model_name": "DescriptionStyleModel",
5364
            "_view_count": null,
5365
            "_view_module": "@jupyter-widgets/base",
5366
            "_view_module_version": "1.2.0",
5367
            "_view_name": "StyleView",
5368
            "description_width": ""
5369
          }
5370
        },
5371
        "27e56e4591da430fb5f62b5d49df7e9e": {
5372
          "model_module": "@jupyter-widgets/controls",
5373
          "model_name": "HBoxModel",
5374
          "model_module_version": "1.5.0",
5375
          "state": {
5376
            "_dom_classes": [],
5377
            "_model_module": "@jupyter-widgets/controls",
5378
            "_model_module_version": "1.5.0",
5379
            "_model_name": "HBoxModel",
5380
            "_view_count": null,
5381
            "_view_module": "@jupyter-widgets/controls",
5382
            "_view_module_version": "1.5.0",
5383
            "_view_name": "HBoxView",
5384
            "box_style": "",
5385
            "children": [
5386
              "IPY_MODEL_b90e6e929c164e3384cb0067555f66a4",
5387
              "IPY_MODEL_5fb49e2af10d452c9558f6f2b7551b16",
5388
              "IPY_MODEL_a6547c497b5b44b59c1de056965de351"
5389
            ],
5390
            "layout": "IPY_MODEL_8732438e1da948e6a4f74cde7a25eb57"
5391
          }
5392
        },
5393
        "b90e6e929c164e3384cb0067555f66a4": {
5394
          "model_module": "@jupyter-widgets/controls",
5395
          "model_name": "HTMLModel",
5396
          "model_module_version": "1.5.0",
5397
          "state": {
5398
            "_dom_classes": [],
5399
            "_model_module": "@jupyter-widgets/controls",
5400
            "_model_module_version": "1.5.0",
5401
            "_model_name": "HTMLModel",
5402
            "_view_count": null,
5403
            "_view_module": "@jupyter-widgets/controls",
5404
            "_view_module_version": "1.5.0",
5405
            "_view_name": "HTMLView",
5406
            "description": "",
5407
            "description_tooltip": null,
5408
            "layout": "IPY_MODEL_cdd90757935f45668a81520522e3f057",
5409
            "placeholder": "​",
5410
            "style": "IPY_MODEL_aa2269ddef7f4e66a42973e5fd3e568f",
5411
            "value": "Downloading (…)neration_config.json: 100%"
5412
          }
5413
        },
5414
        "5fb49e2af10d452c9558f6f2b7551b16": {
5415
          "model_module": "@jupyter-widgets/controls",
5416
          "model_name": "FloatProgressModel",
5417
          "model_module_version": "1.5.0",
5418
          "state": {
5419
            "_dom_classes": [],
5420
            "_model_module": "@jupyter-widgets/controls",
5421
            "_model_module_version": "1.5.0",
5422
            "_model_name": "FloatProgressModel",
5423
            "_view_count": null,
5424
            "_view_module": "@jupyter-widgets/controls",
5425
            "_view_module_version": "1.5.0",
5426
            "_view_name": "ProgressView",
5427
            "bar_style": "success",
5428
            "description": "",
5429
            "description_tooltip": null,
5430
            "layout": "IPY_MODEL_a9d745f127214a4289bf880d65899dd3",
5431
            "max": 69,
5432
            "min": 0,
5433
            "orientation": "horizontal",
5434
            "style": "IPY_MODEL_90884fd8a8d24859b4f94aac4041cfe4",
5435
            "value": 69
5436
          }
5437
        },
5438
        "a6547c497b5b44b59c1de056965de351": {
5439
          "model_module": "@jupyter-widgets/controls",
5440
          "model_name": "HTMLModel",
5441
          "model_module_version": "1.5.0",
5442
          "state": {
5443
            "_dom_classes": [],
5444
            "_model_module": "@jupyter-widgets/controls",
5445
            "_model_module_version": "1.5.0",
5446
            "_model_name": "HTMLModel",
5447
            "_view_count": null,
5448
            "_view_module": "@jupyter-widgets/controls",
5449
            "_view_module_version": "1.5.0",
5450
            "_view_name": "HTMLView",
5451
            "description": "",
5452
            "description_tooltip": null,
5453
            "layout": "IPY_MODEL_0fced73c513242fabd2fc4eb30df1e21",
5454
            "placeholder": "​",
5455
            "style": "IPY_MODEL_22d1d55d6580458fb8fdb4af38ec4690",
5456
            "value": " 69.0/69.0 [00:00&lt;00:00, 4.76kB/s]"
5457
          }
5458
        },
5459
        "8732438e1da948e6a4f74cde7a25eb57": {
5460
          "model_module": "@jupyter-widgets/base",
5461
          "model_name": "LayoutModel",
5462
          "model_module_version": "1.2.0",
5463
          "state": {
5464
            "_model_module": "@jupyter-widgets/base",
5465
            "_model_module_version": "1.2.0",
5466
            "_model_name": "LayoutModel",
5467
            "_view_count": null,
5468
            "_view_module": "@jupyter-widgets/base",
5469
            "_view_module_version": "1.2.0",
5470
            "_view_name": "LayoutView",
5471
            "align_content": null,
5472
            "align_items": null,
5473
            "align_self": null,
5474
            "border": null,
5475
            "bottom": null,
5476
            "display": null,
5477
            "flex": null,
5478
            "flex_flow": null,
5479
            "grid_area": null,
5480
            "grid_auto_columns": null,
5481
            "grid_auto_flow": null,
5482
            "grid_auto_rows": null,
5483
            "grid_column": null,
5484
            "grid_gap": null,
5485
            "grid_row": null,
5486
            "grid_template_areas": null,
5487
            "grid_template_columns": null,
5488
            "grid_template_rows": null,
5489
            "height": null,
5490
            "justify_content": null,
5491
            "justify_items": null,
5492
            "left": null,
5493
            "margin": null,
5494
            "max_height": null,
5495
            "max_width": null,
5496
            "min_height": null,
5497
            "min_width": null,
5498
            "object_fit": null,
5499
            "object_position": null,
5500
            "order": null,
5501
            "overflow": null,
5502
            "overflow_x": null,
5503
            "overflow_y": null,
5504
            "padding": null,
5505
            "right": null,
5506
            "top": null,
5507
            "visibility": null,
5508
            "width": null
5509
          }
5510
        },
5511
        "cdd90757935f45668a81520522e3f057": {
5512
          "model_module": "@jupyter-widgets/base",
5513
          "model_name": "LayoutModel",
5514
          "model_module_version": "1.2.0",
5515
          "state": {
5516
            "_model_module": "@jupyter-widgets/base",
5517
            "_model_module_version": "1.2.0",
5518
            "_model_name": "LayoutModel",
5519
            "_view_count": null,
5520
            "_view_module": "@jupyter-widgets/base",
5521
            "_view_module_version": "1.2.0",
5522
            "_view_name": "LayoutView",
5523
            "align_content": null,
5524
            "align_items": null,
5525
            "align_self": null,
5526
            "border": null,
5527
            "bottom": null,
5528
            "display": null,
5529
            "flex": null,
5530
            "flex_flow": null,
5531
            "grid_area": null,
5532
            "grid_auto_columns": null,
5533
            "grid_auto_flow": null,
5534
            "grid_auto_rows": null,
5535
            "grid_column": null,
5536
            "grid_gap": null,
5537
            "grid_row": null,
5538
            "grid_template_areas": null,
5539
            "grid_template_columns": null,
5540
            "grid_template_rows": null,
5541
            "height": null,
5542
            "justify_content": null,
5543
            "justify_items": null,
5544
            "left": null,
5545
            "margin": null,
5546
            "max_height": null,
5547
            "max_width": null,
5548
            "min_height": null,
5549
            "min_width": null,
5550
            "object_fit": null,
5551
            "object_position": null,
5552
            "order": null,
5553
            "overflow": null,
5554
            "overflow_x": null,
5555
            "overflow_y": null,
5556
            "padding": null,
5557
            "right": null,
5558
            "top": null,
5559
            "visibility": null,
5560
            "width": null
5561
          }
5562
        },
5563
        "aa2269ddef7f4e66a42973e5fd3e568f": {
5564
          "model_module": "@jupyter-widgets/controls",
5565
          "model_name": "DescriptionStyleModel",
5566
          "model_module_version": "1.5.0",
5567
          "state": {
5568
            "_model_module": "@jupyter-widgets/controls",
5569
            "_model_module_version": "1.5.0",
5570
            "_model_name": "DescriptionStyleModel",
5571
            "_view_count": null,
5572
            "_view_module": "@jupyter-widgets/base",
5573
            "_view_module_version": "1.2.0",
5574
            "_view_name": "StyleView",
5575
            "description_width": ""
5576
          }
5577
        },
5578
        "a9d745f127214a4289bf880d65899dd3": {
5579
          "model_module": "@jupyter-widgets/base",
5580
          "model_name": "LayoutModel",
5581
          "model_module_version": "1.2.0",
5582
          "state": {
5583
            "_model_module": "@jupyter-widgets/base",
5584
            "_model_module_version": "1.2.0",
5585
            "_model_name": "LayoutModel",
5586
            "_view_count": null,
5587
            "_view_module": "@jupyter-widgets/base",
5588
            "_view_module_version": "1.2.0",
5589
            "_view_name": "LayoutView",
5590
            "align_content": null,
5591
            "align_items": null,
5592
            "align_self": null,
5593
            "border": null,
5594
            "bottom": null,
5595
            "display": null,
5596
            "flex": null,
5597
            "flex_flow": null,
5598
            "grid_area": null,
5599
            "grid_auto_columns": null,
5600
            "grid_auto_flow": null,
5601
            "grid_auto_rows": null,
5602
            "grid_column": null,
5603
            "grid_gap": null,
5604
            "grid_row": null,
5605
            "grid_template_areas": null,
5606
            "grid_template_columns": null,
5607
            "grid_template_rows": null,
5608
            "height": null,
5609
            "justify_content": null,
5610
            "justify_items": null,
5611
            "left": null,
5612
            "margin": null,
5613
            "max_height": null,
5614
            "max_width": null,
5615
            "min_height": null,
5616
            "min_width": null,
5617
            "object_fit": null,
5618
            "object_position": null,
5619
            "order": null,
5620
            "overflow": null,
5621
            "overflow_x": null,
5622
            "overflow_y": null,
5623
            "padding": null,
5624
            "right": null,
5625
            "top": null,
5626
            "visibility": null,
5627
            "width": null
5628
          }
5629
        },
5630
        "90884fd8a8d24859b4f94aac4041cfe4": {
5631
          "model_module": "@jupyter-widgets/controls",
5632
          "model_name": "ProgressStyleModel",
5633
          "model_module_version": "1.5.0",
5634
          "state": {
5635
            "_model_module": "@jupyter-widgets/controls",
5636
            "_model_module_version": "1.5.0",
5637
            "_model_name": "ProgressStyleModel",
5638
            "_view_count": null,
5639
            "_view_module": "@jupyter-widgets/base",
5640
            "_view_module_version": "1.2.0",
5641
            "_view_name": "StyleView",
5642
            "bar_color": null,
5643
            "description_width": ""
5644
          }
5645
        },
5646
        "0fced73c513242fabd2fc4eb30df1e21": {
5647
          "model_module": "@jupyter-widgets/base",
5648
          "model_name": "LayoutModel",
5649
          "model_module_version": "1.2.0",
5650
          "state": {
5651
            "_model_module": "@jupyter-widgets/base",
5652
            "_model_module_version": "1.2.0",
5653
            "_model_name": "LayoutModel",
5654
            "_view_count": null,
5655
            "_view_module": "@jupyter-widgets/base",
5656
            "_view_module_version": "1.2.0",
5657
            "_view_name": "LayoutView",
5658
            "align_content": null,
5659
            "align_items": null,
5660
            "align_self": null,
5661
            "border": null,
5662
            "bottom": null,
5663
            "display": null,
5664
            "flex": null,
5665
            "flex_flow": null,
5666
            "grid_area": null,
5667
            "grid_auto_columns": null,
5668
            "grid_auto_flow": null,
5669
            "grid_auto_rows": null,
5670
            "grid_column": null,
5671
            "grid_gap": null,
5672
            "grid_row": null,
5673
            "grid_template_areas": null,
5674
            "grid_template_columns": null,
5675
            "grid_template_rows": null,
5676
            "height": null,
5677
            "justify_content": null,
5678
            "justify_items": null,
5679
            "left": null,
5680
            "margin": null,
5681
            "max_height": null,
5682
            "max_width": null,
5683
            "min_height": null,
5684
            "min_width": null,
5685
            "object_fit": null,
5686
            "object_position": null,
5687
            "order": null,
5688
            "overflow": null,
5689
            "overflow_x": null,
5690
            "overflow_y": null,
5691
            "padding": null,
5692
            "right": null,
5693
            "top": null,
5694
            "visibility": null,
5695
            "width": null
5696
          }
5697
        },
5698
        "22d1d55d6580458fb8fdb4af38ec4690": {
5699
          "model_module": "@jupyter-widgets/controls",
5700
          "model_name": "DescriptionStyleModel",
5701
          "model_module_version": "1.5.0",
5702
          "state": {
5703
            "_model_module": "@jupyter-widgets/controls",
5704
            "_model_module_version": "1.5.0",
5705
            "_model_name": "DescriptionStyleModel",
5706
            "_view_count": null,
5707
            "_view_module": "@jupyter-widgets/base",
5708
            "_view_module_version": "1.2.0",
5709
            "_view_name": "StyleView",
5710
            "description_width": ""
5711
          }
5712
        },
5713
        "a4acb6dc90144e729a615bb9b6e2db55": {
5714
          "model_module": "@jupyter-widgets/controls",
5715
          "model_name": "HBoxModel",
5716
          "model_module_version": "1.5.0",
5717
          "state": {
5718
            "_dom_classes": [],
5719
            "_model_module": "@jupyter-widgets/controls",
5720
            "_model_module_version": "1.5.0",
5721
            "_model_name": "HBoxModel",
5722
            "_view_count": null,
5723
            "_view_module": "@jupyter-widgets/controls",
5724
            "_view_module_version": "1.5.0",
5725
            "_view_name": "HBoxView",
5726
            "box_style": "",
5727
            "children": [
5728
              "IPY_MODEL_3bc8f617a46e47fb8676ffee9cc25fba",
5729
              "IPY_MODEL_fe82a3b74c5b4f79aa367fe5d8f79345",
5730
              "IPY_MODEL_387d62eb068e44619908b006079eacd7"
5731
            ],
5732
            "layout": "IPY_MODEL_e6d16b50198a450c876640e34d17140e"
5733
          }
5734
        },
5735
        "3bc8f617a46e47fb8676ffee9cc25fba": {
5736
          "model_module": "@jupyter-widgets/controls",
5737
          "model_name": "HTMLModel",
5738
          "model_module_version": "1.5.0",
5739
          "state": {
5740
            "_dom_classes": [],
5741
            "_model_module": "@jupyter-widgets/controls",
5742
            "_model_module_version": "1.5.0",
5743
            "_model_name": "HTMLModel",
5744
            "_view_count": null,
5745
            "_view_module": "@jupyter-widgets/controls",
5746
            "_view_module_version": "1.5.0",
5747
            "_view_name": "HTMLView",
5748
            "description": "",
5749
            "description_tooltip": null,
5750
            "layout": "IPY_MODEL_b4a34fe788034852876cc1886c28042f",
5751
            "placeholder": "​",
5752
            "style": "IPY_MODEL_265d6ad184a74be9b9e8d7378bb98f8d",
5753
            "value": "Downloading (…)okenizer_config.json: 100%"
5754
          }
5755
        },
5756
        "fe82a3b74c5b4f79aa367fe5d8f79345": {
5757
          "model_module": "@jupyter-widgets/controls",
5758
          "model_name": "FloatProgressModel",
5759
          "model_module_version": "1.5.0",
5760
          "state": {
5761
            "_dom_classes": [],
5762
            "_model_module": "@jupyter-widgets/controls",
5763
            "_model_module_version": "1.5.0",
5764
            "_model_name": "FloatProgressModel",
5765
            "_view_count": null,
5766
            "_view_module": "@jupyter-widgets/controls",
5767
            "_view_module_version": "1.5.0",
5768
            "_view_name": "ProgressView",
5769
            "bar_style": "success",
5770
            "description": "",
5771
            "description_tooltip": null,
5772
            "layout": "IPY_MODEL_e25b91678ed246cd997cec87e918c079",
5773
            "max": 237,
5774
            "min": 0,
5775
            "orientation": "horizontal",
5776
            "style": "IPY_MODEL_7bf39b13ce4148ca8fe508c73b63e413",
5777
            "value": 237
5778
          }
5779
        },
5780
        "387d62eb068e44619908b006079eacd7": {
5781
          "model_module": "@jupyter-widgets/controls",
5782
          "model_name": "HTMLModel",
5783
          "model_module_version": "1.5.0",
5784
          "state": {
5785
            "_dom_classes": [],
5786
            "_model_module": "@jupyter-widgets/controls",
5787
            "_model_module_version": "1.5.0",
5788
            "_model_name": "HTMLModel",
5789
            "_view_count": null,
5790
            "_view_module": "@jupyter-widgets/controls",
5791
            "_view_module_version": "1.5.0",
5792
            "_view_name": "HTMLView",
5793
            "description": "",
5794
            "description_tooltip": null,
5795
            "layout": "IPY_MODEL_b0e8f79bf6b74f08801f385b4c7aadee",
5796
            "placeholder": "​",
5797
            "style": "IPY_MODEL_8a8d6a4614e14aaeb03e4bfa9b8a0741",
5798
            "value": " 237/237 [00:00&lt;00:00, 13.1kB/s]"
5799
          }
5800
        },
5801
        "e6d16b50198a450c876640e34d17140e": {
5802
          "model_module": "@jupyter-widgets/base",
5803
          "model_name": "LayoutModel",
5804
          "model_module_version": "1.2.0",
5805
          "state": {
5806
            "_model_module": "@jupyter-widgets/base",
5807
            "_model_module_version": "1.2.0",
5808
            "_model_name": "LayoutModel",
5809
            "_view_count": null,
5810
            "_view_module": "@jupyter-widgets/base",
5811
            "_view_module_version": "1.2.0",
5812
            "_view_name": "LayoutView",
5813
            "align_content": null,
5814
            "align_items": null,
5815
            "align_self": null,
5816
            "border": null,
5817
            "bottom": null,
5818
            "display": null,
5819
            "flex": null,
5820
            "flex_flow": null,
5821
            "grid_area": null,
5822
            "grid_auto_columns": null,
5823
            "grid_auto_flow": null,
5824
            "grid_auto_rows": null,
5825
            "grid_column": null,
5826
            "grid_gap": null,
5827
            "grid_row": null,
5828
            "grid_template_areas": null,
5829
            "grid_template_columns": null,
5830
            "grid_template_rows": null,
5831
            "height": null,
5832
            "justify_content": null,
5833
            "justify_items": null,
5834
            "left": null,
5835
            "margin": null,
5836
            "max_height": null,
5837
            "max_width": null,
5838
            "min_height": null,
5839
            "min_width": null,
5840
            "object_fit": null,
5841
            "object_position": null,
5842
            "order": null,
5843
            "overflow": null,
5844
            "overflow_x": null,
5845
            "overflow_y": null,
5846
            "padding": null,
5847
            "right": null,
5848
            "top": null,
5849
            "visibility": null,
5850
            "width": null
5851
          }
5852
        },
5853
        "b4a34fe788034852876cc1886c28042f": {
5854
          "model_module": "@jupyter-widgets/base",
5855
          "model_name": "LayoutModel",
5856
          "model_module_version": "1.2.0",
5857
          "state": {
5858
            "_model_module": "@jupyter-widgets/base",
5859
            "_model_module_version": "1.2.0",
5860
            "_model_name": "LayoutModel",
5861
            "_view_count": null,
5862
            "_view_module": "@jupyter-widgets/base",
5863
            "_view_module_version": "1.2.0",
5864
            "_view_name": "LayoutView",
5865
            "align_content": null,
5866
            "align_items": null,
5867
            "align_self": null,
5868
            "border": null,
5869
            "bottom": null,
5870
            "display": null,
5871
            "flex": null,
5872
            "flex_flow": null,
5873
            "grid_area": null,
5874
            "grid_auto_columns": null,
5875
            "grid_auto_flow": null,
5876
            "grid_auto_rows": null,
5877
            "grid_column": null,
5878
            "grid_gap": null,
5879
            "grid_row": null,
5880
            "grid_template_areas": null,
5881
            "grid_template_columns": null,
5882
            "grid_template_rows": null,
5883
            "height": null,
5884
            "justify_content": null,
5885
            "justify_items": null,
5886
            "left": null,
5887
            "margin": null,
5888
            "max_height": null,
5889
            "max_width": null,
5890
            "min_height": null,
5891
            "min_width": null,
5892
            "object_fit": null,
5893
            "object_position": null,
5894
            "order": null,
5895
            "overflow": null,
5896
            "overflow_x": null,
5897
            "overflow_y": null,
5898
            "padding": null,
5899
            "right": null,
5900
            "top": null,
5901
            "visibility": null,
5902
            "width": null
5903
          }
5904
        },
5905
        "265d6ad184a74be9b9e8d7378bb98f8d": {
5906
          "model_module": "@jupyter-widgets/controls",
5907
          "model_name": "DescriptionStyleModel",
5908
          "model_module_version": "1.5.0",
5909
          "state": {
5910
            "_model_module": "@jupyter-widgets/controls",
5911
            "_model_module_version": "1.5.0",
5912
            "_model_name": "DescriptionStyleModel",
5913
            "_view_count": null,
5914
            "_view_module": "@jupyter-widgets/base",
5915
            "_view_module_version": "1.2.0",
5916
            "_view_name": "StyleView",
5917
            "description_width": ""
5918
          }
5919
        },
5920
        "e25b91678ed246cd997cec87e918c079": {
5921
          "model_module": "@jupyter-widgets/base",
5922
          "model_name": "LayoutModel",
5923
          "model_module_version": "1.2.0",
5924
          "state": {
5925
            "_model_module": "@jupyter-widgets/base",
5926
            "_model_module_version": "1.2.0",
5927
            "_model_name": "LayoutModel",
5928
            "_view_count": null,
5929
            "_view_module": "@jupyter-widgets/base",
5930
            "_view_module_version": "1.2.0",
5931
            "_view_name": "LayoutView",
5932
            "align_content": null,
5933
            "align_items": null,
5934
            "align_self": null,
5935
            "border": null,
5936
            "bottom": null,
5937
            "display": null,
5938
            "flex": null,
5939
            "flex_flow": null,
5940
            "grid_area": null,
5941
            "grid_auto_columns": null,
5942
            "grid_auto_flow": null,
5943
            "grid_auto_rows": null,
5944
            "grid_column": null,
5945
            "grid_gap": null,
5946
            "grid_row": null,
5947
            "grid_template_areas": null,
5948
            "grid_template_columns": null,
5949
            "grid_template_rows": null,
5950
            "height": null,
5951
            "justify_content": null,
5952
            "justify_items": null,
5953
            "left": null,
5954
            "margin": null,
5955
            "max_height": null,
5956
            "max_width": null,
5957
            "min_height": null,
5958
            "min_width": null,
5959
            "object_fit": null,
5960
            "object_position": null,
5961
            "order": null,
5962
            "overflow": null,
5963
            "overflow_x": null,
5964
            "overflow_y": null,
5965
            "padding": null,
5966
            "right": null,
5967
            "top": null,
5968
            "visibility": null,
5969
            "width": null
5970
          }
5971
        },
5972
        "7bf39b13ce4148ca8fe508c73b63e413": {
5973
          "model_module": "@jupyter-widgets/controls",
5974
          "model_name": "ProgressStyleModel",
5975
          "model_module_version": "1.5.0",
5976
          "state": {
5977
            "_model_module": "@jupyter-widgets/controls",
5978
            "_model_module_version": "1.5.0",
5979
            "_model_name": "ProgressStyleModel",
5980
            "_view_count": null,
5981
            "_view_module": "@jupyter-widgets/base",
5982
            "_view_module_version": "1.2.0",
5983
            "_view_name": "StyleView",
5984
            "bar_color": null,
5985
            "description_width": ""
5986
          }
5987
        },
5988
        "b0e8f79bf6b74f08801f385b4c7aadee": {
5989
          "model_module": "@jupyter-widgets/base",
5990
          "model_name": "LayoutModel",
5991
          "model_module_version": "1.2.0",
5992
          "state": {
5993
            "_model_module": "@jupyter-widgets/base",
5994
            "_model_module_version": "1.2.0",
5995
            "_model_name": "LayoutModel",
5996
            "_view_count": null,
5997
            "_view_module": "@jupyter-widgets/base",
5998
            "_view_module_version": "1.2.0",
5999
            "_view_name": "LayoutView",
6000
            "align_content": null,
6001
            "align_items": null,
6002
            "align_self": null,
6003
            "border": null,
6004
            "bottom": null,
6005
            "display": null,
6006
            "flex": null,
6007
            "flex_flow": null,
6008
            "grid_area": null,
6009
            "grid_auto_columns": null,
6010
            "grid_auto_flow": null,
6011
            "grid_auto_rows": null,
6012
            "grid_column": null,
6013
            "grid_gap": null,
6014
            "grid_row": null,
6015
            "grid_template_areas": null,
6016
            "grid_template_columns": null,
6017
            "grid_template_rows": null,
6018
            "height": null,
6019
            "justify_content": null,
6020
            "justify_items": null,
6021
            "left": null,
6022
            "margin": null,
6023
            "max_height": null,
6024
            "max_width": null,
6025
            "min_height": null,
6026
            "min_width": null,
6027
            "object_fit": null,
6028
            "object_position": null,
6029
            "order": null,
6030
            "overflow": null,
6031
            "overflow_x": null,
6032
            "overflow_y": null,
6033
            "padding": null,
6034
            "right": null,
6035
            "top": null,
6036
            "visibility": null,
6037
            "width": null
6038
          }
6039
        },
6040
        "8a8d6a4614e14aaeb03e4bfa9b8a0741": {
6041
          "model_module": "@jupyter-widgets/controls",
6042
          "model_name": "DescriptionStyleModel",
6043
          "model_module_version": "1.5.0",
6044
          "state": {
6045
            "_model_module": "@jupyter-widgets/controls",
6046
            "_model_module_version": "1.5.0",
6047
            "_model_name": "DescriptionStyleModel",
6048
            "_view_count": null,
6049
            "_view_module": "@jupyter-widgets/base",
6050
            "_view_module_version": "1.2.0",
6051
            "_view_name": "StyleView",
6052
            "description_width": ""
6053
          }
6054
        },
6055
        "f14e8afa14b74002af2be74b84d8b033": {
6056
          "model_module": "@jupyter-widgets/controls",
6057
          "model_name": "HBoxModel",
6058
          "model_module_version": "1.5.0",
6059
          "state": {
6060
            "_dom_classes": [],
6061
            "_model_module": "@jupyter-widgets/controls",
6062
            "_model_module_version": "1.5.0",
6063
            "_model_name": "HBoxModel",
6064
            "_view_count": null,
6065
            "_view_module": "@jupyter-widgets/controls",
6066
            "_view_module_version": "1.5.0",
6067
            "_view_name": "HBoxView",
6068
            "box_style": "",
6069
            "children": [
6070
              "IPY_MODEL_17cc56f07af34e588c3d3e0cdba0b458",
6071
              "IPY_MODEL_9439477ef5b64c1ba5c517d76c2c460f",
6072
              "IPY_MODEL_fc8787cef48c4befae588efa56f99adc"
6073
            ],
6074
            "layout": "IPY_MODEL_fd97aec74a1148b0b94de3f2194a0558"
6075
          }
6076
        },
6077
        "17cc56f07af34e588c3d3e0cdba0b458": {
6078
          "model_module": "@jupyter-widgets/controls",
6079
          "model_name": "HTMLModel",
6080
          "model_module_version": "1.5.0",
6081
          "state": {
6082
            "_dom_classes": [],
6083
            "_model_module": "@jupyter-widgets/controls",
6084
            "_model_module_version": "1.5.0",
6085
            "_model_name": "HTMLModel",
6086
            "_view_count": null,
6087
            "_view_module": "@jupyter-widgets/controls",
6088
            "_view_module_version": "1.5.0",
6089
            "_view_name": "HTMLView",
6090
            "description": "",
6091
            "description_tooltip": null,
6092
            "layout": "IPY_MODEL_cf54b45acb1d40d4a34189e76ffa831c",
6093
            "placeholder": "​",
6094
            "style": "IPY_MODEL_1cbd0d65bcf9496c85e07225be76ffdf",
6095
            "value": "Downloading (…)olve/main/vocab.json: 100%"
6096
          }
6097
        },
6098
        "9439477ef5b64c1ba5c517d76c2c460f": {
6099
          "model_module": "@jupyter-widgets/controls",
6100
          "model_name": "FloatProgressModel",
6101
          "model_module_version": "1.5.0",
6102
          "state": {
6103
            "_dom_classes": [],
6104
            "_model_module": "@jupyter-widgets/controls",
6105
            "_model_module_version": "1.5.0",
6106
            "_model_name": "FloatProgressModel",
6107
            "_view_count": null,
6108
            "_view_module": "@jupyter-widgets/controls",
6109
            "_view_module_version": "1.5.0",
6110
            "_view_name": "ProgressView",
6111
            "bar_style": "success",
6112
            "description": "",
6113
            "description_tooltip": null,
6114
            "layout": "IPY_MODEL_4689e3a07503492eb11986bf5e8a864f",
6115
            "max": 798156,
6116
            "min": 0,
6117
            "orientation": "horizontal",
6118
            "style": "IPY_MODEL_4d443929f61f4991bc88caeb94adaaa3",
6119
            "value": 798156
6120
          }
6121
        },
6122
        "fc8787cef48c4befae588efa56f99adc": {
6123
          "model_module": "@jupyter-widgets/controls",
6124
          "model_name": "HTMLModel",
6125
          "model_module_version": "1.5.0",
6126
          "state": {
6127
            "_dom_classes": [],
6128
            "_model_module": "@jupyter-widgets/controls",
6129
            "_model_module_version": "1.5.0",
6130
            "_model_name": "HTMLModel",
6131
            "_view_count": null,
6132
            "_view_module": "@jupyter-widgets/controls",
6133
            "_view_module_version": "1.5.0",
6134
            "_view_name": "HTMLView",
6135
            "description": "",
6136
            "description_tooltip": null,
6137
            "layout": "IPY_MODEL_9f60e630e47841ba91855613da83e295",
6138
            "placeholder": "​",
6139
            "style": "IPY_MODEL_12332fa62a8f4b6f974eb37bf8eddaf2",
6140
            "value": " 798k/798k [00:00&lt;00:00, 16.8MB/s]"
6141
          }
6142
        },
6143
        "fd97aec74a1148b0b94de3f2194a0558": {
6144
          "model_module": "@jupyter-widgets/base",
6145
          "model_name": "LayoutModel",
6146
          "model_module_version": "1.2.0",
6147
          "state": {
6148
            "_model_module": "@jupyter-widgets/base",
6149
            "_model_module_version": "1.2.0",
6150
            "_model_name": "LayoutModel",
6151
            "_view_count": null,
6152
            "_view_module": "@jupyter-widgets/base",
6153
            "_view_module_version": "1.2.0",
6154
            "_view_name": "LayoutView",
6155
            "align_content": null,
6156
            "align_items": null,
6157
            "align_self": null,
6158
            "border": null,
6159
            "bottom": null,
6160
            "display": null,
6161
            "flex": null,
6162
            "flex_flow": null,
6163
            "grid_area": null,
6164
            "grid_auto_columns": null,
6165
            "grid_auto_flow": null,
6166
            "grid_auto_rows": null,
6167
            "grid_column": null,
6168
            "grid_gap": null,
6169
            "grid_row": null,
6170
            "grid_template_areas": null,
6171
            "grid_template_columns": null,
6172
            "grid_template_rows": null,
6173
            "height": null,
6174
            "justify_content": null,
6175
            "justify_items": null,
6176
            "left": null,
6177
            "margin": null,
6178
            "max_height": null,
6179
            "max_width": null,
6180
            "min_height": null,
6181
            "min_width": null,
6182
            "object_fit": null,
6183
            "object_position": null,
6184
            "order": null,
6185
            "overflow": null,
6186
            "overflow_x": null,
6187
            "overflow_y": null,
6188
            "padding": null,
6189
            "right": null,
6190
            "top": null,
6191
            "visibility": null,
6192
            "width": null
6193
          }
6194
        },
6195
        "cf54b45acb1d40d4a34189e76ffa831c": {
6196
          "model_module": "@jupyter-widgets/base",
6197
          "model_name": "LayoutModel",
6198
          "model_module_version": "1.2.0",
6199
          "state": {
6200
            "_model_module": "@jupyter-widgets/base",
6201
            "_model_module_version": "1.2.0",
6202
            "_model_name": "LayoutModel",
6203
            "_view_count": null,
6204
            "_view_module": "@jupyter-widgets/base",
6205
            "_view_module_version": "1.2.0",
6206
            "_view_name": "LayoutView",
6207
            "align_content": null,
6208
            "align_items": null,
6209
            "align_self": null,
6210
            "border": null,
6211
            "bottom": null,
6212
            "display": null,
6213
            "flex": null,
6214
            "flex_flow": null,
6215
            "grid_area": null,
6216
            "grid_auto_columns": null,
6217
            "grid_auto_flow": null,
6218
            "grid_auto_rows": null,
6219
            "grid_column": null,
6220
            "grid_gap": null,
6221
            "grid_row": null,
6222
            "grid_template_areas": null,
6223
            "grid_template_columns": null,
6224
            "grid_template_rows": null,
6225
            "height": null,
6226
            "justify_content": null,
6227
            "justify_items": null,
6228
            "left": null,
6229
            "margin": null,
6230
            "max_height": null,
6231
            "max_width": null,
6232
            "min_height": null,
6233
            "min_width": null,
6234
            "object_fit": null,
6235
            "object_position": null,
6236
            "order": null,
6237
            "overflow": null,
6238
            "overflow_x": null,
6239
            "overflow_y": null,
6240
            "padding": null,
6241
            "right": null,
6242
            "top": null,
6243
            "visibility": null,
6244
            "width": null
6245
          }
6246
        },
6247
        "1cbd0d65bcf9496c85e07225be76ffdf": {
6248
          "model_module": "@jupyter-widgets/controls",
6249
          "model_name": "DescriptionStyleModel",
6250
          "model_module_version": "1.5.0",
6251
          "state": {
6252
            "_model_module": "@jupyter-widgets/controls",
6253
            "_model_module_version": "1.5.0",
6254
            "_model_name": "DescriptionStyleModel",
6255
            "_view_count": null,
6256
            "_view_module": "@jupyter-widgets/base",
6257
            "_view_module_version": "1.2.0",
6258
            "_view_name": "StyleView",
6259
            "description_width": ""
6260
          }
6261
        },
6262
        "4689e3a07503492eb11986bf5e8a864f": {
6263
          "model_module": "@jupyter-widgets/base",
6264
          "model_name": "LayoutModel",
6265
          "model_module_version": "1.2.0",
6266
          "state": {
6267
            "_model_module": "@jupyter-widgets/base",
6268
            "_model_module_version": "1.2.0",
6269
            "_model_name": "LayoutModel",
6270
            "_view_count": null,
6271
            "_view_module": "@jupyter-widgets/base",
6272
            "_view_module_version": "1.2.0",
6273
            "_view_name": "LayoutView",
6274
            "align_content": null,
6275
            "align_items": null,
6276
            "align_self": null,
6277
            "border": null,
6278
            "bottom": null,
6279
            "display": null,
6280
            "flex": null,
6281
            "flex_flow": null,
6282
            "grid_area": null,
6283
            "grid_auto_columns": null,
6284
            "grid_auto_flow": null,
6285
            "grid_auto_rows": null,
6286
            "grid_column": null,
6287
            "grid_gap": null,
6288
            "grid_row": null,
6289
            "grid_template_areas": null,
6290
            "grid_template_columns": null,
6291
            "grid_template_rows": null,
6292
            "height": null,
6293
            "justify_content": null,
6294
            "justify_items": null,
6295
            "left": null,
6296
            "margin": null,
6297
            "max_height": null,
6298
            "max_width": null,
6299
            "min_height": null,
6300
            "min_width": null,
6301
            "object_fit": null,
6302
            "object_position": null,
6303
            "order": null,
6304
            "overflow": null,
6305
            "overflow_x": null,
6306
            "overflow_y": null,
6307
            "padding": null,
6308
            "right": null,
6309
            "top": null,
6310
            "visibility": null,
6311
            "width": null
6312
          }
6313
        },
6314
        "4d443929f61f4991bc88caeb94adaaa3": {
6315
          "model_module": "@jupyter-widgets/controls",
6316
          "model_name": "ProgressStyleModel",
6317
          "model_module_version": "1.5.0",
6318
          "state": {
6319
            "_model_module": "@jupyter-widgets/controls",
6320
            "_model_module_version": "1.5.0",
6321
            "_model_name": "ProgressStyleModel",
6322
            "_view_count": null,
6323
            "_view_module": "@jupyter-widgets/base",
6324
            "_view_module_version": "1.2.0",
6325
            "_view_name": "StyleView",
6326
            "bar_color": null,
6327
            "description_width": ""
6328
          }
6329
        },
6330
        "9f60e630e47841ba91855613da83e295": {
6331
          "model_module": "@jupyter-widgets/base",
6332
          "model_name": "LayoutModel",
6333
          "model_module_version": "1.2.0",
6334
          "state": {
6335
            "_model_module": "@jupyter-widgets/base",
6336
            "_model_module_version": "1.2.0",
6337
            "_model_name": "LayoutModel",
6338
            "_view_count": null,
6339
            "_view_module": "@jupyter-widgets/base",
6340
            "_view_module_version": "1.2.0",
6341
            "_view_name": "LayoutView",
6342
            "align_content": null,
6343
            "align_items": null,
6344
            "align_self": null,
6345
            "border": null,
6346
            "bottom": null,
6347
            "display": null,
6348
            "flex": null,
6349
            "flex_flow": null,
6350
            "grid_area": null,
6351
            "grid_auto_columns": null,
6352
            "grid_auto_flow": null,
6353
            "grid_auto_rows": null,
6354
            "grid_column": null,
6355
            "grid_gap": null,
6356
            "grid_row": null,
6357
            "grid_template_areas": null,
6358
            "grid_template_columns": null,
6359
            "grid_template_rows": null,
6360
            "height": null,
6361
            "justify_content": null,
6362
            "justify_items": null,
6363
            "left": null,
6364
            "margin": null,
6365
            "max_height": null,
6366
            "max_width": null,
6367
            "min_height": null,
6368
            "min_width": null,
6369
            "object_fit": null,
6370
            "object_position": null,
6371
            "order": null,
6372
            "overflow": null,
6373
            "overflow_x": null,
6374
            "overflow_y": null,
6375
            "padding": null,
6376
            "right": null,
6377
            "top": null,
6378
            "visibility": null,
6379
            "width": null
6380
          }
6381
        },
6382
        "12332fa62a8f4b6f974eb37bf8eddaf2": {
6383
          "model_module": "@jupyter-widgets/controls",
6384
          "model_name": "DescriptionStyleModel",
6385
          "model_module_version": "1.5.0",
6386
          "state": {
6387
            "_model_module": "@jupyter-widgets/controls",
6388
            "_model_module_version": "1.5.0",
6389
            "_model_name": "DescriptionStyleModel",
6390
            "_view_count": null,
6391
            "_view_module": "@jupyter-widgets/base",
6392
            "_view_module_version": "1.2.0",
6393
            "_view_name": "StyleView",
6394
            "description_width": ""
6395
          }
6396
        },
6397
        "e333b53d363b47648ab6694e25b68ad7": {
6398
          "model_module": "@jupyter-widgets/controls",
6399
          "model_name": "HBoxModel",
6400
          "model_module_version": "1.5.0",
6401
          "state": {
6402
            "_dom_classes": [],
6403
            "_model_module": "@jupyter-widgets/controls",
6404
            "_model_module_version": "1.5.0",
6405
            "_model_name": "HBoxModel",
6406
            "_view_count": null,
6407
            "_view_module": "@jupyter-widgets/controls",
6408
            "_view_module_version": "1.5.0",
6409
            "_view_name": "HBoxView",
6410
            "box_style": "",
6411
            "children": [
6412
              "IPY_MODEL_5e9ebdfb88fa413b88fdf2dd5bc2a3a1",
6413
              "IPY_MODEL_058ff0fedb9545199d11930a9aa1deec",
6414
              "IPY_MODEL_6996b093bc5a4ba385dfd134f687e8db"
6415
            ],
6416
            "layout": "IPY_MODEL_e1a107dbb4784261b608c382895e7daf"
6417
          }
6418
        },
6419
        "5e9ebdfb88fa413b88fdf2dd5bc2a3a1": {
6420
          "model_module": "@jupyter-widgets/controls",
6421
          "model_name": "HTMLModel",
6422
          "model_module_version": "1.5.0",
6423
          "state": {
6424
            "_dom_classes": [],
6425
            "_model_module": "@jupyter-widgets/controls",
6426
            "_model_module_version": "1.5.0",
6427
            "_model_name": "HTMLModel",
6428
            "_view_count": null,
6429
            "_view_module": "@jupyter-widgets/controls",
6430
            "_view_module_version": "1.5.0",
6431
            "_view_name": "HTMLView",
6432
            "description": "",
6433
            "description_tooltip": null,
6434
            "layout": "IPY_MODEL_73ef312d625542ccaf7994e9300acb1b",
6435
            "placeholder": "​",
6436
            "style": "IPY_MODEL_541a328e5cb84163a1295eeee4494d3f",
6437
            "value": "Downloading (…)olve/main/merges.txt: 100%"
6438
          }
6439
        },
6440
        "058ff0fedb9545199d11930a9aa1deec": {
6441
          "model_module": "@jupyter-widgets/controls",
6442
          "model_name": "FloatProgressModel",
6443
          "model_module_version": "1.5.0",
6444
          "state": {
6445
            "_dom_classes": [],
6446
            "_model_module": "@jupyter-widgets/controls",
6447
            "_model_module_version": "1.5.0",
6448
            "_model_name": "FloatProgressModel",
6449
            "_view_count": null,
6450
            "_view_module": "@jupyter-widgets/controls",
6451
            "_view_module_version": "1.5.0",
6452
            "_view_name": "ProgressView",
6453
            "bar_style": "success",
6454
            "description": "",
6455
            "description_tooltip": null,
6456
            "layout": "IPY_MODEL_db228a2b64c148d98f5db9bfbf2ac5af",
6457
            "max": 456318,
6458
            "min": 0,
6459
            "orientation": "horizontal",
6460
            "style": "IPY_MODEL_85455342596f4e90b98cc41da60b8cb6",
6461
            "value": 456318
6462
          }
6463
        },
6464
        "6996b093bc5a4ba385dfd134f687e8db": {
6465
          "model_module": "@jupyter-widgets/controls",
6466
          "model_name": "HTMLModel",
6467
          "model_module_version": "1.5.0",
6468
          "state": {
6469
            "_dom_classes": [],
6470
            "_model_module": "@jupyter-widgets/controls",
6471
            "_model_module_version": "1.5.0",
6472
            "_model_name": "HTMLModel",
6473
            "_view_count": null,
6474
            "_view_module": "@jupyter-widgets/controls",
6475
            "_view_module_version": "1.5.0",
6476
            "_view_name": "HTMLView",
6477
            "description": "",
6478
            "description_tooltip": null,
6479
            "layout": "IPY_MODEL_22b767cd81db4953959e78d71f604dce",
6480
            "placeholder": "​",
6481
            "style": "IPY_MODEL_9fb8334f33e84dc3a4bb3deaf1e7777c",
6482
            "value": " 456k/456k [00:00&lt;00:00, 8.57MB/s]"
6483
          }
6484
        },
6485
        "e1a107dbb4784261b608c382895e7daf": {
6486
          "model_module": "@jupyter-widgets/base",
6487
          "model_name": "LayoutModel",
6488
          "model_module_version": "1.2.0",
6489
          "state": {
6490
            "_model_module": "@jupyter-widgets/base",
6491
            "_model_module_version": "1.2.0",
6492
            "_model_name": "LayoutModel",
6493
            "_view_count": null,
6494
            "_view_module": "@jupyter-widgets/base",
6495
            "_view_module_version": "1.2.0",
6496
            "_view_name": "LayoutView",
6497
            "align_content": null,
6498
            "align_items": null,
6499
            "align_self": null,
6500
            "border": null,
6501
            "bottom": null,
6502
            "display": null,
6503
            "flex": null,
6504
            "flex_flow": null,
6505
            "grid_area": null,
6506
            "grid_auto_columns": null,
6507
            "grid_auto_flow": null,
6508
            "grid_auto_rows": null,
6509
            "grid_column": null,
6510
            "grid_gap": null,
6511
            "grid_row": null,
6512
            "grid_template_areas": null,
6513
            "grid_template_columns": null,
6514
            "grid_template_rows": null,
6515
            "height": null,
6516
            "justify_content": null,
6517
            "justify_items": null,
6518
            "left": null,
6519
            "margin": null,
6520
            "max_height": null,
6521
            "max_width": null,
6522
            "min_height": null,
6523
            "min_width": null,
6524
            "object_fit": null,
6525
            "object_position": null,
6526
            "order": null,
6527
            "overflow": null,
6528
            "overflow_x": null,
6529
            "overflow_y": null,
6530
            "padding": null,
6531
            "right": null,
6532
            "top": null,
6533
            "visibility": null,
6534
            "width": null
6535
          }
6536
        },
6537
        "73ef312d625542ccaf7994e9300acb1b": {
6538
          "model_module": "@jupyter-widgets/base",
6539
          "model_name": "LayoutModel",
6540
          "model_module_version": "1.2.0",
6541
          "state": {
6542
            "_model_module": "@jupyter-widgets/base",
6543
            "_model_module_version": "1.2.0",
6544
            "_model_name": "LayoutModel",
6545
            "_view_count": null,
6546
            "_view_module": "@jupyter-widgets/base",
6547
            "_view_module_version": "1.2.0",
6548
            "_view_name": "LayoutView",
6549
            "align_content": null,
6550
            "align_items": null,
6551
            "align_self": null,
6552
            "border": null,
6553
            "bottom": null,
6554
            "display": null,
6555
            "flex": null,
6556
            "flex_flow": null,
6557
            "grid_area": null,
6558
            "grid_auto_columns": null,
6559
            "grid_auto_flow": null,
6560
            "grid_auto_rows": null,
6561
            "grid_column": null,
6562
            "grid_gap": null,
6563
            "grid_row": null,
6564
            "grid_template_areas": null,
6565
            "grid_template_columns": null,
6566
            "grid_template_rows": null,
6567
            "height": null,
6568
            "justify_content": null,
6569
            "justify_items": null,
6570
            "left": null,
6571
            "margin": null,
6572
            "max_height": null,
6573
            "max_width": null,
6574
            "min_height": null,
6575
            "min_width": null,
6576
            "object_fit": null,
6577
            "object_position": null,
6578
            "order": null,
6579
            "overflow": null,
6580
            "overflow_x": null,
6581
            "overflow_y": null,
6582
            "padding": null,
6583
            "right": null,
6584
            "top": null,
6585
            "visibility": null,
6586
            "width": null
6587
          }
6588
        },
6589
        "541a328e5cb84163a1295eeee4494d3f": {
6590
          "model_module": "@jupyter-widgets/controls",
6591
          "model_name": "DescriptionStyleModel",
6592
          "model_module_version": "1.5.0",
6593
          "state": {
6594
            "_model_module": "@jupyter-widgets/controls",
6595
            "_model_module_version": "1.5.0",
6596
            "_model_name": "DescriptionStyleModel",
6597
            "_view_count": null,
6598
            "_view_module": "@jupyter-widgets/base",
6599
            "_view_module_version": "1.2.0",
6600
            "_view_name": "StyleView",
6601
            "description_width": ""
6602
          }
6603
        },
6604
        "db228a2b64c148d98f5db9bfbf2ac5af": {
6605
          "model_module": "@jupyter-widgets/base",
6606
          "model_name": "LayoutModel",
6607
          "model_module_version": "1.2.0",
6608
          "state": {
6609
            "_model_module": "@jupyter-widgets/base",
6610
            "_model_module_version": "1.2.0",
6611
            "_model_name": "LayoutModel",
6612
            "_view_count": null,
6613
            "_view_module": "@jupyter-widgets/base",
6614
            "_view_module_version": "1.2.0",
6615
            "_view_name": "LayoutView",
6616
            "align_content": null,
6617
            "align_items": null,
6618
            "align_self": null,
6619
            "border": null,
6620
            "bottom": null,
6621
            "display": null,
6622
            "flex": null,
6623
            "flex_flow": null,
6624
            "grid_area": null,
6625
            "grid_auto_columns": null,
6626
            "grid_auto_flow": null,
6627
            "grid_auto_rows": null,
6628
            "grid_column": null,
6629
            "grid_gap": null,
6630
            "grid_row": null,
6631
            "grid_template_areas": null,
6632
            "grid_template_columns": null,
6633
            "grid_template_rows": null,
6634
            "height": null,
6635
            "justify_content": null,
6636
            "justify_items": null,
6637
            "left": null,
6638
            "margin": null,
6639
            "max_height": null,
6640
            "max_width": null,
6641
            "min_height": null,
6642
            "min_width": null,
6643
            "object_fit": null,
6644
            "object_position": null,
6645
            "order": null,
6646
            "overflow": null,
6647
            "overflow_x": null,
6648
            "overflow_y": null,
6649
            "padding": null,
6650
            "right": null,
6651
            "top": null,
6652
            "visibility": null,
6653
            "width": null
6654
          }
6655
        },
6656
        "85455342596f4e90b98cc41da60b8cb6": {
6657
          "model_module": "@jupyter-widgets/controls",
6658
          "model_name": "ProgressStyleModel",
6659
          "model_module_version": "1.5.0",
6660
          "state": {
6661
            "_model_module": "@jupyter-widgets/controls",
6662
            "_model_module_version": "1.5.0",
6663
            "_model_name": "ProgressStyleModel",
6664
            "_view_count": null,
6665
            "_view_module": "@jupyter-widgets/base",
6666
            "_view_module_version": "1.2.0",
6667
            "_view_name": "StyleView",
6668
            "bar_color": null,
6669
            "description_width": ""
6670
          }
6671
        },
6672
        "22b767cd81db4953959e78d71f604dce": {
6673
          "model_module": "@jupyter-widgets/base",
6674
          "model_name": "LayoutModel",
6675
          "model_module_version": "1.2.0",
6676
          "state": {
6677
            "_model_module": "@jupyter-widgets/base",
6678
            "_model_module_version": "1.2.0",
6679
            "_model_name": "LayoutModel",
6680
            "_view_count": null,
6681
            "_view_module": "@jupyter-widgets/base",
6682
            "_view_module_version": "1.2.0",
6683
            "_view_name": "LayoutView",
6684
            "align_content": null,
6685
            "align_items": null,
6686
            "align_self": null,
6687
            "border": null,
6688
            "bottom": null,
6689
            "display": null,
6690
            "flex": null,
6691
            "flex_flow": null,
6692
            "grid_area": null,
6693
            "grid_auto_columns": null,
6694
            "grid_auto_flow": null,
6695
            "grid_auto_rows": null,
6696
            "grid_column": null,
6697
            "grid_gap": null,
6698
            "grid_row": null,
6699
            "grid_template_areas": null,
6700
            "grid_template_columns": null,
6701
            "grid_template_rows": null,
6702
            "height": null,
6703
            "justify_content": null,
6704
            "justify_items": null,
6705
            "left": null,
6706
            "margin": null,
6707
            "max_height": null,
6708
            "max_width": null,
6709
            "min_height": null,
6710
            "min_width": null,
6711
            "object_fit": null,
6712
            "object_position": null,
6713
            "order": null,
6714
            "overflow": null,
6715
            "overflow_x": null,
6716
            "overflow_y": null,
6717
            "padding": null,
6718
            "right": null,
6719
            "top": null,
6720
            "visibility": null,
6721
            "width": null
6722
          }
6723
        },
6724
        "9fb8334f33e84dc3a4bb3deaf1e7777c": {
6725
          "model_module": "@jupyter-widgets/controls",
6726
          "model_name": "DescriptionStyleModel",
6727
          "model_module_version": "1.5.0",
6728
          "state": {
6729
            "_model_module": "@jupyter-widgets/controls",
6730
            "_model_module_version": "1.5.0",
6731
            "_model_name": "DescriptionStyleModel",
6732
            "_view_count": null,
6733
            "_view_module": "@jupyter-widgets/base",
6734
            "_view_module_version": "1.2.0",
6735
            "_view_name": "StyleView",
6736
            "description_width": ""
6737
          }
6738
        },
6739
        "f6ee0db62fe14f1e86c972a4a157e315": {
6740
          "model_module": "@jupyter-widgets/controls",
6741
          "model_name": "HBoxModel",
6742
          "model_module_version": "1.5.0",
6743
          "state": {
6744
            "_dom_classes": [],
6745
            "_model_module": "@jupyter-widgets/controls",
6746
            "_model_module_version": "1.5.0",
6747
            "_model_name": "HBoxModel",
6748
            "_view_count": null,
6749
            "_view_module": "@jupyter-widgets/controls",
6750
            "_view_module_version": "1.5.0",
6751
            "_view_name": "HBoxView",
6752
            "box_style": "",
6753
            "children": [
6754
              "IPY_MODEL_f57698a07edd4a43b0b1f55e0d6b4a02",
6755
              "IPY_MODEL_9adaf92c8acf4b7ea94e5591cfe27707",
6756
              "IPY_MODEL_f1d7c8a0a78041b184d64a69f7ed0789"
6757
            ],
6758
            "layout": "IPY_MODEL_f4ca5f16039b4258b9c83768d211e757"
6759
          }
6760
        },
6761
        "f57698a07edd4a43b0b1f55e0d6b4a02": {
6762
          "model_module": "@jupyter-widgets/controls",
6763
          "model_name": "HTMLModel",
6764
          "model_module_version": "1.5.0",
6765
          "state": {
6766
            "_dom_classes": [],
6767
            "_model_module": "@jupyter-widgets/controls",
6768
            "_model_module_version": "1.5.0",
6769
            "_model_name": "HTMLModel",
6770
            "_view_count": null,
6771
            "_view_module": "@jupyter-widgets/controls",
6772
            "_view_module_version": "1.5.0",
6773
            "_view_name": "HTMLView",
6774
            "description": "",
6775
            "description_tooltip": null,
6776
            "layout": "IPY_MODEL_864288a708f545629900a29fb05f3d8b",
6777
            "placeholder": "​",
6778
            "style": "IPY_MODEL_746c0bfc3d90446ca10a16d7838441aa",
6779
            "value": "Downloading (…)/main/tokenizer.json: 100%"
6780
          }
6781
        },
6782
        "9adaf92c8acf4b7ea94e5591cfe27707": {
6783
          "model_module": "@jupyter-widgets/controls",
6784
          "model_name": "FloatProgressModel",
6785
          "model_module_version": "1.5.0",
6786
          "state": {
6787
            "_dom_classes": [],
6788
            "_model_module": "@jupyter-widgets/controls",
6789
            "_model_module_version": "1.5.0",
6790
            "_model_name": "FloatProgressModel",
6791
            "_view_count": null,
6792
            "_view_module": "@jupyter-widgets/controls",
6793
            "_view_module_version": "1.5.0",
6794
            "_view_name": "ProgressView",
6795
            "bar_style": "success",
6796
            "description": "",
6797
            "description_tooltip": null,
6798
            "layout": "IPY_MODEL_889a67c857fe40c89d0d8e523a66ae08",
6799
            "max": 2114924,
6800
            "min": 0,
6801
            "orientation": "horizontal",
6802
            "style": "IPY_MODEL_f66ce8552d5d4355b90e934a1c8c04cd",
6803
            "value": 2114924
6804
          }
6805
        },
6806
        "f1d7c8a0a78041b184d64a69f7ed0789": {
6807
          "model_module": "@jupyter-widgets/controls",
6808
          "model_name": "HTMLModel",
6809
          "model_module_version": "1.5.0",
6810
          "state": {
6811
            "_dom_classes": [],
6812
            "_model_module": "@jupyter-widgets/controls",
6813
            "_model_module_version": "1.5.0",
6814
            "_model_name": "HTMLModel",
6815
            "_view_count": null,
6816
            "_view_module": "@jupyter-widgets/controls",
6817
            "_view_module_version": "1.5.0",
6818
            "_view_name": "HTMLView",
6819
            "description": "",
6820
            "description_tooltip": null,
6821
            "layout": "IPY_MODEL_0c3a38f76e6841a38f7a0e545c9c4211",
6822
            "placeholder": "​",
6823
            "style": "IPY_MODEL_e75c5a29c59747dda108212a336c7e2c",
6824
            "value": " 2.11M/2.11M [00:00&lt;00:00, 26.6MB/s]"
6825
          }
6826
        },
6827
        "f4ca5f16039b4258b9c83768d211e757": {
6828
          "model_module": "@jupyter-widgets/base",
6829
          "model_name": "LayoutModel",
6830
          "model_module_version": "1.2.0",
6831
          "state": {
6832
            "_model_module": "@jupyter-widgets/base",
6833
            "_model_module_version": "1.2.0",
6834
            "_model_name": "LayoutModel",
6835
            "_view_count": null,
6836
            "_view_module": "@jupyter-widgets/base",
6837
            "_view_module_version": "1.2.0",
6838
            "_view_name": "LayoutView",
6839
            "align_content": null,
6840
            "align_items": null,
6841
            "align_self": null,
6842
            "border": null,
6843
            "bottom": null,
6844
            "display": null,
6845
            "flex": null,
6846
            "flex_flow": null,
6847
            "grid_area": null,
6848
            "grid_auto_columns": null,
6849
            "grid_auto_flow": null,
6850
            "grid_auto_rows": null,
6851
            "grid_column": null,
6852
            "grid_gap": null,
6853
            "grid_row": null,
6854
            "grid_template_areas": null,
6855
            "grid_template_columns": null,
6856
            "grid_template_rows": null,
6857
            "height": null,
6858
            "justify_content": null,
6859
            "justify_items": null,
6860
            "left": null,
6861
            "margin": null,
6862
            "max_height": null,
6863
            "max_width": null,
6864
            "min_height": null,
6865
            "min_width": null,
6866
            "object_fit": null,
6867
            "object_position": null,
6868
            "order": null,
6869
            "overflow": null,
6870
            "overflow_x": null,
6871
            "overflow_y": null,
6872
            "padding": null,
6873
            "right": null,
6874
            "top": null,
6875
            "visibility": null,
6876
            "width": null
6877
          }
6878
        },
6879
        "864288a708f545629900a29fb05f3d8b": {
6880
          "model_module": "@jupyter-widgets/base",
6881
          "model_name": "LayoutModel",
6882
          "model_module_version": "1.2.0",
6883
          "state": {
6884
            "_model_module": "@jupyter-widgets/base",
6885
            "_model_module_version": "1.2.0",
6886
            "_model_name": "LayoutModel",
6887
            "_view_count": null,
6888
            "_view_module": "@jupyter-widgets/base",
6889
            "_view_module_version": "1.2.0",
6890
            "_view_name": "LayoutView",
6891
            "align_content": null,
6892
            "align_items": null,
6893
            "align_self": null,
6894
            "border": null,
6895
            "bottom": null,
6896
            "display": null,
6897
            "flex": null,
6898
            "flex_flow": null,
6899
            "grid_area": null,
6900
            "grid_auto_columns": null,
6901
            "grid_auto_flow": null,
6902
            "grid_auto_rows": null,
6903
            "grid_column": null,
6904
            "grid_gap": null,
6905
            "grid_row": null,
6906
            "grid_template_areas": null,
6907
            "grid_template_columns": null,
6908
            "grid_template_rows": null,
6909
            "height": null,
6910
            "justify_content": null,
6911
            "justify_items": null,
6912
            "left": null,
6913
            "margin": null,
6914
            "max_height": null,
6915
            "max_width": null,
6916
            "min_height": null,
6917
            "min_width": null,
6918
            "object_fit": null,
6919
            "object_position": null,
6920
            "order": null,
6921
            "overflow": null,
6922
            "overflow_x": null,
6923
            "overflow_y": null,
6924
            "padding": null,
6925
            "right": null,
6926
            "top": null,
6927
            "visibility": null,
6928
            "width": null
6929
          }
6930
        },
6931
        "746c0bfc3d90446ca10a16d7838441aa": {
6932
          "model_module": "@jupyter-widgets/controls",
6933
          "model_name": "DescriptionStyleModel",
6934
          "model_module_version": "1.5.0",
6935
          "state": {
6936
            "_model_module": "@jupyter-widgets/controls",
6937
            "_model_module_version": "1.5.0",
6938
            "_model_name": "DescriptionStyleModel",
6939
            "_view_count": null,
6940
            "_view_module": "@jupyter-widgets/base",
6941
            "_view_module_version": "1.2.0",
6942
            "_view_name": "StyleView",
6943
            "description_width": ""
6944
          }
6945
        },
6946
        "889a67c857fe40c89d0d8e523a66ae08": {
6947
          "model_module": "@jupyter-widgets/base",
6948
          "model_name": "LayoutModel",
6949
          "model_module_version": "1.2.0",
6950
          "state": {
6951
            "_model_module": "@jupyter-widgets/base",
6952
            "_model_module_version": "1.2.0",
6953
            "_model_name": "LayoutModel",
6954
            "_view_count": null,
6955
            "_view_module": "@jupyter-widgets/base",
6956
            "_view_module_version": "1.2.0",
6957
            "_view_name": "LayoutView",
6958
            "align_content": null,
6959
            "align_items": null,
6960
            "align_self": null,
6961
            "border": null,
6962
            "bottom": null,
6963
            "display": null,
6964
            "flex": null,
6965
            "flex_flow": null,
6966
            "grid_area": null,
6967
            "grid_auto_columns": null,
6968
            "grid_auto_flow": null,
6969
            "grid_auto_rows": null,
6970
            "grid_column": null,
6971
            "grid_gap": null,
6972
            "grid_row": null,
6973
            "grid_template_areas": null,
6974
            "grid_template_columns": null,
6975
            "grid_template_rows": null,
6976
            "height": null,
6977
            "justify_content": null,
6978
            "justify_items": null,
6979
            "left": null,
6980
            "margin": null,
6981
            "max_height": null,
6982
            "max_width": null,
6983
            "min_height": null,
6984
            "min_width": null,
6985
            "object_fit": null,
6986
            "object_position": null,
6987
            "order": null,
6988
            "overflow": null,
6989
            "overflow_x": null,
6990
            "overflow_y": null,
6991
            "padding": null,
6992
            "right": null,
6993
            "top": null,
6994
            "visibility": null,
6995
            "width": null
6996
          }
6997
        },
6998
        "f66ce8552d5d4355b90e934a1c8c04cd": {
6999
          "model_module": "@jupyter-widgets/controls",
7000
          "model_name": "ProgressStyleModel",
7001
          "model_module_version": "1.5.0",
7002
          "state": {
7003
            "_model_module": "@jupyter-widgets/controls",
7004
            "_model_module_version": "1.5.0",
7005
            "_model_name": "ProgressStyleModel",
7006
            "_view_count": null,
7007
            "_view_module": "@jupyter-widgets/base",
7008
            "_view_module_version": "1.2.0",
7009
            "_view_name": "StyleView",
7010
            "bar_color": null,
7011
            "description_width": ""
7012
          }
7013
        },
7014
        "0c3a38f76e6841a38f7a0e545c9c4211": {
7015
          "model_module": "@jupyter-widgets/base",
7016
          "model_name": "LayoutModel",
7017
          "model_module_version": "1.2.0",
7018
          "state": {
7019
            "_model_module": "@jupyter-widgets/base",
7020
            "_model_module_version": "1.2.0",
7021
            "_model_name": "LayoutModel",
7022
            "_view_count": null,
7023
            "_view_module": "@jupyter-widgets/base",
7024
            "_view_module_version": "1.2.0",
7025
            "_view_name": "LayoutView",
7026
            "align_content": null,
7027
            "align_items": null,
7028
            "align_self": null,
7029
            "border": null,
7030
            "bottom": null,
7031
            "display": null,
7032
            "flex": null,
7033
            "flex_flow": null,
7034
            "grid_area": null,
7035
            "grid_auto_columns": null,
7036
            "grid_auto_flow": null,
7037
            "grid_auto_rows": null,
7038
            "grid_column": null,
7039
            "grid_gap": null,
7040
            "grid_row": null,
7041
            "grid_template_areas": null,
7042
            "grid_template_columns": null,
7043
            "grid_template_rows": null,
7044
            "height": null,
7045
            "justify_content": null,
7046
            "justify_items": null,
7047
            "left": null,
7048
            "margin": null,
7049
            "max_height": null,
7050
            "max_width": null,
7051
            "min_height": null,
7052
            "min_width": null,
7053
            "object_fit": null,
7054
            "object_position": null,
7055
            "order": null,
7056
            "overflow": null,
7057
            "overflow_x": null,
7058
            "overflow_y": null,
7059
            "padding": null,
7060
            "right": null,
7061
            "top": null,
7062
            "visibility": null,
7063
            "width": null
7064
          }
7065
        },
7066
        "e75c5a29c59747dda108212a336c7e2c": {
7067
          "model_module": "@jupyter-widgets/controls",
7068
          "model_name": "DescriptionStyleModel",
7069
          "model_module_version": "1.5.0",
7070
          "state": {
7071
            "_model_module": "@jupyter-widgets/controls",
7072
            "_model_module_version": "1.5.0",
7073
            "_model_name": "DescriptionStyleModel",
7074
            "_view_count": null,
7075
            "_view_module": "@jupyter-widgets/base",
7076
            "_view_module_version": "1.2.0",
7077
            "_view_name": "StyleView",
7078
            "description_width": ""
7079
          }
7080
        },
7081
        "ce6b953129c945c7a7066d0f07385c92": {
7082
          "model_module": "@jupyter-widgets/controls",
7083
          "model_name": "HBoxModel",
7084
          "model_module_version": "1.5.0",
7085
          "state": {
7086
            "_dom_classes": [],
7087
            "_model_module": "@jupyter-widgets/controls",
7088
            "_model_module_version": "1.5.0",
7089
            "_model_name": "HBoxModel",
7090
            "_view_count": null,
7091
            "_view_module": "@jupyter-widgets/controls",
7092
            "_view_module_version": "1.5.0",
7093
            "_view_name": "HBoxView",
7094
            "box_style": "",
7095
            "children": [
7096
              "IPY_MODEL_6c5a70913c6542be93085a3eefb2b1ce",
7097
              "IPY_MODEL_bd5a93537e9d49ec86233397c0ec2a6f",
7098
              "IPY_MODEL_36fad39ecf0347079291103b73c3f6dd"
7099
            ],
7100
            "layout": "IPY_MODEL_14f4fc13863648599cef5b830ab1bd9f"
7101
          }
7102
        },
7103
        "6c5a70913c6542be93085a3eefb2b1ce": {
7104
          "model_module": "@jupyter-widgets/controls",
7105
          "model_name": "HTMLModel",
7106
          "model_module_version": "1.5.0",
7107
          "state": {
7108
            "_dom_classes": [],
7109
            "_model_module": "@jupyter-widgets/controls",
7110
            "_model_module_version": "1.5.0",
7111
            "_model_name": "HTMLModel",
7112
            "_view_count": null,
7113
            "_view_module": "@jupyter-widgets/controls",
7114
            "_view_module_version": "1.5.0",
7115
            "_view_name": "HTMLView",
7116
            "description": "",
7117
            "description_tooltip": null,
7118
            "layout": "IPY_MODEL_4212106d48a34279a45890b62879ec87",
7119
            "placeholder": "​",
7120
            "style": "IPY_MODEL_2bee159b595643619607aa10b45c186f",
7121
            "value": "Downloading (…)in/added_tokens.json: 100%"
7122
          }
7123
        },
7124
        "bd5a93537e9d49ec86233397c0ec2a6f": {
7125
          "model_module": "@jupyter-widgets/controls",
7126
          "model_name": "FloatProgressModel",
7127
          "model_module_version": "1.5.0",
7128
          "state": {
7129
            "_dom_classes": [],
7130
            "_model_module": "@jupyter-widgets/controls",
7131
            "_model_module_version": "1.5.0",
7132
            "_model_name": "FloatProgressModel",
7133
            "_view_count": null,
7134
            "_view_module": "@jupyter-widgets/controls",
7135
            "_view_module_version": "1.5.0",
7136
            "_view_name": "ProgressView",
7137
            "bar_style": "success",
7138
            "description": "",
7139
            "description_tooltip": null,
7140
            "layout": "IPY_MODEL_c2502539d4eb413da194fae615d6e6bf",
7141
            "max": 1080,
7142
            "min": 0,
7143
            "orientation": "horizontal",
7144
            "style": "IPY_MODEL_95ab78e1349d466d90df3390c0a6ceff",
7145
            "value": 1080
7146
          }
7147
        },
7148
        "36fad39ecf0347079291103b73c3f6dd": {
7149
          "model_module": "@jupyter-widgets/controls",
7150
          "model_name": "HTMLModel",
7151
          "model_module_version": "1.5.0",
7152
          "state": {
7153
            "_dom_classes": [],
7154
            "_model_module": "@jupyter-widgets/controls",
7155
            "_model_module_version": "1.5.0",
7156
            "_model_name": "HTMLModel",
7157
            "_view_count": null,
7158
            "_view_module": "@jupyter-widgets/controls",
7159
            "_view_module_version": "1.5.0",
7160
            "_view_name": "HTMLView",
7161
            "description": "",
7162
            "description_tooltip": null,
7163
            "layout": "IPY_MODEL_9ca4b24b9dbb4b5a9af5897c46069c49",
7164
            "placeholder": "​",
7165
            "style": "IPY_MODEL_5e5449f0eda34f29903b59ca07ac189f",
7166
            "value": " 1.08k/1.08k [00:00&lt;00:00, 72.4kB/s]"
7167
          }
7168
        },
7169
        "14f4fc13863648599cef5b830ab1bd9f": {
7170
          "model_module": "@jupyter-widgets/base",
7171
          "model_name": "LayoutModel",
7172
          "model_module_version": "1.2.0",
7173
          "state": {
7174
            "_model_module": "@jupyter-widgets/base",
7175
            "_model_module_version": "1.2.0",
7176
            "_model_name": "LayoutModel",
7177
            "_view_count": null,
7178
            "_view_module": "@jupyter-widgets/base",
7179
            "_view_module_version": "1.2.0",
7180
            "_view_name": "LayoutView",
7181
            "align_content": null,
7182
            "align_items": null,
7183
            "align_self": null,
7184
            "border": null,
7185
            "bottom": null,
7186
            "display": null,
7187
            "flex": null,
7188
            "flex_flow": null,
7189
            "grid_area": null,
7190
            "grid_auto_columns": null,
7191
            "grid_auto_flow": null,
7192
            "grid_auto_rows": null,
7193
            "grid_column": null,
7194
            "grid_gap": null,
7195
            "grid_row": null,
7196
            "grid_template_areas": null,
7197
            "grid_template_columns": null,
7198
            "grid_template_rows": null,
7199
            "height": null,
7200
            "justify_content": null,
7201
            "justify_items": null,
7202
            "left": null,
7203
            "margin": null,
7204
            "max_height": null,
7205
            "max_width": null,
7206
            "min_height": null,
7207
            "min_width": null,
7208
            "object_fit": null,
7209
            "object_position": null,
7210
            "order": null,
7211
            "overflow": null,
7212
            "overflow_x": null,
7213
            "overflow_y": null,
7214
            "padding": null,
7215
            "right": null,
7216
            "top": null,
7217
            "visibility": null,
7218
            "width": null
7219
          }
7220
        },
7221
        "4212106d48a34279a45890b62879ec87": {
7222
          "model_module": "@jupyter-widgets/base",
7223
          "model_name": "LayoutModel",
7224
          "model_module_version": "1.2.0",
7225
          "state": {
7226
            "_model_module": "@jupyter-widgets/base",
7227
            "_model_module_version": "1.2.0",
7228
            "_model_name": "LayoutModel",
7229
            "_view_count": null,
7230
            "_view_module": "@jupyter-widgets/base",
7231
            "_view_module_version": "1.2.0",
7232
            "_view_name": "LayoutView",
7233
            "align_content": null,
7234
            "align_items": null,
7235
            "align_self": null,
7236
            "border": null,
7237
            "bottom": null,
7238
            "display": null,
7239
            "flex": null,
7240
            "flex_flow": null,
7241
            "grid_area": null,
7242
            "grid_auto_columns": null,
7243
            "grid_auto_flow": null,
7244
            "grid_auto_rows": null,
7245
            "grid_column": null,
7246
            "grid_gap": null,
7247
            "grid_row": null,
7248
            "grid_template_areas": null,
7249
            "grid_template_columns": null,
7250
            "grid_template_rows": null,
7251
            "height": null,
7252
            "justify_content": null,
7253
            "justify_items": null,
7254
            "left": null,
7255
            "margin": null,
7256
            "max_height": null,
7257
            "max_width": null,
7258
            "min_height": null,
7259
            "min_width": null,
7260
            "object_fit": null,
7261
            "object_position": null,
7262
            "order": null,
7263
            "overflow": null,
7264
            "overflow_x": null,
7265
            "overflow_y": null,
7266
            "padding": null,
7267
            "right": null,
7268
            "top": null,
7269
            "visibility": null,
7270
            "width": null
7271
          }
7272
        },
7273
        "2bee159b595643619607aa10b45c186f": {
7274
          "model_module": "@jupyter-widgets/controls",
7275
          "model_name": "DescriptionStyleModel",
7276
          "model_module_version": "1.5.0",
7277
          "state": {
7278
            "_model_module": "@jupyter-widgets/controls",
7279
            "_model_module_version": "1.5.0",
7280
            "_model_name": "DescriptionStyleModel",
7281
            "_view_count": null,
7282
            "_view_module": "@jupyter-widgets/base",
7283
            "_view_module_version": "1.2.0",
7284
            "_view_name": "StyleView",
7285
            "description_width": ""
7286
          }
7287
        },
7288
        "c2502539d4eb413da194fae615d6e6bf": {
7289
          "model_module": "@jupyter-widgets/base",
7290
          "model_name": "LayoutModel",
7291
          "model_module_version": "1.2.0",
7292
          "state": {
7293
            "_model_module": "@jupyter-widgets/base",
7294
            "_model_module_version": "1.2.0",
7295
            "_model_name": "LayoutModel",
7296
            "_view_count": null,
7297
            "_view_module": "@jupyter-widgets/base",
7298
            "_view_module_version": "1.2.0",
7299
            "_view_name": "LayoutView",
7300
            "align_content": null,
7301
            "align_items": null,
7302
            "align_self": null,
7303
            "border": null,
7304
            "bottom": null,
7305
            "display": null,
7306
            "flex": null,
7307
            "flex_flow": null,
7308
            "grid_area": null,
7309
            "grid_auto_columns": null,
7310
            "grid_auto_flow": null,
7311
            "grid_auto_rows": null,
7312
            "grid_column": null,
7313
            "grid_gap": null,
7314
            "grid_row": null,
7315
            "grid_template_areas": null,
7316
            "grid_template_columns": null,
7317
            "grid_template_rows": null,
7318
            "height": null,
7319
            "justify_content": null,
7320
            "justify_items": null,
7321
            "left": null,
7322
            "margin": null,
7323
            "max_height": null,
7324
            "max_width": null,
7325
            "min_height": null,
7326
            "min_width": null,
7327
            "object_fit": null,
7328
            "object_position": null,
7329
            "order": null,
7330
            "overflow": null,
7331
            "overflow_x": null,
7332
            "overflow_y": null,
7333
            "padding": null,
7334
            "right": null,
7335
            "top": null,
7336
            "visibility": null,
7337
            "width": null
7338
          }
7339
        },
7340
        "95ab78e1349d466d90df3390c0a6ceff": {
7341
          "model_module": "@jupyter-widgets/controls",
7342
          "model_name": "ProgressStyleModel",
7343
          "model_module_version": "1.5.0",
7344
          "state": {
7345
            "_model_module": "@jupyter-widgets/controls",
7346
            "_model_module_version": "1.5.0",
7347
            "_model_name": "ProgressStyleModel",
7348
            "_view_count": null,
7349
            "_view_module": "@jupyter-widgets/base",
7350
            "_view_module_version": "1.2.0",
7351
            "_view_name": "StyleView",
7352
            "bar_color": null,
7353
            "description_width": ""
7354
          }
7355
        },
7356
        "9ca4b24b9dbb4b5a9af5897c46069c49": {
7357
          "model_module": "@jupyter-widgets/base",
7358
          "model_name": "LayoutModel",
7359
          "model_module_version": "1.2.0",
7360
          "state": {
7361
            "_model_module": "@jupyter-widgets/base",
7362
            "_model_module_version": "1.2.0",
7363
            "_model_name": "LayoutModel",
7364
            "_view_count": null,
7365
            "_view_module": "@jupyter-widgets/base",
7366
            "_view_module_version": "1.2.0",
7367
            "_view_name": "LayoutView",
7368
            "align_content": null,
7369
            "align_items": null,
7370
            "align_self": null,
7371
            "border": null,
7372
            "bottom": null,
7373
            "display": null,
7374
            "flex": null,
7375
            "flex_flow": null,
7376
            "grid_area": null,
7377
            "grid_auto_columns": null,
7378
            "grid_auto_flow": null,
7379
            "grid_auto_rows": null,
7380
            "grid_column": null,
7381
            "grid_gap": null,
7382
            "grid_row": null,
7383
            "grid_template_areas": null,
7384
            "grid_template_columns": null,
7385
            "grid_template_rows": null,
7386
            "height": null,
7387
            "justify_content": null,
7388
            "justify_items": null,
7389
            "left": null,
7390
            "margin": null,
7391
            "max_height": null,
7392
            "max_width": null,
7393
            "min_height": null,
7394
            "min_width": null,
7395
            "object_fit": null,
7396
            "object_position": null,
7397
            "order": null,
7398
            "overflow": null,
7399
            "overflow_x": null,
7400
            "overflow_y": null,
7401
            "padding": null,
7402
            "right": null,
7403
            "top": null,
7404
            "visibility": null,
7405
            "width": null
7406
          }
7407
        },
7408
        "5e5449f0eda34f29903b59ca07ac189f": {
7409
          "model_module": "@jupyter-widgets/controls",
7410
          "model_name": "DescriptionStyleModel",
7411
          "model_module_version": "1.5.0",
7412
          "state": {
7413
            "_model_module": "@jupyter-widgets/controls",
7414
            "_model_module_version": "1.5.0",
7415
            "_model_name": "DescriptionStyleModel",
7416
            "_view_count": null,
7417
            "_view_module": "@jupyter-widgets/base",
7418
            "_view_module_version": "1.2.0",
7419
            "_view_name": "StyleView",
7420
            "description_width": ""
7421
          }
7422
        },
7423
        "cae6be4ca33c48acb53cfcad9cbad985": {
7424
          "model_module": "@jupyter-widgets/controls",
7425
          "model_name": "HBoxModel",
7426
          "model_module_version": "1.5.0",
7427
          "state": {
7428
            "_dom_classes": [],
7429
            "_model_module": "@jupyter-widgets/controls",
7430
            "_model_module_version": "1.5.0",
7431
            "_model_name": "HBoxModel",
7432
            "_view_count": null,
7433
            "_view_module": "@jupyter-widgets/controls",
7434
            "_view_module_version": "1.5.0",
7435
            "_view_name": "HBoxView",
7436
            "box_style": "",
7437
            "children": [
7438
              "IPY_MODEL_985bd9a745764ceab05a8e665eefe591",
7439
              "IPY_MODEL_548672800a5b4e5ca72df6d63e01f9d3",
7440
              "IPY_MODEL_62b898efd2ed4810bc8bc7de4e7feebf"
7441
            ],
7442
            "layout": "IPY_MODEL_8de7a61d323e4914901a7cf62a916a07"
7443
          }
7444
        },
7445
        "985bd9a745764ceab05a8e665eefe591": {
7446
          "model_module": "@jupyter-widgets/controls",
7447
          "model_name": "HTMLModel",
7448
          "model_module_version": "1.5.0",
7449
          "state": {
7450
            "_dom_classes": [],
7451
            "_model_module": "@jupyter-widgets/controls",
7452
            "_model_module_version": "1.5.0",
7453
            "_model_name": "HTMLModel",
7454
            "_view_count": null,
7455
            "_view_module": "@jupyter-widgets/controls",
7456
            "_view_module_version": "1.5.0",
7457
            "_view_name": "HTMLView",
7458
            "description": "",
7459
            "description_tooltip": null,
7460
            "layout": "IPY_MODEL_9ee95e5cee6d444588116346f6acedf2",
7461
            "placeholder": "​",
7462
            "style": "IPY_MODEL_9baed57a94ed47e493fa23eb65c2526b",
7463
            "value": "Downloading (…)cial_tokens_map.json: 100%"
7464
          }
7465
        },
7466
        "548672800a5b4e5ca72df6d63e01f9d3": {
7467
          "model_module": "@jupyter-widgets/controls",
7468
          "model_name": "FloatProgressModel",
7469
          "model_module_version": "1.5.0",
7470
          "state": {
7471
            "_dom_classes": [],
7472
            "_model_module": "@jupyter-widgets/controls",
7473
            "_model_module_version": "1.5.0",
7474
            "_model_name": "FloatProgressModel",
7475
            "_view_count": null,
7476
            "_view_module": "@jupyter-widgets/controls",
7477
            "_view_module_version": "1.5.0",
7478
            "_view_name": "ProgressView",
7479
            "bar_style": "success",
7480
            "description": "",
7481
            "description_tooltip": null,
7482
            "layout": "IPY_MODEL_1f3a418ebb47456ea041d7b5b3cf85d5",
7483
            "max": 99,
7484
            "min": 0,
7485
            "orientation": "horizontal",
7486
            "style": "IPY_MODEL_fc0ff589460d47e5b97f745b748dd136",
7487
            "value": 99
7488
          }
7489
        },
7490
        "62b898efd2ed4810bc8bc7de4e7feebf": {
7491
          "model_module": "@jupyter-widgets/controls",
7492
          "model_name": "HTMLModel",
7493
          "model_module_version": "1.5.0",
7494
          "state": {
7495
            "_dom_classes": [],
7496
            "_model_module": "@jupyter-widgets/controls",
7497
            "_model_module_version": "1.5.0",
7498
            "_model_name": "HTMLModel",
7499
            "_view_count": null,
7500
            "_view_module": "@jupyter-widgets/controls",
7501
            "_view_module_version": "1.5.0",
7502
            "_view_name": "HTMLView",
7503
            "description": "",
7504
            "description_tooltip": null,
7505
            "layout": "IPY_MODEL_b55ef28dff8b4b14b5b2cbf0438f8e44",
7506
            "placeholder": "​",
7507
            "style": "IPY_MODEL_8be7a69bd51b448da2111a21822b7482",
7508
            "value": " 99.0/99.0 [00:00&lt;00:00, 7.34kB/s]"
7509
          }
7510
        },
7511
        "8de7a61d323e4914901a7cf62a916a07": {
7512
          "model_module": "@jupyter-widgets/base",
7513
          "model_name": "LayoutModel",
7514
          "model_module_version": "1.2.0",
7515
          "state": {
7516
            "_model_module": "@jupyter-widgets/base",
7517
            "_model_module_version": "1.2.0",
7518
            "_model_name": "LayoutModel",
7519
            "_view_count": null,
7520
            "_view_module": "@jupyter-widgets/base",
7521
            "_view_module_version": "1.2.0",
7522
            "_view_name": "LayoutView",
7523
            "align_content": null,
7524
            "align_items": null,
7525
            "align_self": null,
7526
            "border": null,
7527
            "bottom": null,
7528
            "display": null,
7529
            "flex": null,
7530
            "flex_flow": null,
7531
            "grid_area": null,
7532
            "grid_auto_columns": null,
7533
            "grid_auto_flow": null,
7534
            "grid_auto_rows": null,
7535
            "grid_column": null,
7536
            "grid_gap": null,
7537
            "grid_row": null,
7538
            "grid_template_areas": null,
7539
            "grid_template_columns": null,
7540
            "grid_template_rows": null,
7541
            "height": null,
7542
            "justify_content": null,
7543
            "justify_items": null,
7544
            "left": null,
7545
            "margin": null,
7546
            "max_height": null,
7547
            "max_width": null,
7548
            "min_height": null,
7549
            "min_width": null,
7550
            "object_fit": null,
7551
            "object_position": null,
7552
            "order": null,
7553
            "overflow": null,
7554
            "overflow_x": null,
7555
            "overflow_y": null,
7556
            "padding": null,
7557
            "right": null,
7558
            "top": null,
7559
            "visibility": null,
7560
            "width": null
7561
          }
7562
        },
7563
        "9ee95e5cee6d444588116346f6acedf2": {
7564
          "model_module": "@jupyter-widgets/base",
7565
          "model_name": "LayoutModel",
7566
          "model_module_version": "1.2.0",
7567
          "state": {
7568
            "_model_module": "@jupyter-widgets/base",
7569
            "_model_module_version": "1.2.0",
7570
            "_model_name": "LayoutModel",
7571
            "_view_count": null,
7572
            "_view_module": "@jupyter-widgets/base",
7573
            "_view_module_version": "1.2.0",
7574
            "_view_name": "LayoutView",
7575
            "align_content": null,
7576
            "align_items": null,
7577
            "align_self": null,
7578
            "border": null,
7579
            "bottom": null,
7580
            "display": null,
7581
            "flex": null,
7582
            "flex_flow": null,
7583
            "grid_area": null,
7584
            "grid_auto_columns": null,
7585
            "grid_auto_flow": null,
7586
            "grid_auto_rows": null,
7587
            "grid_column": null,
7588
            "grid_gap": null,
7589
            "grid_row": null,
7590
            "grid_template_areas": null,
7591
            "grid_template_columns": null,
7592
            "grid_template_rows": null,
7593
            "height": null,
7594
            "justify_content": null,
7595
            "justify_items": null,
7596
            "left": null,
7597
            "margin": null,
7598
            "max_height": null,
7599
            "max_width": null,
7600
            "min_height": null,
7601
            "min_width": null,
7602
            "object_fit": null,
7603
            "object_position": null,
7604
            "order": null,
7605
            "overflow": null,
7606
            "overflow_x": null,
7607
            "overflow_y": null,
7608
            "padding": null,
7609
            "right": null,
7610
            "top": null,
7611
            "visibility": null,
7612
            "width": null
7613
          }
7614
        },
7615
        "9baed57a94ed47e493fa23eb65c2526b": {
7616
          "model_module": "@jupyter-widgets/controls",
7617
          "model_name": "DescriptionStyleModel",
7618
          "model_module_version": "1.5.0",
7619
          "state": {
7620
            "_model_module": "@jupyter-widgets/controls",
7621
            "_model_module_version": "1.5.0",
7622
            "_model_name": "DescriptionStyleModel",
7623
            "_view_count": null,
7624
            "_view_module": "@jupyter-widgets/base",
7625
            "_view_module_version": "1.2.0",
7626
            "_view_name": "StyleView",
7627
            "description_width": ""
7628
          }
7629
        },
7630
        "1f3a418ebb47456ea041d7b5b3cf85d5": {
7631
          "model_module": "@jupyter-widgets/base",
7632
          "model_name": "LayoutModel",
7633
          "model_module_version": "1.2.0",
7634
          "state": {
7635
            "_model_module": "@jupyter-widgets/base",
7636
            "_model_module_version": "1.2.0",
7637
            "_model_name": "LayoutModel",
7638
            "_view_count": null,
7639
            "_view_module": "@jupyter-widgets/base",
7640
            "_view_module_version": "1.2.0",
7641
            "_view_name": "LayoutView",
7642
            "align_content": null,
7643
            "align_items": null,
7644
            "align_self": null,
7645
            "border": null,
7646
            "bottom": null,
7647
            "display": null,
7648
            "flex": null,
7649
            "flex_flow": null,
7650
            "grid_area": null,
7651
            "grid_auto_columns": null,
7652
            "grid_auto_flow": null,
7653
            "grid_auto_rows": null,
7654
            "grid_column": null,
7655
            "grid_gap": null,
7656
            "grid_row": null,
7657
            "grid_template_areas": null,
7658
            "grid_template_columns": null,
7659
            "grid_template_rows": null,
7660
            "height": null,
7661
            "justify_content": null,
7662
            "justify_items": null,
7663
            "left": null,
7664
            "margin": null,
7665
            "max_height": null,
7666
            "max_width": null,
7667
            "min_height": null,
7668
            "min_width": null,
7669
            "object_fit": null,
7670
            "object_position": null,
7671
            "order": null,
7672
            "overflow": null,
7673
            "overflow_x": null,
7674
            "overflow_y": null,
7675
            "padding": null,
7676
            "right": null,
7677
            "top": null,
7678
            "visibility": null,
7679
            "width": null
7680
          }
7681
        },
7682
        "fc0ff589460d47e5b97f745b748dd136": {
7683
          "model_module": "@jupyter-widgets/controls",
7684
          "model_name": "ProgressStyleModel",
7685
          "model_module_version": "1.5.0",
7686
          "state": {
7687
            "_model_module": "@jupyter-widgets/controls",
7688
            "_model_module_version": "1.5.0",
7689
            "_model_name": "ProgressStyleModel",
7690
            "_view_count": null,
7691
            "_view_module": "@jupyter-widgets/base",
7692
            "_view_module_version": "1.2.0",
7693
            "_view_name": "StyleView",
7694
            "bar_color": null,
7695
            "description_width": ""
7696
          }
7697
        },
7698
        "b55ef28dff8b4b14b5b2cbf0438f8e44": {
7699
          "model_module": "@jupyter-widgets/base",
7700
          "model_name": "LayoutModel",
7701
          "model_module_version": "1.2.0",
7702
          "state": {
7703
            "_model_module": "@jupyter-widgets/base",
7704
            "_model_module_version": "1.2.0",
7705
            "_model_name": "LayoutModel",
7706
            "_view_count": null,
7707
            "_view_module": "@jupyter-widgets/base",
7708
            "_view_module_version": "1.2.0",
7709
            "_view_name": "LayoutView",
7710
            "align_content": null,
7711
            "align_items": null,
7712
            "align_self": null,
7713
            "border": null,
7714
            "bottom": null,
7715
            "display": null,
7716
            "flex": null,
7717
            "flex_flow": null,
7718
            "grid_area": null,
7719
            "grid_auto_columns": null,
7720
            "grid_auto_flow": null,
7721
            "grid_auto_rows": null,
7722
            "grid_column": null,
7723
            "grid_gap": null,
7724
            "grid_row": null,
7725
            "grid_template_areas": null,
7726
            "grid_template_columns": null,
7727
            "grid_template_rows": null,
7728
            "height": null,
7729
            "justify_content": null,
7730
            "justify_items": null,
7731
            "left": null,
7732
            "margin": null,
7733
            "max_height": null,
7734
            "max_width": null,
7735
            "min_height": null,
7736
            "min_width": null,
7737
            "object_fit": null,
7738
            "object_position": null,
7739
            "order": null,
7740
            "overflow": null,
7741
            "overflow_x": null,
7742
            "overflow_y": null,
7743
            "padding": null,
7744
            "right": null,
7745
            "top": null,
7746
            "visibility": null,
7747
            "width": null
7748
          }
7749
        },
7750
        "8be7a69bd51b448da2111a21822b7482": {
7751
          "model_module": "@jupyter-widgets/controls",
7752
          "model_name": "DescriptionStyleModel",
7753
          "model_module_version": "1.5.0",
7754
          "state": {
7755
            "_model_module": "@jupyter-widgets/controls",
7756
            "_model_module_version": "1.5.0",
7757
            "_model_name": "DescriptionStyleModel",
7758
            "_view_count": null,
7759
            "_view_module": "@jupyter-widgets/base",
7760
            "_view_module_version": "1.2.0",
7761
            "_view_name": "StyleView",
7762
            "description_width": ""
7763
          }
7764
        },
7765
        "18d7c57661f54a2f906b86e5b92a356d": {
7766
          "model_module": "@jupyter-widgets/controls",
7767
          "model_name": "HBoxModel",
7768
          "model_module_version": "1.5.0",
7769
          "state": {
7770
            "_dom_classes": [],
7771
            "_model_module": "@jupyter-widgets/controls",
7772
            "_model_module_version": "1.5.0",
7773
            "_model_name": "HBoxModel",
7774
            "_view_count": null,
7775
            "_view_module": "@jupyter-widgets/controls",
7776
            "_view_module_version": "1.5.0",
7777
            "_view_name": "HBoxView",
7778
            "box_style": "",
7779
            "children": [
7780
              "IPY_MODEL_e132669f57024ebcadc1f0d3899fbda2",
7781
              "IPY_MODEL_f3e78fd1331b4463a243475e12bd2480",
7782
              "IPY_MODEL_386c7bc116b849aaa2bd4c8b0c27b0e9"
7783
            ],
7784
            "layout": "IPY_MODEL_4385c5f8fc5d4d179e02ebf65aae4e0f"
7785
          }
7786
        },
7787
        "e132669f57024ebcadc1f0d3899fbda2": {
7788
          "model_module": "@jupyter-widgets/controls",
7789
          "model_name": "HTMLModel",
7790
          "model_module_version": "1.5.0",
7791
          "state": {
7792
            "_dom_classes": [],
7793
            "_model_module": "@jupyter-widgets/controls",
7794
            "_model_module_version": "1.5.0",
7795
            "_model_name": "HTMLModel",
7796
            "_view_count": null,
7797
            "_view_module": "@jupyter-widgets/controls",
7798
            "_view_module_version": "1.5.0",
7799
            "_view_name": "HTMLView",
7800
            "description": "",
7801
            "description_tooltip": null,
7802
            "layout": "IPY_MODEL_59032aea122142da8744876e7d561bca",
7803
            "placeholder": "​",
7804
            "style": "IPY_MODEL_b7bf29e09c554482823942f17fb09217",
7805
            "value": "Downloading (…)/adapter_config.json: 100%"
7806
          }
7807
        },
7808
        "f3e78fd1331b4463a243475e12bd2480": {
7809
          "model_module": "@jupyter-widgets/controls",
7810
          "model_name": "FloatProgressModel",
7811
          "model_module_version": "1.5.0",
7812
          "state": {
7813
            "_dom_classes": [],
7814
            "_model_module": "@jupyter-widgets/controls",
7815
            "_model_module_version": "1.5.0",
7816
            "_model_name": "FloatProgressModel",
7817
            "_view_count": null,
7818
            "_view_module": "@jupyter-widgets/controls",
7819
            "_view_module_version": "1.5.0",
7820
            "_view_name": "ProgressView",
7821
            "bar_style": "success",
7822
            "description": "",
7823
            "description_tooltip": null,
7824
            "layout": "IPY_MODEL_faf28ec7a6304a1d8e52952aff97c6b4",
7825
            "max": 440,
7826
            "min": 0,
7827
            "orientation": "horizontal",
7828
            "style": "IPY_MODEL_f5ed4018421f446da4ff34741a166d38",
7829
            "value": 440
7830
          }
7831
        },
7832
        "386c7bc116b849aaa2bd4c8b0c27b0e9": {
7833
          "model_module": "@jupyter-widgets/controls",
7834
          "model_name": "HTMLModel",
7835
          "model_module_version": "1.5.0",
7836
          "state": {
7837
            "_dom_classes": [],
7838
            "_model_module": "@jupyter-widgets/controls",
7839
            "_model_module_version": "1.5.0",
7840
            "_model_name": "HTMLModel",
7841
            "_view_count": null,
7842
            "_view_module": "@jupyter-widgets/controls",
7843
            "_view_module_version": "1.5.0",
7844
            "_view_name": "HTMLView",
7845
            "description": "",
7846
            "description_tooltip": null,
7847
            "layout": "IPY_MODEL_1919c4500c88418dad25ed0801033031",
7848
            "placeholder": "​",
7849
            "style": "IPY_MODEL_c4a29910b33d4a348ceef13239cf835e",
7850
            "value": " 440/440 [00:00&lt;00:00, 29.5kB/s]"
7851
          }
7852
        },
7853
        "4385c5f8fc5d4d179e02ebf65aae4e0f": {
7854
          "model_module": "@jupyter-widgets/base",
7855
          "model_name": "LayoutModel",
7856
          "model_module_version": "1.2.0",
7857
          "state": {
7858
            "_model_module": "@jupyter-widgets/base",
7859
            "_model_module_version": "1.2.0",
7860
            "_model_name": "LayoutModel",
7861
            "_view_count": null,
7862
            "_view_module": "@jupyter-widgets/base",
7863
            "_view_module_version": "1.2.0",
7864
            "_view_name": "LayoutView",
7865
            "align_content": null,
7866
            "align_items": null,
7867
            "align_self": null,
7868
            "border": null,
7869
            "bottom": null,
7870
            "display": null,
7871
            "flex": null,
7872
            "flex_flow": null,
7873
            "grid_area": null,
7874
            "grid_auto_columns": null,
7875
            "grid_auto_flow": null,
7876
            "grid_auto_rows": null,
7877
            "grid_column": null,
7878
            "grid_gap": null,
7879
            "grid_row": null,
7880
            "grid_template_areas": null,
7881
            "grid_template_columns": null,
7882
            "grid_template_rows": null,
7883
            "height": null,
7884
            "justify_content": null,
7885
            "justify_items": null,
7886
            "left": null,
7887
            "margin": null,
7888
            "max_height": null,
7889
            "max_width": null,
7890
            "min_height": null,
7891
            "min_width": null,
7892
            "object_fit": null,
7893
            "object_position": null,
7894
            "order": null,
7895
            "overflow": null,
7896
            "overflow_x": null,
7897
            "overflow_y": null,
7898
            "padding": null,
7899
            "right": null,
7900
            "top": null,
7901
            "visibility": null,
7902
            "width": null
7903
          }
7904
        },
7905
        "59032aea122142da8744876e7d561bca": {
7906
          "model_module": "@jupyter-widgets/base",
7907
          "model_name": "LayoutModel",
7908
          "model_module_version": "1.2.0",
7909
          "state": {
7910
            "_model_module": "@jupyter-widgets/base",
7911
            "_model_module_version": "1.2.0",
7912
            "_model_name": "LayoutModel",
7913
            "_view_count": null,
7914
            "_view_module": "@jupyter-widgets/base",
7915
            "_view_module_version": "1.2.0",
7916
            "_view_name": "LayoutView",
7917
            "align_content": null,
7918
            "align_items": null,
7919
            "align_self": null,
7920
            "border": null,
7921
            "bottom": null,
7922
            "display": null,
7923
            "flex": null,
7924
            "flex_flow": null,
7925
            "grid_area": null,
7926
            "grid_auto_columns": null,
7927
            "grid_auto_flow": null,
7928
            "grid_auto_rows": null,
7929
            "grid_column": null,
7930
            "grid_gap": null,
7931
            "grid_row": null,
7932
            "grid_template_areas": null,
7933
            "grid_template_columns": null,
7934
            "grid_template_rows": null,
7935
            "height": null,
7936
            "justify_content": null,
7937
            "justify_items": null,
7938
            "left": null,
7939
            "margin": null,
7940
            "max_height": null,
7941
            "max_width": null,
7942
            "min_height": null,
7943
            "min_width": null,
7944
            "object_fit": null,
7945
            "object_position": null,
7946
            "order": null,
7947
            "overflow": null,
7948
            "overflow_x": null,
7949
            "overflow_y": null,
7950
            "padding": null,
7951
            "right": null,
7952
            "top": null,
7953
            "visibility": null,
7954
            "width": null
7955
          }
7956
        },
7957
        "b7bf29e09c554482823942f17fb09217": {
7958
          "model_module": "@jupyter-widgets/controls",
7959
          "model_name": "DescriptionStyleModel",
7960
          "model_module_version": "1.5.0",
7961
          "state": {
7962
            "_model_module": "@jupyter-widgets/controls",
7963
            "_model_module_version": "1.5.0",
7964
            "_model_name": "DescriptionStyleModel",
7965
            "_view_count": null,
7966
            "_view_module": "@jupyter-widgets/base",
7967
            "_view_module_version": "1.2.0",
7968
            "_view_name": "StyleView",
7969
            "description_width": ""
7970
          }
7971
        },
7972
        "faf28ec7a6304a1d8e52952aff97c6b4": {
7973
          "model_module": "@jupyter-widgets/base",
7974
          "model_name": "LayoutModel",
7975
          "model_module_version": "1.2.0",
7976
          "state": {
7977
            "_model_module": "@jupyter-widgets/base",
7978
            "_model_module_version": "1.2.0",
7979
            "_model_name": "LayoutModel",
7980
            "_view_count": null,
7981
            "_view_module": "@jupyter-widgets/base",
7982
            "_view_module_version": "1.2.0",
7983
            "_view_name": "LayoutView",
7984
            "align_content": null,
7985
            "align_items": null,
7986
            "align_self": null,
7987
            "border": null,
7988
            "bottom": null,
7989
            "display": null,
7990
            "flex": null,
7991
            "flex_flow": null,
7992
            "grid_area": null,
7993
            "grid_auto_columns": null,
7994
            "grid_auto_flow": null,
7995
            "grid_auto_rows": null,
7996
            "grid_column": null,
7997
            "grid_gap": null,
7998
            "grid_row": null,
7999
            "grid_template_areas": null,
8000
            "grid_template_columns": null,
8001
            "grid_template_rows": null,
8002
            "height": null,
8003
            "justify_content": null,
8004
            "justify_items": null,
8005
            "left": null,
8006
            "margin": null,
8007
            "max_height": null,
8008
            "max_width": null,
8009
            "min_height": null,
8010
            "min_width": null,
8011
            "object_fit": null,
8012
            "object_position": null,
8013
            "order": null,
8014
            "overflow": null,
8015
            "overflow_x": null,
8016
            "overflow_y": null,
8017
            "padding": null,
8018
            "right": null,
8019
            "top": null,
8020
            "visibility": null,
8021
            "width": null
8022
          }
8023
        },
8024
        "f5ed4018421f446da4ff34741a166d38": {
8025
          "model_module": "@jupyter-widgets/controls",
8026
          "model_name": "ProgressStyleModel",
8027
          "model_module_version": "1.5.0",
8028
          "state": {
8029
            "_model_module": "@jupyter-widgets/controls",
8030
            "_model_module_version": "1.5.0",
8031
            "_model_name": "ProgressStyleModel",
8032
            "_view_count": null,
8033
            "_view_module": "@jupyter-widgets/base",
8034
            "_view_module_version": "1.2.0",
8035
            "_view_name": "StyleView",
8036
            "bar_color": null,
8037
            "description_width": ""
8038
          }
8039
        },
8040
        "1919c4500c88418dad25ed0801033031": {
8041
          "model_module": "@jupyter-widgets/base",
8042
          "model_name": "LayoutModel",
8043
          "model_module_version": "1.2.0",
8044
          "state": {
8045
            "_model_module": "@jupyter-widgets/base",
8046
            "_model_module_version": "1.2.0",
8047
            "_model_name": "LayoutModel",
8048
            "_view_count": null,
8049
            "_view_module": "@jupyter-widgets/base",
8050
            "_view_module_version": "1.2.0",
8051
            "_view_name": "LayoutView",
8052
            "align_content": null,
8053
            "align_items": null,
8054
            "align_self": null,
8055
            "border": null,
8056
            "bottom": null,
8057
            "display": null,
8058
            "flex": null,
8059
            "flex_flow": null,
8060
            "grid_area": null,
8061
            "grid_auto_columns": null,
8062
            "grid_auto_flow": null,
8063
            "grid_auto_rows": null,
8064
            "grid_column": null,
8065
            "grid_gap": null,
8066
            "grid_row": null,
8067
            "grid_template_areas": null,
8068
            "grid_template_columns": null,
8069
            "grid_template_rows": null,
8070
            "height": null,
8071
            "justify_content": null,
8072
            "justify_items": null,
8073
            "left": null,
8074
            "margin": null,
8075
            "max_height": null,
8076
            "max_width": null,
8077
            "min_height": null,
8078
            "min_width": null,
8079
            "object_fit": null,
8080
            "object_position": null,
8081
            "order": null,
8082
            "overflow": null,
8083
            "overflow_x": null,
8084
            "overflow_y": null,
8085
            "padding": null,
8086
            "right": null,
8087
            "top": null,
8088
            "visibility": null,
8089
            "width": null
8090
          }
8091
        },
8092
        "c4a29910b33d4a348ceef13239cf835e": {
8093
          "model_module": "@jupyter-widgets/controls",
8094
          "model_name": "DescriptionStyleModel",
8095
          "model_module_version": "1.5.0",
8096
          "state": {
8097
            "_model_module": "@jupyter-widgets/controls",
8098
            "_model_module_version": "1.5.0",
8099
            "_model_name": "DescriptionStyleModel",
8100
            "_view_count": null,
8101
            "_view_module": "@jupyter-widgets/base",
8102
            "_view_module_version": "1.2.0",
8103
            "_view_name": "StyleView",
8104
            "description_width": ""
8105
          }
8106
        },
8107
        "31405710033848009cf8227a7611864f": {
8108
          "model_module": "@jupyter-widgets/controls",
8109
          "model_name": "HBoxModel",
8110
          "model_module_version": "1.5.0",
8111
          "state": {
8112
            "_dom_classes": [],
8113
            "_model_module": "@jupyter-widgets/controls",
8114
            "_model_module_version": "1.5.0",
8115
            "_model_name": "HBoxModel",
8116
            "_view_count": null,
8117
            "_view_module": "@jupyter-widgets/controls",
8118
            "_view_module_version": "1.5.0",
8119
            "_view_name": "HBoxView",
8120
            "box_style": "",
8121
            "children": [
8122
              "IPY_MODEL_cc862dc1f8884513b8eefb569ab50424",
8123
              "IPY_MODEL_3cd7c95a507d459f86b9eadd7cfdcb85",
8124
              "IPY_MODEL_683da23b78b54a8eb3c1984cd29bbeb2"
8125
            ],
8126
            "layout": "IPY_MODEL_f022a8aac72d490fb89495f01c929885"
8127
          }
8128
        },
8129
        "cc862dc1f8884513b8eefb569ab50424": {
8130
          "model_module": "@jupyter-widgets/controls",
8131
          "model_name": "HTMLModel",
8132
          "model_module_version": "1.5.0",
8133
          "state": {
8134
            "_dom_classes": [],
8135
            "_model_module": "@jupyter-widgets/controls",
8136
            "_model_module_version": "1.5.0",
8137
            "_model_name": "HTMLModel",
8138
            "_view_count": null,
8139
            "_view_module": "@jupyter-widgets/controls",
8140
            "_view_module_version": "1.5.0",
8141
            "_view_name": "HTMLView",
8142
            "description": "",
8143
            "description_tooltip": null,
8144
            "layout": "IPY_MODEL_ac31ba38940c445e9305623046dc2473",
8145
            "placeholder": "​",
8146
            "style": "IPY_MODEL_1880da50605c435da03377a6e535d3a6",
8147
            "value": "Downloading adapter_model.bin: 100%"
8148
          }
8149
        },
8150
        "3cd7c95a507d459f86b9eadd7cfdcb85": {
8151
          "model_module": "@jupyter-widgets/controls",
8152
          "model_name": "FloatProgressModel",
8153
          "model_module_version": "1.5.0",
8154
          "state": {
8155
            "_dom_classes": [],
8156
            "_model_module": "@jupyter-widgets/controls",
8157
            "_model_module_version": "1.5.0",
8158
            "_model_name": "FloatProgressModel",
8159
            "_view_count": null,
8160
            "_view_module": "@jupyter-widgets/controls",
8161
            "_view_module_version": "1.5.0",
8162
            "_view_name": "ProgressView",
8163
            "bar_style": "success",
8164
            "description": "",
8165
            "description_tooltip": null,
8166
            "layout": "IPY_MODEL_d645078ee2094f37a1bfbaa6727474bb",
8167
            "max": 18907665,
8168
            "min": 0,
8169
            "orientation": "horizontal",
8170
            "style": "IPY_MODEL_a0c4211bdd9e4857b16fbad1d7b1d3e1",
8171
            "value": 18907665
8172
          }
8173
        },
8174
        "683da23b78b54a8eb3c1984cd29bbeb2": {
8175
          "model_module": "@jupyter-widgets/controls",
8176
          "model_name": "HTMLModel",
8177
          "model_module_version": "1.5.0",
8178
          "state": {
8179
            "_dom_classes": [],
8180
            "_model_module": "@jupyter-widgets/controls",
8181
            "_model_module_version": "1.5.0",
8182
            "_model_name": "HTMLModel",
8183
            "_view_count": null,
8184
            "_view_module": "@jupyter-widgets/controls",
8185
            "_view_module_version": "1.5.0",
8186
            "_view_name": "HTMLView",
8187
            "description": "",
8188
            "description_tooltip": null,
8189
            "layout": "IPY_MODEL_3bee676ed0274dee9160f3260f253acf",
8190
            "placeholder": "​",
8191
            "style": "IPY_MODEL_93909168ffc24b5ba6c03a2a067b99c1",
8192
            "value": " 18.9M/18.9M [00:00&lt;00:00, 45.8MB/s]"
8193
          }
8194
        },
8195
        "f022a8aac72d490fb89495f01c929885": {
8196
          "model_module": "@jupyter-widgets/base",
8197
          "model_name": "LayoutModel",
8198
          "model_module_version": "1.2.0",
8199
          "state": {
8200
            "_model_module": "@jupyter-widgets/base",
8201
            "_model_module_version": "1.2.0",
8202
            "_model_name": "LayoutModel",
8203
            "_view_count": null,
8204
            "_view_module": "@jupyter-widgets/base",
8205
            "_view_module_version": "1.2.0",
8206
            "_view_name": "LayoutView",
8207
            "align_content": null,
8208
            "align_items": null,
8209
            "align_self": null,
8210
            "border": null,
8211
            "bottom": null,
8212
            "display": null,
8213
            "flex": null,
8214
            "flex_flow": null,
8215
            "grid_area": null,
8216
            "grid_auto_columns": null,
8217
            "grid_auto_flow": null,
8218
            "grid_auto_rows": null,
8219
            "grid_column": null,
8220
            "grid_gap": null,
8221
            "grid_row": null,
8222
            "grid_template_areas": null,
8223
            "grid_template_columns": null,
8224
            "grid_template_rows": null,
8225
            "height": null,
8226
            "justify_content": null,
8227
            "justify_items": null,
8228
            "left": null,
8229
            "margin": null,
8230
            "max_height": null,
8231
            "max_width": null,
8232
            "min_height": null,
8233
            "min_width": null,
8234
            "object_fit": null,
8235
            "object_position": null,
8236
            "order": null,
8237
            "overflow": null,
8238
            "overflow_x": null,
8239
            "overflow_y": null,
8240
            "padding": null,
8241
            "right": null,
8242
            "top": null,
8243
            "visibility": null,
8244
            "width": null
8245
          }
8246
        },
8247
        "ac31ba38940c445e9305623046dc2473": {
8248
          "model_module": "@jupyter-widgets/base",
8249
          "model_name": "LayoutModel",
8250
          "model_module_version": "1.2.0",
8251
          "state": {
8252
            "_model_module": "@jupyter-widgets/base",
8253
            "_model_module_version": "1.2.0",
8254
            "_model_name": "LayoutModel",
8255
            "_view_count": null,
8256
            "_view_module": "@jupyter-widgets/base",
8257
            "_view_module_version": "1.2.0",
8258
            "_view_name": "LayoutView",
8259
            "align_content": null,
8260
            "align_items": null,
8261
            "align_self": null,
8262
            "border": null,
8263
            "bottom": null,
8264
            "display": null,
8265
            "flex": null,
8266
            "flex_flow": null,
8267
            "grid_area": null,
8268
            "grid_auto_columns": null,
8269
            "grid_auto_flow": null,
8270
            "grid_auto_rows": null,
8271
            "grid_column": null,
8272
            "grid_gap": null,
8273
            "grid_row": null,
8274
            "grid_template_areas": null,
8275
            "grid_template_columns": null,
8276
            "grid_template_rows": null,
8277
            "height": null,
8278
            "justify_content": null,
8279
            "justify_items": null,
8280
            "left": null,
8281
            "margin": null,
8282
            "max_height": null,
8283
            "max_width": null,
8284
            "min_height": null,
8285
            "min_width": null,
8286
            "object_fit": null,
8287
            "object_position": null,
8288
            "order": null,
8289
            "overflow": null,
8290
            "overflow_x": null,
8291
            "overflow_y": null,
8292
            "padding": null,
8293
            "right": null,
8294
            "top": null,
8295
            "visibility": null,
8296
            "width": null
8297
          }
8298
        },
8299
        "1880da50605c435da03377a6e535d3a6": {
8300
          "model_module": "@jupyter-widgets/controls",
8301
          "model_name": "DescriptionStyleModel",
8302
          "model_module_version": "1.5.0",
8303
          "state": {
8304
            "_model_module": "@jupyter-widgets/controls",
8305
            "_model_module_version": "1.5.0",
8306
            "_model_name": "DescriptionStyleModel",
8307
            "_view_count": null,
8308
            "_view_module": "@jupyter-widgets/base",
8309
            "_view_module_version": "1.2.0",
8310
            "_view_name": "StyleView",
8311
            "description_width": ""
8312
          }
8313
        },
8314
        "d645078ee2094f37a1bfbaa6727474bb": {
8315
          "model_module": "@jupyter-widgets/base",
8316
          "model_name": "LayoutModel",
8317
          "model_module_version": "1.2.0",
8318
          "state": {
8319
            "_model_module": "@jupyter-widgets/base",
8320
            "_model_module_version": "1.2.0",
8321
            "_model_name": "LayoutModel",
8322
            "_view_count": null,
8323
            "_view_module": "@jupyter-widgets/base",
8324
            "_view_module_version": "1.2.0",
8325
            "_view_name": "LayoutView",
8326
            "align_content": null,
8327
            "align_items": null,
8328
            "align_self": null,
8329
            "border": null,
8330
            "bottom": null,
8331
            "display": null,
8332
            "flex": null,
8333
            "flex_flow": null,
8334
            "grid_area": null,
8335
            "grid_auto_columns": null,
8336
            "grid_auto_flow": null,
8337
            "grid_auto_rows": null,
8338
            "grid_column": null,
8339
            "grid_gap": null,
8340
            "grid_row": null,
8341
            "grid_template_areas": null,
8342
            "grid_template_columns": null,
8343
            "grid_template_rows": null,
8344
            "height": null,
8345
            "justify_content": null,
8346
            "justify_items": null,
8347
            "left": null,
8348
            "margin": null,
8349
            "max_height": null,
8350
            "max_width": null,
8351
            "min_height": null,
8352
            "min_width": null,
8353
            "object_fit": null,
8354
            "object_position": null,
8355
            "order": null,
8356
            "overflow": null,
8357
            "overflow_x": null,
8358
            "overflow_y": null,
8359
            "padding": null,
8360
            "right": null,
8361
            "top": null,
8362
            "visibility": null,
8363
            "width": null
8364
          }
8365
        },
8366
        "a0c4211bdd9e4857b16fbad1d7b1d3e1": {
8367
          "model_module": "@jupyter-widgets/controls",
8368
          "model_name": "ProgressStyleModel",
8369
          "model_module_version": "1.5.0",
8370
          "state": {
8371
            "_model_module": "@jupyter-widgets/controls",
8372
            "_model_module_version": "1.5.0",
8373
            "_model_name": "ProgressStyleModel",
8374
            "_view_count": null,
8375
            "_view_module": "@jupyter-widgets/base",
8376
            "_view_module_version": "1.2.0",
8377
            "_view_name": "StyleView",
8378
            "bar_color": null,
8379
            "description_width": ""
8380
          }
8381
        },
8382
        "3bee676ed0274dee9160f3260f253acf": {
8383
          "model_module": "@jupyter-widgets/base",
8384
          "model_name": "LayoutModel",
8385
          "model_module_version": "1.2.0",
8386
          "state": {
8387
            "_model_module": "@jupyter-widgets/base",
8388
            "_model_module_version": "1.2.0",
8389
            "_model_name": "LayoutModel",
8390
            "_view_count": null,
8391
            "_view_module": "@jupyter-widgets/base",
8392
            "_view_module_version": "1.2.0",
8393
            "_view_name": "LayoutView",
8394
            "align_content": null,
8395
            "align_items": null,
8396
            "align_self": null,
8397
            "border": null,
8398
            "bottom": null,
8399
            "display": null,
8400
            "flex": null,
8401
            "flex_flow": null,
8402
            "grid_area": null,
8403
            "grid_auto_columns": null,
8404
            "grid_auto_flow": null,
8405
            "grid_auto_rows": null,
8406
            "grid_column": null,
8407
            "grid_gap": null,
8408
            "grid_row": null,
8409
            "grid_template_areas": null,
8410
            "grid_template_columns": null,
8411
            "grid_template_rows": null,
8412
            "height": null,
8413
            "justify_content": null,
8414
            "justify_items": null,
8415
            "left": null,
8416
            "margin": null,
8417
            "max_height": null,
8418
            "max_width": null,
8419
            "min_height": null,
8420
            "min_width": null,
8421
            "object_fit": null,
8422
            "object_position": null,
8423
            "order": null,
8424
            "overflow": null,
8425
            "overflow_x": null,
8426
            "overflow_y": null,
8427
            "padding": null,
8428
            "right": null,
8429
            "top": null,
8430
            "visibility": null,
8431
            "width": null
8432
          }
8433
        },
8434
        "93909168ffc24b5ba6c03a2a067b99c1": {
8435
          "model_module": "@jupyter-widgets/controls",
8436
          "model_name": "DescriptionStyleModel",
8437
          "model_module_version": "1.5.0",
8438
          "state": {
8439
            "_model_module": "@jupyter-widgets/controls",
8440
            "_model_module_version": "1.5.0",
8441
            "_model_name": "DescriptionStyleModel",
8442
            "_view_count": null,
8443
            "_view_module": "@jupyter-widgets/base",
8444
            "_view_module_version": "1.2.0",
8445
            "_view_name": "StyleView",
8446
            "description_width": ""
8447
          }
8448
        }
8449
      }
8450
    }
8451
  },
8452
  "nbformat": 4,
8453
  "nbformat_minor": 0
8454
}

Использование cookies

Мы используем файлы cookie в соответствии с Политикой конфиденциальности и Политикой использования cookies.

Нажимая кнопку «Принимаю», Вы даете АО «СберТех» согласие на обработку Ваших персональных данных в целях совершенствования нашего веб-сайта и Сервиса GitVerse, а также повышения удобства их использования.

Запретить использование cookies Вы можете самостоятельно в настройках Вашего браузера.