diff --git "a/FineTuning_StableCode.ipynb" "b/FineTuning_StableCode.ipynb"
new file mode 100644--- /dev/null
+++ "b/FineTuning_StableCode.ipynb"
@@ -0,0 +1,8058 @@
+{
+ "cells": [
+ {
+ "cell_type": "code",
+ "execution_count": 1,
+ "metadata": {
+ "id": "kH18jD5cR_Ks",
+ "colab": {
+ "base_uri": "https://localhost:8080/"
+ },
+ "outputId": "bab0bba5-68fd-47d0-ea8f-d256c3d1fa15"
+ },
+ "outputs": [
+ {
+ "output_type": "stream",
+ "name": "stdout",
+ "text": [
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m44.1/44.1 kB\u001b[0m \u001b[31m2.1 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m320.7/320.7 kB\u001b[0m \u001b[31m17.4 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m122.4/122.4 MB\u001b[0m \u001b[31m7.0 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m310.9/310.9 kB\u001b[0m \u001b[31m13.0 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m10.0/10.0 MB\u001b[0m \u001b[31m53.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m480.6/480.6 kB\u001b[0m \u001b[31m24.8 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m116.3/116.3 kB\u001b[0m \u001b[31m10.4 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m134.8/134.8 kB\u001b[0m \u001b[31m8.5 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m40.0/40.0 MB\u001b[0m \u001b[31m14.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m3.0/3.0 MB\u001b[0m \u001b[31m43.1 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m194.1/194.1 kB\u001b[0m \u001b[31m12.0 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+ "\u001b[?25h\u001b[31mERROR: pip's dependency resolver does not currently take into account all the packages that are installed. This behaviour is the source of the following dependency conflicts.\n",
+ "cudf-cu12 24.4.1 requires pyarrow<15.0.0a0,>=14.0.1, but you have pyarrow 18.0.0 which is incompatible.\n",
+ "ibis-framework 8.0.0 requires pyarrow<16,>=2, but you have pyarrow 18.0.0 which is incompatible.\u001b[0m\u001b[31m\n",
+ "\u001b[0m"
+ ]
+ }
+ ],
+ "source": [
+ "# !pip install -q accelerate peft bitsandbytes transformers trl faiss-gpu langchain_community wandb flash-attn\n",
+ "!pip install -q accelerate peft bitsandbytes transformers trl datasets\n",
+ "\n",
+ "# flash-attn"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 2,
+ "metadata": {
+ "id": "cgVNTbBa-D3j"
+ },
+ "outputs": [],
+ "source": [
+ "# load the required packages.\n",
+ "import torch\n",
+ "from datasets import load_dataset, Dataset\n",
+ "from peft import LoraConfig, AutoPeftModelForCausalLM, PeftModel, get_peft_model\n",
+ "from transformers import AutoModelForCausalLM, AutoTokenizer, BitsAndBytesConfig, TrainingArguments, AutoConfig, set_seed\n",
+ "from trl import SFTTrainer\n",
+ "import bitsandbytes as bnb\n",
+ "import transformers\n",
+ "\n",
+ "import os\n",
+ "import numpy as np\n",
+ "import pandas as pd\n",
+ "import sqlparse\n",
+ "import re\n",
+ "import json\n",
+ "\n",
+ "from huggingface_hub import hf_hub_download\n",
+ "from huggingface_hub import HfFileSystem"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": null,
+ "metadata": {
+ "id": "s7RtbLxPwTx2",
+ "colab": {
+ "base_uri": "https://localhost:8080/"
+ },
+ "outputId": "43d5ff02-3e33-439c-e3a9-c18ce99d237d"
+ },
+ "outputs": [
+ {
+ "output_type": "stream",
+ "name": "stdout",
+ "text": [
+ "Mounted at /content/drive\n"
+ ]
+ }
+ ],
+ "source": [
+ "# from google.colab import drive\n",
+ "# from google.colab import userdata\n",
+ "# drive.mount('/content/drive')"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": null,
+ "metadata": {
+ "id": "basaX_55Yf_D"
+ },
+ "outputs": [],
+ "source": [
+ "#transformers.logging.set_verbosity_info()"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 3,
+ "metadata": {
+ "id": "bkkjgGdlrNcq"
+ },
+ "outputs": [],
+ "source": [
+ "WRITE_TOKEN = userdata.get('hf_write')\n",
+ "READ_TOKEN = userdata.get('hf_read')\n"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 4,
+ "metadata": {
+ "id": "7CKnwlRfZj4V"
+ },
+ "outputs": [],
+ "source": [
+ "model_name = \"stabilityai/stable-code-instruct-3b\"\n",
+ "out_name = \"lleticiasilvaa/StableCode-text2SQL-schemaReduzidoTabelas\"\n",
+ "prev_checkpoint = None # \"checkpoint-3000\""
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": null,
+ "metadata": {
+ "id": "9zs7nCmt-pMC"
+ },
+ "outputs": [],
+ "source": [
+ "#!huggingface-cli login"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 5,
+ "metadata": {
+ "id": "PZdnxs8k-Cgl"
+ },
+ "outputs": [],
+ "source": [
+ "bird_id=\"NESPED-GEN/bird\"\n",
+ "spider_id=\"NESPED-GEN/spider_selector_schemaReduzido\"\n",
+ "\n",
+ "selector_id = \"NESPED-GEN/selector_testes\""
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "metadata": {
+ "id": "xT2iRdCN_MFH"
+ },
+ "source": [
+ "### Load Data\n"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 6,
+ "metadata": {
+ "id": "lLKgY40efdJo",
+ "colab": {
+ "base_uri": "https://localhost:8080/",
+ "height": 281,
+ "referenced_widgets": [
+ "62b5a4803207499da82677b9b146b97b",
+ "1c006910a42e40728867969135b6d848",
+ "1a5af1ef864e41d99a79d5b94d982711",
+ "a84dab2f85094fb3997adb2d3c2ecd0a",
+ "bcc0fee091bb4a308e9c39e2ae091acd",
+ "349dd7e2bfd141a583b8ec25b786cae3",
+ "29717b10d1bd45cba1a785123bd2a0b4",
+ "319f0c7c10c546b3a1be237d93ebf5ae",
+ "7c0a09f10b59412ba4271ba77a1378f0",
+ "ba00c487942a4c50ad032aad072a6f7b",
+ "11d0433884ca4e46b7cb033b5e546ad4",
+ "eb2518b1c019478daec2d2c058898096",
+ "c25c3c6ca8f343c2b7519abca165c779",
+ "207cc561423a413c975d54acfdfd73a4",
+ "d86de6918ba94a159b0c48b33bc9d90c",
+ "22531ea2c5fe493ca2a87b8432424371",
+ "964dfefdf21648a6a2ab33a935efb4e7",
+ "6d9d4727e4734795a65a12306e1db3e9",
+ "cfa5cebbda604836bfb3daf1a0a9eb5b",
+ "bf0121739fac4cab8a6a56f607e99067",
+ "2cf8d94d40d14f9ab02389fe857a44e7",
+ "ca3279d8e8d14ae3958efd4990d760f5",
+ "3b861b5eb85a4eb1a5800dd33e199b88",
+ "f60ecb97d13d4056a7295306b4a726f3",
+ "7ed9c3225ff34256bb3d105a541a2dbb",
+ "8ed8b8ef97fd4b4cbb03f6954fa70367",
+ "4651ad7190a047f98bbf3817e529f9f8",
+ "22d3f097275c42869bc2bc07b70b99f4",
+ "82b145ecd4994698b56223f44c695054",
+ "ec2be65f2cdb476ea1717ef7040f839a",
+ "35c2672c5c8542dd80d92167dd9d9163",
+ "aa21408da1eb4d1bb1a2aa00eedc9412",
+ "938befa273d944d6932eafd292376a7b",
+ "d786b4589eaa4a9d8dd1a17beb71a42c",
+ "3f0ddb4d9e5346b8b6d46e3dd1f5a848",
+ "0ec766ee8a12493492e591aae846821e",
+ "ee72b1d5917e4377b4140d04b6238961",
+ "1a9cdc5f9aa84a3abe8a93d51bda8cf4",
+ "8ba0c5c19e7b40e3b1987a274f04e780",
+ "cad63d5f62d04a0987898969ec0bc4fb",
+ "30a5dcee7cc142ec8a8f6b2888853fab",
+ "69f97bec934b444993afa7056655ee4d",
+ "485a0a650475469686655c0326849223",
+ "bd7f555c54e84745b3ee0bf5d3bbe65f",
+ "5abd0ad065d74e5090902ca9420e9eda",
+ "8dd111f5c4c84ef0b1213a7cf20db429",
+ "563de63f39af4f949944c2bcc79e2f62",
+ "279032b33e64433d8c5ac7d7a1bf4b2b",
+ "a7f20c1db6014748b1c9d567b29bdb76",
+ "7f1157ebb5a04a4bb3c7b83df53fd206",
+ "1c54e6b541dc40038b3d176af7949ee2",
+ "5562393293ea45c1972f520b5740cb08",
+ "42199373c5e747b1a59973878319f8e5",
+ "48ba0bcad819498282222df452525e9e",
+ "3f2265210736450d93657b7e2a6b2785"
+ ]
+ },
+ "outputId": "57b279a5-52e6-4a12-d22a-7fe5769c1e28"
+ },
+ "outputs": [
+ {
+ "output_type": "stream",
+ "name": "stderr",
+ "text": [
+ "/usr/local/lib/python3.10/dist-packages/huggingface_hub/utils/_token.py:89: UserWarning: \n",
+ "The secret `HF_TOKEN` does not exist in your Colab secrets.\n",
+ "To authenticate with the Hugging Face Hub, create a token in your settings tab (https://huggingface.co/settings/tokens), set it as secret in your Google Colab and restart your session.\n",
+ "You will be able to reuse this secret in all of your notebooks.\n",
+ "Please note that authentication is recommended but still optional to access public models or datasets.\n",
+ " warnings.warn(\n"
+ ]
+ },
+ {
+ "output_type": "display_data",
+ "data": {
+ "text/plain": [
+ "README.md: 0%| | 0.00/885 [00:00, ?B/s]"
+ ],
+ "application/vnd.jupyter.widget-view+json": {
+ "version_major": 2,
+ "version_minor": 0,
+ "model_id": "62b5a4803207499da82677b9b146b97b"
+ }
+ },
+ "metadata": {}
+ },
+ {
+ "output_type": "display_data",
+ "data": {
+ "text/plain": [
+ "dev-00000-of-00001.parquet: 0%| | 0.00/369k [00:00, ?B/s]"
+ ],
+ "application/vnd.jupyter.widget-view+json": {
+ "version_major": 2,
+ "version_minor": 0,
+ "model_id": "eb2518b1c019478daec2d2c058898096"
+ }
+ },
+ "metadata": {}
+ },
+ {
+ "output_type": "display_data",
+ "data": {
+ "text/plain": [
+ "train-00000-of-00001.parquet: 0%| | 0.00/2.70M [00:00, ?B/s]"
+ ],
+ "application/vnd.jupyter.widget-view+json": {
+ "version_major": 2,
+ "version_minor": 0,
+ "model_id": "3b861b5eb85a4eb1a5800dd33e199b88"
+ }
+ },
+ "metadata": {}
+ },
+ {
+ "output_type": "display_data",
+ "data": {
+ "text/plain": [
+ "Generating dev split: 0%| | 0/1034 [00:00, ? examples/s]"
+ ],
+ "application/vnd.jupyter.widget-view+json": {
+ "version_major": 2,
+ "version_minor": 0,
+ "model_id": "d786b4589eaa4a9d8dd1a17beb71a42c"
+ }
+ },
+ "metadata": {}
+ },
+ {
+ "output_type": "display_data",
+ "data": {
+ "text/plain": [
+ "Generating train split: 0%| | 0/8656 [00:00, ? examples/s]"
+ ],
+ "application/vnd.jupyter.widget-view+json": {
+ "version_major": 2,
+ "version_minor": 0,
+ "model_id": "5abd0ad065d74e5090902ca9420e9eda"
+ }
+ },
+ "metadata": {}
+ }
+ ],
+ "source": [
+ "# bird = load_dataset(bird_id, split=\"train\").to_pandas()\n",
+ "spider = load_dataset(spider_id, split=\"train\").to_pandas()"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": null,
+ "metadata": {
+ "id": "D3d_091Ud0BG"
+ },
+ "outputs": [],
+ "source": [
+ "# df = pd.concat([spider, bird], axis=0)\n",
+ "# df = df.fillna('')"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": null,
+ "metadata": {
+ "id": "niRTjA1tQIWr"
+ },
+ "outputs": [],
+ "source": [
+ "# df.reset_index(drop=True, inplace=True)"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "source": [
+ "df = spider"
+ ],
+ "metadata": {
+ "id": "po1gNdLjFKdZ"
+ },
+ "execution_count": 7,
+ "outputs": []
+ },
+ {
+ "cell_type": "code",
+ "source": [
+ "#df = load_dataset(selector_id, split=\"trainSpider\").to_pandas()"
+ ],
+ "metadata": {
+ "id": "LeL7EfmQVyBt"
+ },
+ "execution_count": null,
+ "outputs": []
+ },
+ {
+ "cell_type": "markdown",
+ "metadata": {
+ "id": "ON-hPsEYM1Bu"
+ },
+ "source": [
+ "# Load Base Model"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 8,
+ "metadata": {
+ "id": "yEAZpfzlNOHW"
+ },
+ "outputs": [],
+ "source": [
+ "def download_checkpoint(adapter_model_id, checkpoint):\n",
+ " fs = HfFileSystem()\n",
+ " for file in fs.ls(f'{adapter_model_id}/{checkpoint}', detail=False):\n",
+ " file_name = file.split(checkpoint)[-1]\n",
+ "\n",
+ " hf_hub_download(repo_id=adapter_model_id, filename=(f'{checkpoint}{file_name}'), local_dir='out')\n",
+ "\n",
+ " for file in fs.ls(f'{adapter_model_id}/logs', detail=False):\n",
+ " file_name = file.split(checkpoint)[-1]\n",
+ "\n",
+ " hf_hub_download(repo_id=adapter_model_id, filename=(f'logs/{file_name.split(\"/\")[-1]}'), local_dir='out')"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "source": [
+ "# download_checkpoint(out_name, prev_checkpoint)"
+ ],
+ "metadata": {
+ "id": "enUxjGXEqHxg"
+ },
+ "execution_count": null,
+ "outputs": []
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 9,
+ "metadata": {
+ "id": "M7DoqQMlM_nW",
+ "colab": {
+ "base_uri": "https://localhost:8080/",
+ "height": 337,
+ "referenced_widgets": [
+ "cf7e01f9046d4c22962a648618ad5f7c",
+ "84c68e15eddf448198c54a22175a6d9f",
+ "ab1cd082922948358849b31b0b692fe8",
+ "5f39764fc13c4a7faf40d12323cfc576",
+ "24a43873ea4a4475aa032f163cc32822",
+ "97bb8763995744c6afc3a93010f7bf26",
+ "81b8562116614219b51c3dfa404f3684",
+ "0458f04bba74415fb420e5f4e50dd80b",
+ "71cc2397a4704f8486624917e47f8c99",
+ "0a7c233068d5420e8fbe3a7bdc749825",
+ "dcbb0e372cdd460b8284e3cce24437ef",
+ "37be9d87487f4a65bb3a553e054a9b9f",
+ "af62d0e253db43e4a5f8fc0399134e33",
+ "45e6842e357d466b88547e967afbce15",
+ "41caf3b8544243ee8080990bcc37f202",
+ "94fabb6c25b140b08dd87fec35836d17",
+ "4b615c1e58ed42238a6ebfefec23914b",
+ "af2d34bfc6994559b9c524f7963a4623",
+ "bdf850ca809641568d696016eb893909",
+ "3ee1870576a747ffa1c87688e45f3e73",
+ "c3b5bb9e533f4e39aff22756d9437f88",
+ "891d8fe057e046f18654f34fe15f097f",
+ "2c3628d3032f43f1a5698b863422be9c",
+ "14a14a1fac1544cb921ef83b10dfad26",
+ "9b726ac9cd324096a730c57a9e306db3",
+ "01059ed672f942b3a11810fd7d990853",
+ "c14ef71f64a240ca913aafc077f3f4b4",
+ "87112b2495a648ca98145db2f05fd164",
+ "0475ba7ffbe54055aecd6e0b62a41eea",
+ "c0240edf852948608aba0016c26fc1cc",
+ "332f7aafae624667896b6ae037033e65",
+ "0ba5fc5f0fed4f2a92e570763fe9514c",
+ "c571fd0656fc4a2292b0496b86f07a36",
+ "a0cb3fa115ef4c2e90618a9fd9249e9c",
+ "f293ba1eea304c43bdd509fe0cc8ec2d",
+ "584d189f4dd142a2a7c3b918b1931317",
+ "0fce315e9869484282dc65a57683326d",
+ "45c356d16449493fba9c25b6b2e1c98c",
+ "9dc83ec606f74b95b830483b7b83e6ab",
+ "d993a4247cb94b1db6df1d285566c8d2",
+ "d860e096167848d0b094c4bd0ba64736",
+ "f15be96d251b486798e6b14b40ae11ec",
+ "b6959704534e47f893acb1680f78de96",
+ "1b8b35c3d62d48c49b1bbdfe3bbece99",
+ "67185d66e50e4578bdabd94304bb673b",
+ "0c8f9ab0f09a4cb2be56c75597b38a0a",
+ "9a3828a9c40e4daba6578feb3cb0a35b",
+ "3f45fde4bd4545ffbdbd1ddbef2ce73e",
+ "4f82b90d6ca945bcb18dac112bc8db7a",
+ "12398d8c1ffb4d74bfdd994048680dd5",
+ "0b0fc0706a9a4f72a20eb8f8eade3193",
+ "740d7936fe2e4bf48d4920a5382087d7",
+ "b8776171b87e47e1a2212377ee796fdd",
+ "ce431e3b540c4b59ac4f8bcc5b7078b6",
+ "b276a81e7a2b4e668381f920c11e8dc9",
+ "1562cb138c5a413c859a701ed5b70dba",
+ "ce568bd1899d4fe7abe491fef73e65a4",
+ "161024aa2e3448e79ba1ba526d92a5ea",
+ "150d10024dea40719982531fcf59d331",
+ "1ffd6a8ce6a94bdc93a0a380facb573e",
+ "8cf991e531204a56a5af81ea2898f704",
+ "c3360cc53a6e42d9af6e2262cf86d051",
+ "c9eec2a0fc6b4edc9c19f231b055ec9b",
+ "44b44e629a0c43199ffa6eee0882c091",
+ "74ba3634127e4b9185b25e48ba7ebe3a",
+ "dbf30f5fe7214c129d324bdca133973a",
+ "0631ef1ac59a40dcb194ea0bf2ba94b6",
+ "fcfd184cac4a465cbd14acc875e0aae2",
+ "8b3ee7c84008414797145b48495f4b5a",
+ "5107bfef46f54ed497b67cd94a714487",
+ "d500ad0d5e7b40d8896ce43379326591",
+ "5ab9e4d9c0b44b8b9a840237e2c01aa3",
+ "ffbe40c06c804f18ba8c0558ff9438ba",
+ "fdbc178bbc134dbbb10a4b023db47fb5",
+ "41bd2e1851684ba0927297ee3319c50a",
+ "20f84060e82842ae96702084c1f8a82b",
+ "61a698c2dcba4f07a814ac567d4bc256",
+ "252f7db506bb41ec986f88ea4d5d4d36",
+ "87b052bf69844867919c0d1de6754046",
+ "ab236cd071364387b3ed3ea97c8e3b4d",
+ "b3a1e5e7bad542f3974e4e067ed76640",
+ "168fac509c8b4b3c9b03e7ee13f8dd52",
+ "b32729d9635e406884a8345ce61ad536",
+ "a9d45e528eb243ba81124e8641812001",
+ "7c99dc6dd7834c7b9c7b96d9e690b49f",
+ "7ad156904fc54b3187dd7fa260ee40dc",
+ "6b4d66c9cc3c4285b24e114fc7a0c5cc",
+ "016f278e55e9413e87687c59f27f77dc",
+ "13ccf5e5dd704b958a4b1d81d83bbe45",
+ "c47fe8ba1d674cd4b089230ac211ed1a",
+ "c18447aa88b8466aada1604f62a1e193",
+ "5b332bce2ee14a499e7867fe8f429b2d",
+ "043bf4419e49410cbe5fbcc103b4a17c",
+ "36a72fe07d434fd289844abe34a56bb8",
+ "52d85fbff5474c4cb25b28cb55a194a6",
+ "ba99479495564a5b9b3693a395828784",
+ "7e712c6fb44445a987c858bd8bdd347b",
+ "383aa217c6a848e191b421cc4a0346bf",
+ "538ef4577808453d8f3e6f6edc36ee1c",
+ "ffc624464e7f44ca9950e17570e70a99",
+ "60d4de86cf364df0935b5e1f19b2c6be",
+ "f7dc91d8904946a780e86ce4f0f4d5ed",
+ "dab01d139ae243cfa0389c5079ed3bfe",
+ "2ae8c5f6175c493cbc8e96552705ba37",
+ "4a9cdbfe12ac45be984b3a8f73d29dc1",
+ "c84f0d47fd3942be964ca7010f13c348",
+ "eac19f45ccb54329b42bbcb19a1f2fd4",
+ "5f353fa6b6f54b5ba9428ce4d8f3f1be",
+ "6465f64833024879b6ca055ceed6ed9d",
+ "281ea8998cbf40ee855310d991e979b8"
+ ]
+ },
+ "outputId": "8bdc5d38-c3d2-458e-dfbb-e825ea290a0f"
+ },
+ "outputs": [
+ {
+ "output_type": "display_data",
+ "data": {
+ "text/plain": [
+ "tokenizer_config.json: 0%| | 0.00/9.35k [00:00, ?B/s]"
+ ],
+ "application/vnd.jupyter.widget-view+json": {
+ "version_major": 2,
+ "version_minor": 0,
+ "model_id": "cf7e01f9046d4c22962a648618ad5f7c"
+ }
+ },
+ "metadata": {}
+ },
+ {
+ "output_type": "display_data",
+ "data": {
+ "text/plain": [
+ "tokenizer.json: 0%| | 0.00/2.12M [00:00, ?B/s]"
+ ],
+ "application/vnd.jupyter.widget-view+json": {
+ "version_major": 2,
+ "version_minor": 0,
+ "model_id": "37be9d87487f4a65bb3a553e054a9b9f"
+ }
+ },
+ "metadata": {}
+ },
+ {
+ "output_type": "display_data",
+ "data": {
+ "text/plain": [
+ "special_tokens_map.json: 0%| | 0.00/587 [00:00, ?B/s]"
+ ],
+ "application/vnd.jupyter.widget-view+json": {
+ "version_major": 2,
+ "version_minor": 0,
+ "model_id": "2c3628d3032f43f1a5698b863422be9c"
+ }
+ },
+ "metadata": {}
+ },
+ {
+ "output_type": "display_data",
+ "data": {
+ "text/plain": [
+ "config.json: 0%| | 0.00/738 [00:00, ?B/s]"
+ ],
+ "application/vnd.jupyter.widget-view+json": {
+ "version_major": 2,
+ "version_minor": 0,
+ "model_id": "a0cb3fa115ef4c2e90618a9fd9249e9c"
+ }
+ },
+ "metadata": {}
+ },
+ {
+ "output_type": "display_data",
+ "data": {
+ "text/plain": [
+ "model.safetensors.index.json: 0%| | 0.00/29.4k [00:00, ?B/s]"
+ ],
+ "application/vnd.jupyter.widget-view+json": {
+ "version_major": 2,
+ "version_minor": 0,
+ "model_id": "67185d66e50e4578bdabd94304bb673b"
+ }
+ },
+ "metadata": {}
+ },
+ {
+ "output_type": "display_data",
+ "data": {
+ "text/plain": [
+ "Downloading shards: 0%| | 0/2 [00:00, ?it/s]"
+ ],
+ "application/vnd.jupyter.widget-view+json": {
+ "version_major": 2,
+ "version_minor": 0,
+ "model_id": "1562cb138c5a413c859a701ed5b70dba"
+ }
+ },
+ "metadata": {}
+ },
+ {
+ "output_type": "display_data",
+ "data": {
+ "text/plain": [
+ "model-00001-of-00002.safetensors: 0%| | 0.00/4.98G [00:00, ?B/s]"
+ ],
+ "application/vnd.jupyter.widget-view+json": {
+ "version_major": 2,
+ "version_minor": 0,
+ "model_id": "0631ef1ac59a40dcb194ea0bf2ba94b6"
+ }
+ },
+ "metadata": {}
+ },
+ {
+ "output_type": "display_data",
+ "data": {
+ "text/plain": [
+ "model-00002-of-00002.safetensors: 0%| | 0.00/610M [00:00, ?B/s]"
+ ],
+ "application/vnd.jupyter.widget-view+json": {
+ "version_major": 2,
+ "version_minor": 0,
+ "model_id": "252f7db506bb41ec986f88ea4d5d4d36"
+ }
+ },
+ "metadata": {}
+ },
+ {
+ "output_type": "display_data",
+ "data": {
+ "text/plain": [
+ "Loading checkpoint shards: 0%| | 0/2 [00:00, ?it/s]"
+ ],
+ "application/vnd.jupyter.widget-view+json": {
+ "version_major": 2,
+ "version_minor": 0,
+ "model_id": "13ccf5e5dd704b958a4b1d81d83bbe45"
+ }
+ },
+ "metadata": {}
+ },
+ {
+ "output_type": "display_data",
+ "data": {
+ "text/plain": [
+ "generation_config.json: 0%| | 0.00/132 [00:00, ?B/s]"
+ ],
+ "application/vnd.jupyter.widget-view+json": {
+ "version_major": 2,
+ "version_minor": 0,
+ "model_id": "ffc624464e7f44ca9950e17570e70a99"
+ }
+ },
+ "metadata": {}
+ }
+ ],
+ "source": [
+ "seed=14\n",
+ "\n",
+ "\n",
+ "if (prev_checkpoint != None):\n",
+ " try:\n",
+ " download_checkpoint(out_name, prev_checkpoint)\n",
+ " except:\n",
+ " pass\n",
+ "tokenizer = AutoTokenizer.from_pretrained(model_name, trust_remote_code=True, token=READ_TOKEN, map_device=\"auto\", add_eos_token=True, use_fast=True)\n",
+ "\n",
+ "new_tokens = {'additional_special_tokens': ['[SQL]','[/SQL]', '[QUESTION]','[/QUESTION]']}\n",
+ "#adicionar tokens especiais:\n",
+ "# if (prev_checkpoint == None):\n",
+ "# tokenizer.add_special_tokens(new_tokens)\n",
+ "\n",
+ "\n",
+ "if torch.cuda.is_bf16_supported():\n",
+ " compute_dtype = torch.bfloat16\n",
+ " attn_implementation = 'flash_attention_2'\n",
+ "else:\n",
+ " compute_dtype = torch.float16\n",
+ " attn_implementation = 'sdpa'\n",
+ "\n",
+ "tokenizer.pad_token = tokenizer.eos_token\n",
+ "tokenizer.padding_side = \"right\"\n",
+ "\n",
+ "\n",
+ "bnb_config = BitsAndBytesConfig(\n",
+ " load_in_4bit=True,\n",
+ " bnb_4bit_quant_type=\"nf4\",\n",
+ " bnb_4bit_compute_dtype=compute_dtype,\n",
+ " bnb_4bit_use_double_quant=False,\n",
+ ")\n",
+ "\n",
+ "model = AutoModelForCausalLM.from_pretrained(\n",
+ " model_name,\n",
+ " torch_dtype=compute_dtype,\n",
+ " device_map=\"auto\",\n",
+ " quantization_config=bnb_config,\n",
+ "\n",
+ " trust_remote_code=True,\n",
+ " token=READ_TOKEN,\n",
+ " # attn_implementation=attn_implementation\n",
+ ")\n",
+ "\n",
+ "# se adicionar special_tokens tem que fazer resize do tokenizer:\n",
+ "# model.resize_token_embeddings(len(tokenizer))\n",
+ "\n",
+ "## model.resize_token_embeddings(max(len(tokenizer), model.config.vocab_size))"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "source": [
+ "# se adicionar special_tokens tem que fazer resize do tokenizer:\n",
+ "#model.resize_token_embeddings(len(tokenizer))\n",
+ "\n",
+ "#model.resize_token_embeddings(max(len(tokenizer), model.config.vocab_size))"
+ ],
+ "metadata": {
+ "colab": {
+ "base_uri": "https://localhost:8080/"
+ },
+ "id": "fLuqzhSJBvi8",
+ "outputId": "65293049-fcc8-491b-aaca-579bca0686c7"
+ },
+ "execution_count": null,
+ "outputs": [
+ {
+ "output_type": "stream",
+ "name": "stderr",
+ "text": [
+ "The new embeddings will be initialized from a multivariate normal distribution that has old embeddings' mean and covariance. As described in this article: https://nlp.stanford.edu/~johnhew/vocab-expansion.html. To disable this, use `mean_resizing=False`\n",
+ "The new lm_head weights will be initialized from a multivariate normal distribution that has old embeddings' mean and covariance. As described in this article: https://nlp.stanford.edu/~johnhew/vocab-expansion.html. To disable this, use `mean_resizing=False`\n"
+ ]
+ },
+ {
+ "output_type": "execute_result",
+ "data": {
+ "text/plain": [
+ "Embedding(32004, 2048)"
+ ]
+ },
+ "metadata": {},
+ "execution_count": 8
+ }
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "metadata": {
+ "id": "leGEqxURAL4r"
+ },
+ "source": [
+ "#### Chat Template - Schema Linking"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "source": [
+ "# tokenizer.chat_template = \"\"\"\n",
+ "# {% if messages[0]['role'] == 'system' %}\n",
+ "# {% set loop_messages = messages[1:] %}\n",
+ "# {% set system_message = messages[0]['content'] %}\n",
+ "# {% else %}\n",
+ "# {% set loop_messages = messages %}\n",
+ "# {% set system_message = 'You are an SQL expert tasked with answering questions about an SQLite database./n/Your responses must always consist of valid SQL code and only that.' %}\n",
+ "# {% endif %}\n",
+ "# {{ '# <|system|>/n/' + system_message + '/n//n/' }}\n",
+ "# {% if messages|selectattr(\"role\", \"equalto\", \"example\")|list %}\n",
+ "# Below are some examples of question and their corresponding SQL queries:/n//n/\n",
+ "# {% else %}\n",
+ "# /n/\n",
+ "# {% endif %}\n",
+ "# {% for message in loop_messages %}\n",
+ "# {% if message['role'] == 'example' %}\n",
+ "# {{ message['content'] }}/n//n/\n",
+ "# {% elif message['role'] == 'schema' %}\n",
+ "# # <|schema|>/n/The query will run on a database with the following schema:/n/{{ message['content'] }}/n//n/\n",
+ "# {% elif message['role'] == 'user' %}\n",
+ "# # <|user|>/n/[QUESTION]{{ message['content'] }}[/QUESTION]/n//n/\n",
+ "# {% elif message['role'] == 'assistant' %}\n",
+ "# # <|assistant|>/n/[SQL]{{ message['content'] }}[/SQL]\n",
+ "# {% endif %}\n",
+ "# {% endfor %}\n",
+ "# {% if add_generation_prompt %}\n",
+ "# # <|assistant|>/n/[SQL]\n",
+ "# {% endif %}\n",
+ "# \"\"\".replace(\"\\n\",\"\").replace(\" \", \"\").replace(\"/n/\", \"\\n\")\n"
+ ],
+ "metadata": {
+ "id": "Jiq-S5I1KOBr"
+ },
+ "execution_count": null,
+ "outputs": []
+ },
+ {
+ "cell_type": "code",
+ "execution_count": null,
+ "metadata": {
+ "id": "aHGTJNq2AmUs"
+ },
+ "outputs": [],
+ "source": [
+ "def to_sql(query):\n",
+ " return sqlparse.format(query, reindent=True, keyword_case='upper')\n",
+ "\n",
+ "def replace_last_sql_content(text, new_content):\n",
+ " matches = list(re.finditer(r'```sql (.*?)```', text, re.DOTALL))\n",
+ " if not matches:\n",
+ " return text\n",
+ "\n",
+ " last_match = matches[-1]\n",
+ "\n",
+ " start, end = last_match.span(1)\n",
+ " return text[:start] + new_content + text[end:]\n",
+ "\n",
+ "# def apply_template(row, tokenizer=tokenizer, n_examplea=0):\n",
+ "# question = row['question_en']\n",
+ "# schema = row['schema_llm']\n",
+ "# sql = to_sql(row['query_llm'])\n",
+ "\n",
+ "# system = \"Given a user question and the schema of a database, your task is to generate an SQL query that accurately answers the question based on the provided schema.\"\n",
+ "\n",
+ "\n",
+ "# chat = [{'role': 'user', 'content': f\"# System:\\n{system}\\n\\n# Schema:\\n```sql\\n{schema}\\n```\\n\\n# Question: {question}\"},\n",
+ "# {'role': 'assistant', 'content': f\"```sql\\n{sql}\\n```\"}\n",
+ "# ]\n",
+ "\n",
+ "# row['text'] = tokenizer.apply_chat_template(chat, tokenize=False, add_generation_prompt=False)\n",
+ "\n",
+ "# return row\n",
+ "\n",
+ "def apply_template(row, tokenizer=tokenizer, n_examplea=0):\n",
+ " question = row['question_en']\n",
+ " schema = row['schema_llm_t']\n",
+ " schema_linking = to_sql(row['selector_correct'])\n",
+ "\n",
+ " system = \"Given a user question and the schema of a database, your task is to generate an JSON with the the names of tables and columns of the schema that the question is referring to.\"\n",
+ "\n",
+ " chat = [{'role': 'user', 'content': f\"# System:\\n{system}\\n\\n# Schema:\\n```sql\\n{schema}\\n```\\n\\n# Question: {question}\"},\n",
+ " {'role': 'assistant', 'content': f\"```json\\n{schema_linking}\\n```\"}\n",
+ " ]\n",
+ "\n",
+ " row['text'] = tokenizer.apply_chat_template(chat, tokenize=False, add_generation_prompt=False)\n",
+ "\n",
+ " return row"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "source": [
+ "# spider_chain = json.load(open(\"/content/drive/Shareddrives/LLMs/Datasets/spider/spider_chain.json\", \"r\"))\n",
+ "# bird_chain = json.load(open(\"/content/drive/Shareddrives/LLMs/Datasets/bird/bird_chain.json\", \"r\"))"
+ ],
+ "metadata": {
+ "id": "QlA1kMj83Vql"
+ },
+ "execution_count": null,
+ "outputs": []
+ },
+ {
+ "cell_type": "code",
+ "source": [
+ "# df['chain'] = spider_chain + bird_chain"
+ ],
+ "metadata": {
+ "id": "pCcD4TiC3rpb"
+ },
+ "execution_count": null,
+ "outputs": []
+ },
+ {
+ "cell_type": "code",
+ "execution_count": null,
+ "metadata": {
+ "id": "yvcMZAL3E3TB"
+ },
+ "outputs": [],
+ "source": [
+ "df = df.apply(apply_template, axis=1)"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "source": [
+ "df.head()"
+ ],
+ "metadata": {
+ "colab": {
+ "base_uri": "https://localhost:8080/",
+ "height": 539
+ },
+ "id": "rQ0KUl2w58K9",
+ "outputId": "664b4e86-fe9f-45ee-bd2b-ea021a31b08f"
+ },
+ "execution_count": null,
+ "outputs": [
+ {
+ "output_type": "execute_result",
+ "data": {
+ "text/plain": [
+ " db_id schema \\\n",
+ "0 department_management \\nCREATE TABLE department (\\n\\t\"Department_ID\"... \n",
+ "1 department_management \\nCREATE TABLE department (\\n\\t\"Department_ID\"... \n",
+ "2 department_management \\nCREATE TABLE department (\\n\\t\"Department_ID\"... \n",
+ "3 department_management \\nCREATE TABLE department (\\n\\t\"Department_ID\"... \n",
+ "4 department_management \\nCREATE TABLE department (\\n\\t\"Department_ID\"... \n",
+ "\n",
+ " question_en hardness \\\n",
+ "0 How many heads of the departments are older th... easy \n",
+ "1 List the name, born state and age of the heads... medium \n",
+ "2 List the creation year, name and budget of eac... medium \n",
+ "3 What are the maximum and minimum budget of the... medium \n",
+ "4 What is the average number of employees of the... easy \n",
+ "\n",
+ " schema_llm \\\n",
+ "0 Table department (\\n department.Department_... \n",
+ "1 Table department (\\n department.Department_... \n",
+ "2 Table department (\\n department.Department_... \n",
+ "3 Table department (\\n department.Department_... \n",
+ "4 Table department (\\n department.Department_... \n",
+ "\n",
+ " query_llm \\\n",
+ "0 SELECT count(*) FROM head WHERE age > 56 \n",
+ "1 SELECT name , born_state , age FROM head ORD... \n",
+ "2 SELECT creation , name , budget_in_billions ... \n",
+ "3 SELECT max(budget_in_billions) , min(budget_i... \n",
+ "4 SELECT avg(num_employees) FROM department WHER... \n",
+ "\n",
+ " selector \\\n",
+ "0 {\\n 'head': ['head_id', 'age']\\n} \n",
+ "1 {\\n 'head': ['head_id', 'name', 'born_state',... \n",
+ "2 {\\n 'department': ['department_id', 'name', '... \n",
+ "3 {\\n 'department': ['department_id', 'budget_i... \n",
+ "4 {\\n 'department': ['department_id', 'ranking'... \n",
+ "\n",
+ " schema_llm_ct \\\n",
+ "0 CREATE TABLE department (\\n department.Depa... \n",
+ "1 CREATE TABLE department (\\n department.Depa... \n",
+ "2 CREATE TABLE department (\\n department.Depa... \n",
+ "3 CREATE TABLE department (\\n department.Depa... \n",
+ "4 CREATE TABLE department (\\n department.Depa... \n",
+ "\n",
+ " schema_llm_columns_min \\\n",
+ "0 Table department (\\n department.department_... \n",
+ "1 Table department (\\n department.department_... \n",
+ "2 Table department (\\n department.department_... \n",
+ "3 Table department (\\n department.department_... \n",
+ "4 Table department (\\n department.department_... \n",
+ "\n",
+ " schema_llm_columns_min_ct \\\n",
+ "0 CREATE TABLE department (\\n department.depa... \n",
+ "1 CREATE TABLE department (\\n department.depa... \n",
+ "2 CREATE TABLE department (\\n department.depa... \n",
+ "3 CREATE TABLE department (\\n department.depa... \n",
+ "4 CREATE TABLE department (\\n department.depa... \n",
+ "\n",
+ " schema_llm_all_min \\\n",
+ "0 Table department (\\n department.department_... \n",
+ "1 Table department (\\n department.department_... \n",
+ "2 Table department (\\n department.department_... \n",
+ "3 Table department (\\n department.department_... \n",
+ "4 Table department (\\n department.department_... \n",
+ "\n",
+ " schema_llm_all_min_ct \\\n",
+ "0 CREATE TABLE department (\\n department.depa... \n",
+ "1 CREATE TABLE department (\\n department.depa... \n",
+ "2 CREATE TABLE department (\\n department.depa... \n",
+ "3 CREATE TABLE department (\\n department.depa... \n",
+ "4 CREATE TABLE department (\\n department.depa... \n",
+ "\n",
+ " schema_dict \\\n",
+ "0 {\\n 'department': ['Department_ID', 'Name', '... \n",
+ "1 {\\n 'department': ['Department_ID', 'Name', '... \n",
+ "2 {\\n 'department': ['Department_ID', 'Name', '... \n",
+ "3 {\\n 'department': ['Department_ID', 'Name', '... \n",
+ "4 {\\n 'department': ['Department_ID', 'Name', '... \n",
+ "\n",
+ " selector_correct \\\n",
+ "0 {\\n 'head': ['head_ID', 'age']\\n} \n",
+ "1 {\\n 'head': ['head_ID', 'name', 'born_state',... \n",
+ "2 {\\n 'department': ['Department_ID', 'Name', '... \n",
+ "3 {\\n 'department': ['Department_ID', 'Budget_i... \n",
+ "4 {\\n 'department': ['Department_ID', 'Ranking'... \n",
+ "\n",
+ " schema_llm_t \\\n",
+ "0 TABLE department (\\n department.Department_... \n",
+ "1 TABLE department (\\n department.Department_... \n",
+ "2 TABLE department (\\n department.Department_... \n",
+ "3 TABLE department (\\n department.Department_... \n",
+ "4 TABLE department (\\n department.Department_... \n",
+ "\n",
+ " schema_llm_columns_min_t \\\n",
+ "0 TABLE department (\\n department.department_... \n",
+ "1 TABLE department (\\n department.department_... \n",
+ "2 TABLE department (\\n department.department_... \n",
+ "3 TABLE department (\\n department.department_... \n",
+ "4 TABLE department (\\n department.department_... \n",
+ "\n",
+ " schema_llm_all_min_t \\\n",
+ "0 TABLE department (\\n department.department_... \n",
+ "1 TABLE department (\\n department.department_... \n",
+ "2 TABLE department (\\n department.department_... \n",
+ "3 TABLE department (\\n department.department_... \n",
+ "4 TABLE department (\\n department.department_... \n",
+ "\n",
+ " text \n",
+ "0 <|begin_of_text|><|start_header_id|>system<|en... \n",
+ "1 <|begin_of_text|><|start_header_id|>system<|en... \n",
+ "2 <|begin_of_text|><|start_header_id|>system<|en... \n",
+ "3 <|begin_of_text|><|start_header_id|>system<|en... \n",
+ "4 <|begin_of_text|><|start_header_id|>system<|en... "
+ ],
+ "text/html": [
+ "\n",
+ "
\n",
+ "
\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " db_id | \n",
+ " schema | \n",
+ " question_en | \n",
+ " hardness | \n",
+ " schema_llm | \n",
+ " query_llm | \n",
+ " selector | \n",
+ " schema_llm_ct | \n",
+ " schema_llm_columns_min | \n",
+ " schema_llm_columns_min_ct | \n",
+ " schema_llm_all_min | \n",
+ " schema_llm_all_min_ct | \n",
+ " schema_dict | \n",
+ " selector_correct | \n",
+ " schema_llm_t | \n",
+ " schema_llm_columns_min_t | \n",
+ " schema_llm_all_min_t | \n",
+ " text | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " 0 | \n",
+ " department_management | \n",
+ " \\nCREATE TABLE department (\\n\\t\"Department_ID\"... | \n",
+ " How many heads of the departments are older th... | \n",
+ " easy | \n",
+ " Table department (\\n department.Department_... | \n",
+ " SELECT count(*) FROM head WHERE age > 56 | \n",
+ " {\\n 'head': ['head_id', 'age']\\n} | \n",
+ " CREATE TABLE department (\\n department.Depa... | \n",
+ " Table department (\\n department.department_... | \n",
+ " CREATE TABLE department (\\n department.depa... | \n",
+ " Table department (\\n department.department_... | \n",
+ " CREATE TABLE department (\\n department.depa... | \n",
+ " {\\n 'department': ['Department_ID', 'Name', '... | \n",
+ " {\\n 'head': ['head_ID', 'age']\\n} | \n",
+ " TABLE department (\\n department.Department_... | \n",
+ " TABLE department (\\n department.department_... | \n",
+ " TABLE department (\\n department.department_... | \n",
+ " <|begin_of_text|><|start_header_id|>system<|en... | \n",
+ "
\n",
+ " \n",
+ " 1 | \n",
+ " department_management | \n",
+ " \\nCREATE TABLE department (\\n\\t\"Department_ID\"... | \n",
+ " List the name, born state and age of the heads... | \n",
+ " medium | \n",
+ " Table department (\\n department.Department_... | \n",
+ " SELECT name , born_state , age FROM head ORD... | \n",
+ " {\\n 'head': ['head_id', 'name', 'born_state',... | \n",
+ " CREATE TABLE department (\\n department.Depa... | \n",
+ " Table department (\\n department.department_... | \n",
+ " CREATE TABLE department (\\n department.depa... | \n",
+ " Table department (\\n department.department_... | \n",
+ " CREATE TABLE department (\\n department.depa... | \n",
+ " {\\n 'department': ['Department_ID', 'Name', '... | \n",
+ " {\\n 'head': ['head_ID', 'name', 'born_state',... | \n",
+ " TABLE department (\\n department.Department_... | \n",
+ " TABLE department (\\n department.department_... | \n",
+ " TABLE department (\\n department.department_... | \n",
+ " <|begin_of_text|><|start_header_id|>system<|en... | \n",
+ "
\n",
+ " \n",
+ " 2 | \n",
+ " department_management | \n",
+ " \\nCREATE TABLE department (\\n\\t\"Department_ID\"... | \n",
+ " List the creation year, name and budget of eac... | \n",
+ " medium | \n",
+ " Table department (\\n department.Department_... | \n",
+ " SELECT creation , name , budget_in_billions ... | \n",
+ " {\\n 'department': ['department_id', 'name', '... | \n",
+ " CREATE TABLE department (\\n department.Depa... | \n",
+ " Table department (\\n department.department_... | \n",
+ " CREATE TABLE department (\\n department.depa... | \n",
+ " Table department (\\n department.department_... | \n",
+ " CREATE TABLE department (\\n department.depa... | \n",
+ " {\\n 'department': ['Department_ID', 'Name', '... | \n",
+ " {\\n 'department': ['Department_ID', 'Name', '... | \n",
+ " TABLE department (\\n department.Department_... | \n",
+ " TABLE department (\\n department.department_... | \n",
+ " TABLE department (\\n department.department_... | \n",
+ " <|begin_of_text|><|start_header_id|>system<|en... | \n",
+ "
\n",
+ " \n",
+ " 3 | \n",
+ " department_management | \n",
+ " \\nCREATE TABLE department (\\n\\t\"Department_ID\"... | \n",
+ " What are the maximum and minimum budget of the... | \n",
+ " medium | \n",
+ " Table department (\\n department.Department_... | \n",
+ " SELECT max(budget_in_billions) , min(budget_i... | \n",
+ " {\\n 'department': ['department_id', 'budget_i... | \n",
+ " CREATE TABLE department (\\n department.Depa... | \n",
+ " Table department (\\n department.department_... | \n",
+ " CREATE TABLE department (\\n department.depa... | \n",
+ " Table department (\\n department.department_... | \n",
+ " CREATE TABLE department (\\n department.depa... | \n",
+ " {\\n 'department': ['Department_ID', 'Name', '... | \n",
+ " {\\n 'department': ['Department_ID', 'Budget_i... | \n",
+ " TABLE department (\\n department.Department_... | \n",
+ " TABLE department (\\n department.department_... | \n",
+ " TABLE department (\\n department.department_... | \n",
+ " <|begin_of_text|><|start_header_id|>system<|en... | \n",
+ "
\n",
+ " \n",
+ " 4 | \n",
+ " department_management | \n",
+ " \\nCREATE TABLE department (\\n\\t\"Department_ID\"... | \n",
+ " What is the average number of employees of the... | \n",
+ " easy | \n",
+ " Table department (\\n department.Department_... | \n",
+ " SELECT avg(num_employees) FROM department WHER... | \n",
+ " {\\n 'department': ['department_id', 'ranking'... | \n",
+ " CREATE TABLE department (\\n department.Depa... | \n",
+ " Table department (\\n department.department_... | \n",
+ " CREATE TABLE department (\\n department.depa... | \n",
+ " Table department (\\n department.department_... | \n",
+ " CREATE TABLE department (\\n department.depa... | \n",
+ " {\\n 'department': ['Department_ID', 'Name', '... | \n",
+ " {\\n 'department': ['Department_ID', 'Ranking'... | \n",
+ " TABLE department (\\n department.Department_... | \n",
+ " TABLE department (\\n department.department_... | \n",
+ " TABLE department (\\n department.department_... | \n",
+ " <|begin_of_text|><|start_header_id|>system<|en... | \n",
+ "
\n",
+ " \n",
+ "
\n",
+ "
\n",
+ "
\n",
+ "
\n"
+ ],
+ "application/vnd.google.colaboratory.intrinsic+json": {
+ "type": "dataframe",
+ "variable_name": "df",
+ "summary": "{\n \"name\": \"df\",\n \"rows\": 8656,\n \"fields\": [\n {\n \"column\": \"db_id\",\n \"properties\": {\n \"dtype\": \"category\",\n \"num_unique_values\": 146,\n \"samples\": [\n \"gas_company\",\n \"customers_campaigns_ecommerce\",\n \"performance_attendance\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"schema\",\n \"properties\": {\n \"dtype\": \"category\",\n \"num_unique_values\": 146,\n \"samples\": [\n \"\\nCREATE TABLE company (\\n\\t\\\"Company_ID\\\" INTEGER, \\n\\t\\\"Rank\\\" INTEGER, \\n\\t\\\"Company\\\" TEXT, \\n\\t\\\"Headquarters\\\" TEXT, \\n\\t\\\"Main_Industry\\\" TEXT, \\n\\t\\\"Sales_billion\\\" REAL, \\n\\t\\\"Profits_billion\\\" REAL, \\n\\t\\\"Assets_billion\\\" REAL, \\n\\t\\\"Market_Value\\\" REAL, \\n\\tPRIMARY KEY (\\\"Company_ID\\\")\\n)\\n\\n\\nCREATE TABLE gas_station (\\n\\t\\\"Station_ID\\\" INTEGER, \\n\\t\\\"Open_Year\\\" INTEGER, \\n\\t\\\"Location\\\" TEXT, \\n\\t\\\"Manager_Name\\\" TEXT, \\n\\t\\\"Vice_Manager_Name\\\" TEXT, \\n\\t\\\"Representative_Name\\\" TEXT, \\n\\tPRIMARY KEY (\\\"Station_ID\\\")\\n)\\n\\n\\nCREATE TABLE station_company (\\n\\t\\\"Station_ID\\\" INTEGER, \\n\\t\\\"Company_ID\\\" INTEGER, \\n\\t\\\"Rank_of_the_Year\\\" INTEGER, \\n\\tPRIMARY KEY (\\\"Station_ID\\\", \\\"Company_ID\\\"), \\n\\tFOREIGN KEY(\\\"Company_ID\\\") REFERENCES company (\\\"Company_ID\\\"), \\n\\tFOREIGN KEY(\\\"Station_ID\\\") REFERENCES gas_station (\\\"Station_ID\\\")\\n)\",\n \"\\nCREATE TABLE \\\"Customer_Addresses\\\" (\\n\\tcustomer_id INTEGER NOT NULL, \\n\\tpremise_id INTEGER NOT NULL, \\n\\tdate_address_from DATETIME NOT NULL, \\n\\taddress_type_code VARCHAR(15) NOT NULL, \\n\\tdate_address_to DATETIME, \\n\\tFOREIGN KEY(customer_id) REFERENCES \\\"Customers\\\" (customer_id), \\n\\tFOREIGN KEY(premise_id) REFERENCES \\\"Premises\\\" (premise_id)\\n)\\n\\n\\nCREATE TABLE \\\"Customer_Orders\\\" (\\n\\torder_id INTEGER, \\n\\tcustomer_id INTEGER NOT NULL, \\n\\torder_status_code VARCHAR(15) NOT NULL, \\n\\tshipping_method_code VARCHAR(15) NOT NULL, \\n\\torder_placed_datetime DATETIME NOT NULL, \\n\\torder_delivered_datetime DATETIME, \\n\\torder_shipping_charges VARCHAR(255), \\n\\tPRIMARY KEY (order_id), \\n\\tFOREIGN KEY(customer_id) REFERENCES \\\"Customers\\\" (customer_id)\\n)\\n\\n\\nCREATE TABLE \\\"Customers\\\" (\\n\\tcustomer_id INTEGER, \\n\\tpayment_method VARCHAR(15) NOT NULL, \\n\\tcustomer_name VARCHAR(80), \\n\\tcustomer_phone VARCHAR(80), \\n\\tcustomer_email VARCHAR(80), \\n\\tcustomer_address VARCHAR(255), \\n\\tcustomer_login VARCHAR(80), \\n\\tcustomer_password VARCHAR(10), \\n\\tPRIMARY KEY (customer_id)\\n)\\n\\n\\nCREATE TABLE \\\"Mailshot_Campaigns\\\" (\\n\\tmailshot_id INTEGER, \\n\\tproduct_category VARCHAR(15), \\n\\tmailshot_name VARCHAR(80), \\n\\tmailshot_start_date DATETIME, \\n\\tmailshot_end_date DATETIME, \\n\\tPRIMARY KEY (mailshot_id)\\n)\\n\\n\\nCREATE TABLE \\\"Mailshot_Customers\\\" (\\n\\tmailshot_id INTEGER NOT NULL, \\n\\tcustomer_id INTEGER NOT NULL, \\n\\toutcome_code VARCHAR(15) NOT NULL, \\n\\tmailshot_customer_date DATETIME, \\n\\tFOREIGN KEY(mailshot_id) REFERENCES \\\"Mailshot_Campaigns\\\" (mailshot_id), \\n\\tFOREIGN KEY(customer_id) REFERENCES \\\"Customers\\\" (customer_id)\\n)\\n\\n\\nCREATE TABLE \\\"Order_Items\\\" (\\n\\titem_id INTEGER NOT NULL, \\n\\torder_item_status_code VARCHAR(15) NOT NULL, \\n\\torder_id INTEGER NOT NULL, \\n\\tproduct_id INTEGER NOT NULL, \\n\\titem_status_code VARCHAR(15), \\n\\titem_delivered_datetime DATETIME, \\n\\titem_order_quantity VARCHAR(80), \\n\\tFOREIGN KEY(order_id) REFERENCES \\\"Customer_Orders\\\" (order_id), \\n\\tFOREIGN KEY(product_id) REFERENCES \\\"Products\\\" (product_id)\\n)\\n\\n\\nCREATE TABLE \\\"Premises\\\" (\\n\\tpremise_id INTEGER, \\n\\tpremises_type VARCHAR(15) NOT NULL, \\n\\tpremise_details VARCHAR(255), \\n\\tPRIMARY KEY (premise_id)\\n)\\n\\n\\nCREATE TABLE \\\"Products\\\" (\\n\\tproduct_id INTEGER, \\n\\tproduct_category VARCHAR(15) NOT NULL, \\n\\tproduct_name VARCHAR(80), \\n\\tPRIMARY KEY (product_id)\\n)\",\n \"\\nCREATE TABLE member (\\n\\t\\\"Member_ID\\\" TEXT, \\n\\t\\\"Name\\\" TEXT, \\n\\t\\\"Nationality\\\" TEXT, \\n\\t\\\"Role\\\" TEXT, \\n\\tPRIMARY KEY (\\\"Member_ID\\\")\\n)\\n\\n\\nCREATE TABLE member_attendance (\\n\\t\\\"Member_ID\\\" INTEGER, \\n\\t\\\"Performance_ID\\\" INTEGER, \\n\\t\\\"Num_of_Pieces\\\" INTEGER, \\n\\tPRIMARY KEY (\\\"Member_ID\\\", \\\"Performance_ID\\\"), \\n\\tFOREIGN KEY(\\\"Performance_ID\\\") REFERENCES performance (\\\"Performance_ID\\\"), \\n\\tFOREIGN KEY(\\\"Member_ID\\\") REFERENCES member (\\\"Member_ID\\\")\\n)\\n\\n\\nCREATE TABLE performance (\\n\\t\\\"Performance_ID\\\" REAL, \\n\\t\\\"Date\\\" TEXT, \\n\\t\\\"Host\\\" TEXT, \\n\\t\\\"Location\\\" TEXT, \\n\\t\\\"Attendance\\\" INTEGER, \\n\\tPRIMARY KEY (\\\"Performance_ID\\\")\\n)\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"question_en\",\n \"properties\": {\n \"dtype\": \"string\",\n \"num_unique_values\": 8618,\n \"samples\": [\n \"What are the names of courses without prerequisites?\",\n \"Return the investor who have invested in the greatest number of entrepreneurs.\",\n \"Which customers have ever canceled the purchase of the product \\\"food\\\" (the item status is \\\"Cancel\\\")?\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"hardness\",\n \"properties\": {\n \"dtype\": \"category\",\n \"num_unique_values\": 4,\n \"samples\": [\n \"medium\",\n \"extra\",\n \"easy\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"schema_llm\",\n \"properties\": {\n \"dtype\": \"category\",\n \"num_unique_values\": 146,\n \"samples\": [\n \"Table company (\\n company.Company_ID (INT),\\n company.Rank (INT),\\n company.Company (TEXT),\\n company.Headquarters (TEXT),\\n company.Main_Industry (TEXT),\\n company.Sales_billion (REAL),\\n company.Profits_billion (REAL),\\n company.Assets_billion (REAL),\\n company.Market_Value (REAL),\\n)\\n\\nTable gas_station (\\n gas_station.Station_ID (INT),\\n gas_station.Open_Year (INT),\\n gas_station.Location (TEXT),\\n gas_station.Manager_Name (TEXT),\\n gas_station.Vice_Manager_Name (TEXT),\\n gas_station.Representative_Name (TEXT),\\n)\\n\\nTable station_company (\\n station_company.Station_ID (INT),\\n station_company.Company_ID (INT),\\n station_company.Rank_of_the_Year (INT),\\n)\\n\\n\\nPossible JOINs:\\n\\nstation_company.Station_ID = gas_station.Station_ID\\nstation_company.Company_ID = company.Company_ID\\n\",\n \"Table Customer_Addresses (\\n Customer_Addresses.customer_id (INTEGER),\\n Customer_Addresses.premise_id (INTEGER),\\n Customer_Addresses.date_address_from (DATETIME),\\n Customer_Addresses.address_type_code (VARCHAR(15)),\\n Customer_Addresses.date_address_to (DATETIME),\\n)\\n\\nTable Customer_Orders (\\n Customer_Orders.order_id (INTEGER),\\n Customer_Orders.customer_id (INTEGER),\\n Customer_Orders.order_status_code (VARCHAR(15)),\\n Customer_Orders.shipping_method_code (VARCHAR(15)),\\n Customer_Orders.order_placed_datetime (DATETIME),\\n Customer_Orders.order_delivered_datetime (DATETIME),\\n Customer_Orders.order_shipping_charges (VARCHAR(255)),\\n)\\n\\nTable Customers (\\n Customers.customer_id (INTEGER),\\n Customers.payment_method (VARCHAR(15)),\\n Customers.customer_name (VARCHAR(80)),\\n Customers.customer_phone (VARCHAR(80)),\\n Customers.customer_email (VARCHAR(80)),\\n Customers.customer_address (VARCHAR(255)),\\n Customers.customer_login (VARCHAR(80)),\\n Customers.customer_password (VARCHAR(10)),\\n)\\n\\nTable Mailshot_Campaigns (\\n Mailshot_Campaigns.mailshot_id (INTEGER),\\n Mailshot_Campaigns.product_category (VARCHAR(15)),\\n Mailshot_Campaigns.mailshot_name (VARCHAR(80)),\\n Mailshot_Campaigns.mailshot_start_date (DATETIME),\\n Mailshot_Campaigns.mailshot_end_date (DATETIME),\\n)\\n\\nTable Mailshot_Customers (\\n Mailshot_Customers.mailshot_id (INTEGER),\\n Mailshot_Customers.customer_id (INTEGER),\\n Mailshot_Customers.outcome_code (VARCHAR(15)),\\n Mailshot_Customers.mailshot_customer_date (DATETIME),\\n)\\n\\nTable Order_Items (\\n Order_Items.item_id (INTEGER),\\n Order_Items.order_item_status_code (VARCHAR(15)),\\n Order_Items.order_id (INTEGER),\\n Order_Items.product_id (INTEGER),\\n Order_Items.item_status_code (VARCHAR(15)),\\n Order_Items.item_delivered_datetime (DATETIME),\\n Order_Items.item_order_quantity (VARCHAR(80)),\\n)\\n\\nTable Premises (\\n Premises.premise_id (INTEGER),\\n Premises.premises_type (VARCHAR(15)),\\n Premises.premise_details (VARCHAR(255)),\\n)\\n\\nTable Products (\\n Products.product_id (INTEGER),\\n Products.product_category (VARCHAR(15)),\\n Products.product_name (VARCHAR(80)),\\n)\\n\\n\\nPossible JOINs:\\n\\nCustomer_Addresses.customer_id = Customers.customer_id\\nCustomer_Addresses.premise_id = Premises.premise_id\\n\\nCustomer_Orders.customer_id = Customers.customer_id\\n\\nMailshot_Customers.mailshot_id = Mailshot_Campaigns.mailshot_id\\nMailshot_Customers.customer_id = Customers.customer_id\\n\\nOrder_Items.order_id = Customer_Orders.order_id\\nOrder_Items.product_id = Products.product_id\\n\",\n \"Table member (\\n member.Member_ID (TEXT),\\n member.Name (TEXT),\\n member.Nationality (TEXT),\\n member.Role (TEXT),\\n)\\n\\nTable member_attendance (\\n member_attendance.Member_ID (INT),\\n member_attendance.Performance_ID (INT),\\n member_attendance.Num_of_Pieces (INT),\\n)\\n\\nTable performance (\\n performance.Performance_ID (REAL),\\n performance.Date (TEXT),\\n performance.Host (TEXT),\\n performance.Location (TEXT),\\n performance.Attendance (INT),\\n)\\n\\n\\nPossible JOINs:\\n\\nmember_attendance.Member_ID = member.Member_ID\\nmember_attendance.Performance_ID = performance.Performance_ID\\n\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"query_llm\",\n \"properties\": {\n \"dtype\": \"string\",\n \"num_unique_values\": 4712,\n \"samples\": [\n \"SELECT manager_name FROM gas_station WHERE open_year > 2000 GROUP BY manager_name ORDER BY count(*) DESC LIMIT 1\",\n \"SELECT lname FROM authors WHERE fname = \\\"Amal\\\"\",\n \"SELECT * FROM swimmer\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"selector\",\n \"properties\": {\n \"dtype\": \"category\",\n \"num_unique_values\": 3358,\n \"samples\": [\n \"{\\n 'rating': ['mid', 'stars'],\\n 'movie': ['mid', 'title', 'director']\\n}\",\n \"{\\n 'player': ['birth_country', 'bats']\\n}\",\n \"{\\n 'bank': ['branch_id', 'city']\\n}\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"schema_llm_ct\",\n \"properties\": {\n \"dtype\": \"category\",\n \"num_unique_values\": 147,\n \"samples\": [\n \"CREATE TABLE country (\\n country.Country_ID (INT),\\n country.Name (TEXT),\\n country.Population (INT),\\n country.Area (INT),\\n country.Languages (TEXT),\\n)\\n\\nCREATE TABLE roller_coaster (\\n roller_coaster.Roller_Coaster_ID (INT),\\n roller_coaster.Name (TEXT),\\n roller_coaster.Park (TEXT),\\n roller_coaster.Country_ID (INT),\\n roller_coaster.Length (REAL),\\n roller_coaster.Height (REAL),\\n roller_coaster.Speed (TEXT),\\n roller_coaster.Opened (TEXT),\\n roller_coaster.Status (TEXT),\\n)\\n\\n\\nPossible JOINs:\\n\\nroller_coaster.Country_ID = country.Country_ID\\n\",\n \"CREATE TABLE circuits (\\n circuits.circuitId (INTEGER),\\n circuits.circuitRef (TEXT),\\n circuits.name (TEXT),\\n circuits.location (TEXT),\\n circuits.country (TEXT),\\n circuits.lat (REAL),\\n circuits.lng (REAL),\\n circuits.alt (TEXT),\\n circuits.url (TEXT),\\n)\\n\\nCREATE TABLE constructorResults (\\n constructorResults.constructorResultsId (INTEGER),\\n constructorResults.raceId (INTEGER),\\n constructorResults.constructorId (INTEGER),\\n constructorResults.points (REAL),\\n constructorResults.status (TEXT),\\n)\\n\\nCREATE TABLE constructorStandings (\\n constructorStandings.constructorStandingsId (INTEGER),\\n constructorStandings.raceId (INTEGER),\\n constructorStandings.constructorId (INTEGER),\\n constructorStandings.points (REAL),\\n constructorStandings.position (INTEGER),\\n constructorStandings.positionText (TEXT),\\n constructorStandings.wins (INTEGER),\\n)\\n\\nCREATE TABLE constructors (\\n constructors.constructorId (INTEGER),\\n constructors.constructorRef (TEXT),\\n constructors.name (TEXT),\\n constructors.nationality (TEXT),\\n constructors.url (TEXT),\\n)\\n\\nCREATE TABLE driverStandings (\\n driverStandings.driverStandingsId (INTEGER),\\n driverStandings.raceId (INTEGER),\\n driverStandings.driverId (INTEGER),\\n driverStandings.points (REAL),\\n driverStandings.position (INTEGER),\\n driverStandings.positionText (TEXT),\\n driverStandings.wins (INTEGER),\\n)\\n\\nCREATE TABLE drivers (\\n drivers.driverId (INTEGER),\\n drivers.driverRef (TEXT),\\n drivers.number (TEXT),\\n drivers.code (TEXT),\\n drivers.forename (TEXT),\\n drivers.surname (TEXT),\\n drivers.dob (TEXT),\\n drivers.nationality (TEXT),\\n drivers.url (TEXT),\\n)\\n\\nCREATE TABLE lapTimes (\\n lapTimes.raceId (INTEGER),\\n lapTimes.driverId (INTEGER),\\n lapTimes.lap (INTEGER),\\n lapTimes.position (INTEGER),\\n lapTimes.time (TEXT),\\n lapTimes.milliseconds (INTEGER),\\n)\\n\\nCREATE TABLE pitStops (\\n pitStops.raceId (INTEGER),\\n pitStops.driverId (INTEGER),\\n pitStops.stop (INTEGER),\\n pitStops.lap (INTEGER),\\n pitStops.time (TEXT),\\n pitStops.duration (TEXT),\\n pitStops.milliseconds (INTEGER),\\n)\\n\\nCREATE TABLE qualifying (\\n qualifying.qualifyId (INTEGER),\\n qualifying.raceId (INTEGER),\\n qualifying.driverId (INTEGER),\\n qualifying.constructorId (INTEGER),\\n qualifying.number (INTEGER),\\n qualifying.position (INTEGER),\\n qualifying.q1 (TEXT),\\n qualifying.q2 (TEXT),\\n qualifying.q3 (TEXT),\\n)\\n\\nCREATE TABLE races (\\n races.raceId (INTEGER),\\n races.year (INTEGER),\\n races.round (INTEGER),\\n races.circuitId (INTEGER),\\n races.name (TEXT),\\n races.date (TEXT),\\n races.time (TEXT),\\n races.url (TEXT),\\n)\\n\\nCREATE TABLE results (\\n results.resultId (INTEGER),\\n results.raceId (INTEGER),\\n results.driverId (INTEGER),\\n results.constructorId (INTEGER),\\n results.number (INTEGER),\\n results.grid (INTEGER),\\n results.position (TEXT),\\n results.positionText (TEXT),\\n results.positionOrder (INTEGER),\\n results.points (REAL),\\n results.laps (TEXT),\\n results.time (TEXT),\\n results.milliseconds (TEXT),\\n results.fastestLap (TEXT),\\n results.rank (TEXT),\\n results.fastestLapTime (TEXT),\\n results.fastestLapSpeed (TEXT),\\n results.statusId (INTEGER),\\n)\\n\\nCREATE TABLE seasons (\\n seasons.year (INTEGER),\\n seasons.url (TEXT),\\n)\\n\\nCREATE TABLE status (\\n status.statusId (INTEGER),\\n status.status (TEXT),\\n)\\n\\n\\nPossible JOINs:\\n\\nconstructorResults.raceId = races.raceId\\nconstructorResults.constructorId = constructors.constructorId\\n\\nconstructorStandings.raceId = races.raceId\\nconstructorStandings.constructorId = constructors.constructorId\\n\\ndriverStandings.raceId = races.raceId\\ndriverStandings.driverId = drivers.driverId\\n\\nlapTimes.raceId = races.raceId\\nlapTimes.driverId = drivers.driverId\\n\\npitStops.raceId = races.raceId\\npitStops.driverId = drivers.driverId\\n\\nqualifying.raceId = races.raceId\\nqualifying.driverId = drivers.driverId\\nqualifying.constructorId = constructors.constructorId\\n\\nraces.circuitId = circuits.circuitId\\n\\nresults.raceId = races.raceId\\nresults.driverId = drivers.driverId\\nresults.constructorId = constructors.constructorId\\n\",\n \"CREATE TABLE Customers (\\n Customers.customer_id (INTEGER),\\n Customers.customer_name (VARCHAR(80)),\\n Customers.customer_details (VARCHAR(255)),\\n)\\n\\nCREATE TABLE Invoices (\\n Invoices.invoice_number (INTEGER),\\n Invoices.invoice_date (DATETIME),\\n Invoices.invoice_details (VARCHAR(255)),\\n)\\n\\nCREATE TABLE Order_Items (\\n Order_Items.order_item_id (INTEGER),\\n Order_Items.product_id (INTEGER),\\n Order_Items.order_id (INTEGER),\\n Order_Items.order_item_status (VARCHAR(10)),\\n Order_Items.order_item_details (VARCHAR(255)),\\n)\\n\\nCREATE TABLE Orders (\\n Orders.order_id (INTEGER),\\n Orders.customer_id (INTEGER),\\n Orders.order_status (VARCHAR(10)),\\n Orders.date_order_placed (DATETIME),\\n Orders.order_details (VARCHAR(255)),\\n)\\n\\nCREATE TABLE Products (\\n Products.product_id (INTEGER),\\n Products.product_name (VARCHAR(80)),\\n Products.product_details (VARCHAR(255)),\\n)\\n\\nCREATE TABLE Shipment_Items (\\n Shipment_Items.shipment_id (INTEGER),\\n Shipment_Items.order_item_id (INTEGER),\\n)\\n\\nCREATE TABLE Shipments (\\n Shipments.shipment_id (INTEGER),\\n Shipments.order_id (INTEGER),\\n Shipments.invoice_number (INTEGER),\\n Shipments.shipment_tracking_number (VARCHAR(80)),\\n Shipments.shipment_date (DATETIME),\\n Shipments.other_shipment_details (VARCHAR(255)),\\n)\\n\\n\\nPossible JOINs:\\n\\nOrder_Items.product_id = Products.product_id\\nOrder_Items.order_id = Orders.order_id\\n\\nOrders.customer_id = Customers.customer_id\\n\\nShipment_Items.shipment_id = Shipments.shipment_id\\nShipment_Items.order_item_id = Order_Items.order_item_id\\n\\nShipments.order_id = Orders.order_id\\nShipments.invoice_number = Invoices.invoice_number\\n\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"schema_llm_columns_min\",\n \"properties\": {\n \"dtype\": \"category\",\n \"num_unique_values\": 147,\n \"samples\": [\n \"Table country (\\n country.country_id (INT),\\n country.name (TEXT),\\n country.population (INT),\\n country.area (INT),\\n country.languages (TEXT),\\n)\\n\\nTable roller_coaster (\\n roller_coaster.roller_coaster_id (INT),\\n roller_coaster.name (TEXT),\\n roller_coaster.park (TEXT),\\n roller_coaster.country_id (INT),\\n roller_coaster.length (REAL),\\n roller_coaster.height (REAL),\\n roller_coaster.speed (TEXT),\\n roller_coaster.opened (TEXT),\\n roller_coaster.status (TEXT),\\n)\\n\\n\\nPossible JOINs:\\n\\nroller_coaster.country_id = country.country_id\\n\",\n \"Table circuits (\\n circuits.circuitid (INTEGER),\\n circuits.circuitref (TEXT),\\n circuits.name (TEXT),\\n circuits.location (TEXT),\\n circuits.country (TEXT),\\n circuits.lat (REAL),\\n circuits.lng (REAL),\\n circuits.alt (TEXT),\\n circuits.url (TEXT),\\n)\\n\\nTable constructorResults (\\n constructorResults.constructorresultsid (INTEGER),\\n constructorResults.raceid (INTEGER),\\n constructorResults.constructorid (INTEGER),\\n constructorResults.points (REAL),\\n constructorResults.status (TEXT),\\n)\\n\\nTable constructorStandings (\\n constructorStandings.constructorstandingsid (INTEGER),\\n constructorStandings.raceid (INTEGER),\\n constructorStandings.constructorid (INTEGER),\\n constructorStandings.points (REAL),\\n constructorStandings.position (INTEGER),\\n constructorStandings.positiontext (TEXT),\\n constructorStandings.wins (INTEGER),\\n)\\n\\nTable constructors (\\n constructors.constructorid (INTEGER),\\n constructors.constructorref (TEXT),\\n constructors.name (TEXT),\\n constructors.nationality (TEXT),\\n constructors.url (TEXT),\\n)\\n\\nTable driverStandings (\\n driverStandings.driverstandingsid (INTEGER),\\n driverStandings.raceid (INTEGER),\\n driverStandings.driverid (INTEGER),\\n driverStandings.points (REAL),\\n driverStandings.position (INTEGER),\\n driverStandings.positiontext (TEXT),\\n driverStandings.wins (INTEGER),\\n)\\n\\nTable drivers (\\n drivers.driverid (INTEGER),\\n drivers.driverref (TEXT),\\n drivers.number (TEXT),\\n drivers.code (TEXT),\\n drivers.forename (TEXT),\\n drivers.surname (TEXT),\\n drivers.dob (TEXT),\\n drivers.nationality (TEXT),\\n drivers.url (TEXT),\\n)\\n\\nTable lapTimes (\\n lapTimes.raceid (INTEGER),\\n lapTimes.driverid (INTEGER),\\n lapTimes.lap (INTEGER),\\n lapTimes.position (INTEGER),\\n lapTimes.time (TEXT),\\n lapTimes.milliseconds (INTEGER),\\n)\\n\\nTable pitStops (\\n pitStops.raceid (INTEGER),\\n pitStops.driverid (INTEGER),\\n pitStops.stop (INTEGER),\\n pitStops.lap (INTEGER),\\n pitStops.time (TEXT),\\n pitStops.duration (TEXT),\\n pitStops.milliseconds (INTEGER),\\n)\\n\\nTable qualifying (\\n qualifying.qualifyid (INTEGER),\\n qualifying.raceid (INTEGER),\\n qualifying.driverid (INTEGER),\\n qualifying.constructorid (INTEGER),\\n qualifying.number (INTEGER),\\n qualifying.position (INTEGER),\\n qualifying.q1 (TEXT),\\n qualifying.q2 (TEXT),\\n qualifying.q3 (TEXT),\\n)\\n\\nTable races (\\n races.raceid (INTEGER),\\n races.year (INTEGER),\\n races.round (INTEGER),\\n races.circuitid (INTEGER),\\n races.name (TEXT),\\n races.date (TEXT),\\n races.time (TEXT),\\n races.url (TEXT),\\n)\\n\\nTable results (\\n results.resultid (INTEGER),\\n results.raceid (INTEGER),\\n results.driverid (INTEGER),\\n results.constructorid (INTEGER),\\n results.number (INTEGER),\\n results.grid (INTEGER),\\n results.position (TEXT),\\n results.positiontext (TEXT),\\n results.positionorder (INTEGER),\\n results.points (REAL),\\n results.laps (TEXT),\\n results.time (TEXT),\\n results.milliseconds (TEXT),\\n results.fastestlap (TEXT),\\n results.rank (TEXT),\\n results.fastestlaptime (TEXT),\\n results.fastestlapspeed (TEXT),\\n results.statusid (INTEGER),\\n)\\n\\nTable seasons (\\n seasons.year (INTEGER),\\n seasons.url (TEXT),\\n)\\n\\nTable status (\\n status.statusid (INTEGER),\\n status.status (TEXT),\\n)\\n\\n\\nPossible JOINs:\\n\\nconstructorResults.raceid = races.raceid\\nconstructorResults.constructorid = constructors.constructorid\\n\\nconstructorStandings.raceid = races.raceid\\nconstructorStandings.constructorid = constructors.constructorid\\n\\ndriverStandings.raceid = races.raceid\\ndriverStandings.driverid = drivers.driverid\\n\\nlapTimes.raceid = races.raceid\\nlapTimes.driverid = drivers.driverid\\n\\npitStops.raceid = races.raceid\\npitStops.driverid = drivers.driverid\\n\\nqualifying.raceid = races.raceid\\nqualifying.driverid = drivers.driverid\\nqualifying.constructorid = constructors.constructorid\\n\\nraces.circuitid = circuits.circuitid\\n\\nresults.raceid = races.raceid\\nresults.driverid = drivers.driverid\\nresults.constructorid = constructors.constructorid\\n\",\n \"Table Customers (\\n Customers.customer_id (INTEGER),\\n Customers.customer_name (VARCHAR(80)),\\n Customers.customer_details (VARCHAR(255)),\\n)\\n\\nTable Invoices (\\n Invoices.invoice_number (INTEGER),\\n Invoices.invoice_date (DATETIME),\\n Invoices.invoice_details (VARCHAR(255)),\\n)\\n\\nTable Order_Items (\\n Order_Items.order_item_id (INTEGER),\\n Order_Items.product_id (INTEGER),\\n Order_Items.order_id (INTEGER),\\n Order_Items.order_item_status (VARCHAR(10)),\\n Order_Items.order_item_details (VARCHAR(255)),\\n)\\n\\nTable Orders (\\n Orders.order_id (INTEGER),\\n Orders.customer_id (INTEGER),\\n Orders.order_status (VARCHAR(10)),\\n Orders.date_order_placed (DATETIME),\\n Orders.order_details (VARCHAR(255)),\\n)\\n\\nTable Products (\\n Products.product_id (INTEGER),\\n Products.product_name (VARCHAR(80)),\\n Products.product_details (VARCHAR(255)),\\n)\\n\\nTable Shipment_Items (\\n Shipment_Items.shipment_id (INTEGER),\\n Shipment_Items.order_item_id (INTEGER),\\n)\\n\\nTable Shipments (\\n Shipments.shipment_id (INTEGER),\\n Shipments.order_id (INTEGER),\\n Shipments.invoice_number (INTEGER),\\n Shipments.shipment_tracking_number (VARCHAR(80)),\\n Shipments.shipment_date (DATETIME),\\n Shipments.other_shipment_details (VARCHAR(255)),\\n)\\n\\n\\nPossible JOINs:\\n\\nOrder_Items.product_id = Products.product_id\\nOrder_Items.order_id = Orders.order_id\\n\\nOrders.customer_id = Customers.customer_id\\n\\nShipment_Items.shipment_id = Shipments.shipment_id\\nShipment_Items.order_item_id = Order_Items.order_item_id\\n\\nShipments.order_id = Orders.order_id\\nShipments.invoice_number = Invoices.invoice_number\\n\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"schema_llm_columns_min_ct\",\n \"properties\": {\n \"dtype\": \"category\",\n \"num_unique_values\": 147,\n \"samples\": [\n \"CREATE TABLE country (\\n country.country_id (INT),\\n country.name (TEXT),\\n country.population (INT),\\n country.area (INT),\\n country.languages (TEXT),\\n)\\n\\nCREATE TABLE roller_coaster (\\n roller_coaster.roller_coaster_id (INT),\\n roller_coaster.name (TEXT),\\n roller_coaster.park (TEXT),\\n roller_coaster.country_id (INT),\\n roller_coaster.length (REAL),\\n roller_coaster.height (REAL),\\n roller_coaster.speed (TEXT),\\n roller_coaster.opened (TEXT),\\n roller_coaster.status (TEXT),\\n)\\n\\n\\nPossible JOINs:\\n\\nroller_coaster.country_id = country.country_id\\n\",\n \"CREATE TABLE circuits (\\n circuits.circuitid (INTEGER),\\n circuits.circuitref (TEXT),\\n circuits.name (TEXT),\\n circuits.location (TEXT),\\n circuits.country (TEXT),\\n circuits.lat (REAL),\\n circuits.lng (REAL),\\n circuits.alt (TEXT),\\n circuits.url (TEXT),\\n)\\n\\nCREATE TABLE constructorResults (\\n constructorResults.constructorresultsid (INTEGER),\\n constructorResults.raceid (INTEGER),\\n constructorResults.constructorid (INTEGER),\\n constructorResults.points (REAL),\\n constructorResults.status (TEXT),\\n)\\n\\nCREATE TABLE constructorStandings (\\n constructorStandings.constructorstandingsid (INTEGER),\\n constructorStandings.raceid (INTEGER),\\n constructorStandings.constructorid (INTEGER),\\n constructorStandings.points (REAL),\\n constructorStandings.position (INTEGER),\\n constructorStandings.positiontext (TEXT),\\n constructorStandings.wins (INTEGER),\\n)\\n\\nCREATE TABLE constructors (\\n constructors.constructorid (INTEGER),\\n constructors.constructorref (TEXT),\\n constructors.name (TEXT),\\n constructors.nationality (TEXT),\\n constructors.url (TEXT),\\n)\\n\\nCREATE TABLE driverStandings (\\n driverStandings.driverstandingsid (INTEGER),\\n driverStandings.raceid (INTEGER),\\n driverStandings.driverid (INTEGER),\\n driverStandings.points (REAL),\\n driverStandings.position (INTEGER),\\n driverStandings.positiontext (TEXT),\\n driverStandings.wins (INTEGER),\\n)\\n\\nCREATE TABLE drivers (\\n drivers.driverid (INTEGER),\\n drivers.driverref (TEXT),\\n drivers.number (TEXT),\\n drivers.code (TEXT),\\n drivers.forename (TEXT),\\n drivers.surname (TEXT),\\n drivers.dob (TEXT),\\n drivers.nationality (TEXT),\\n drivers.url (TEXT),\\n)\\n\\nCREATE TABLE lapTimes (\\n lapTimes.raceid (INTEGER),\\n lapTimes.driverid (INTEGER),\\n lapTimes.lap (INTEGER),\\n lapTimes.position (INTEGER),\\n lapTimes.time (TEXT),\\n lapTimes.milliseconds (INTEGER),\\n)\\n\\nCREATE TABLE pitStops (\\n pitStops.raceid (INTEGER),\\n pitStops.driverid (INTEGER),\\n pitStops.stop (INTEGER),\\n pitStops.lap (INTEGER),\\n pitStops.time (TEXT),\\n pitStops.duration (TEXT),\\n pitStops.milliseconds (INTEGER),\\n)\\n\\nCREATE TABLE qualifying (\\n qualifying.qualifyid (INTEGER),\\n qualifying.raceid (INTEGER),\\n qualifying.driverid (INTEGER),\\n qualifying.constructorid (INTEGER),\\n qualifying.number (INTEGER),\\n qualifying.position (INTEGER),\\n qualifying.q1 (TEXT),\\n qualifying.q2 (TEXT),\\n qualifying.q3 (TEXT),\\n)\\n\\nCREATE TABLE races (\\n races.raceid (INTEGER),\\n races.year (INTEGER),\\n races.round (INTEGER),\\n races.circuitid (INTEGER),\\n races.name (TEXT),\\n races.date (TEXT),\\n races.time (TEXT),\\n races.url (TEXT),\\n)\\n\\nCREATE TABLE results (\\n results.resultid (INTEGER),\\n results.raceid (INTEGER),\\n results.driverid (INTEGER),\\n results.constructorid (INTEGER),\\n results.number (INTEGER),\\n results.grid (INTEGER),\\n results.position (TEXT),\\n results.positiontext (TEXT),\\n results.positionorder (INTEGER),\\n results.points (REAL),\\n results.laps (TEXT),\\n results.time (TEXT),\\n results.milliseconds (TEXT),\\n results.fastestlap (TEXT),\\n results.rank (TEXT),\\n results.fastestlaptime (TEXT),\\n results.fastestlapspeed (TEXT),\\n results.statusid (INTEGER),\\n)\\n\\nCREATE TABLE seasons (\\n seasons.year (INTEGER),\\n seasons.url (TEXT),\\n)\\n\\nCREATE TABLE status (\\n status.statusid (INTEGER),\\n status.status (TEXT),\\n)\\n\\n\\nPossible JOINs:\\n\\nconstructorResults.raceid = races.raceid\\nconstructorResults.constructorid = constructors.constructorid\\n\\nconstructorStandings.raceid = races.raceid\\nconstructorStandings.constructorid = constructors.constructorid\\n\\ndriverStandings.raceid = races.raceid\\ndriverStandings.driverid = drivers.driverid\\n\\nlapTimes.raceid = races.raceid\\nlapTimes.driverid = drivers.driverid\\n\\npitStops.raceid = races.raceid\\npitStops.driverid = drivers.driverid\\n\\nqualifying.raceid = races.raceid\\nqualifying.driverid = drivers.driverid\\nqualifying.constructorid = constructors.constructorid\\n\\nraces.circuitid = circuits.circuitid\\n\\nresults.raceid = races.raceid\\nresults.driverid = drivers.driverid\\nresults.constructorid = constructors.constructorid\\n\",\n \"CREATE TABLE Customers (\\n Customers.customer_id (INTEGER),\\n Customers.customer_name (VARCHAR(80)),\\n Customers.customer_details (VARCHAR(255)),\\n)\\n\\nCREATE TABLE Invoices (\\n Invoices.invoice_number (INTEGER),\\n Invoices.invoice_date (DATETIME),\\n Invoices.invoice_details (VARCHAR(255)),\\n)\\n\\nCREATE TABLE Order_Items (\\n Order_Items.order_item_id (INTEGER),\\n Order_Items.product_id (INTEGER),\\n Order_Items.order_id (INTEGER),\\n Order_Items.order_item_status (VARCHAR(10)),\\n Order_Items.order_item_details (VARCHAR(255)),\\n)\\n\\nCREATE TABLE Orders (\\n Orders.order_id (INTEGER),\\n Orders.customer_id (INTEGER),\\n Orders.order_status (VARCHAR(10)),\\n Orders.date_order_placed (DATETIME),\\n Orders.order_details (VARCHAR(255)),\\n)\\n\\nCREATE TABLE Products (\\n Products.product_id (INTEGER),\\n Products.product_name (VARCHAR(80)),\\n Products.product_details (VARCHAR(255)),\\n)\\n\\nCREATE TABLE Shipment_Items (\\n Shipment_Items.shipment_id (INTEGER),\\n Shipment_Items.order_item_id (INTEGER),\\n)\\n\\nCREATE TABLE Shipments (\\n Shipments.shipment_id (INTEGER),\\n Shipments.order_id (INTEGER),\\n Shipments.invoice_number (INTEGER),\\n Shipments.shipment_tracking_number (VARCHAR(80)),\\n Shipments.shipment_date (DATETIME),\\n Shipments.other_shipment_details (VARCHAR(255)),\\n)\\n\\n\\nPossible JOINs:\\n\\nOrder_Items.product_id = Products.product_id\\nOrder_Items.order_id = Orders.order_id\\n\\nOrders.customer_id = Customers.customer_id\\n\\nShipment_Items.shipment_id = Shipments.shipment_id\\nShipment_Items.order_item_id = Order_Items.order_item_id\\n\\nShipments.order_id = Orders.order_id\\nShipments.invoice_number = Invoices.invoice_number\\n\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"schema_llm_all_min\",\n \"properties\": {\n \"dtype\": \"category\",\n \"num_unique_values\": 147,\n \"samples\": [\n \"Table country (\\n country.country_id (INT),\\n country.name (TEXT),\\n country.population (INT),\\n country.area (INT),\\n country.languages (TEXT),\\n)\\n\\nTable roller_coaster (\\n roller_coaster.roller_coaster_id (INT),\\n roller_coaster.name (TEXT),\\n roller_coaster.park (TEXT),\\n roller_coaster.country_id (INT),\\n roller_coaster.length (REAL),\\n roller_coaster.height (REAL),\\n roller_coaster.speed (TEXT),\\n roller_coaster.opened (TEXT),\\n roller_coaster.status (TEXT),\\n)\\n\\n\\nPossible JOINs:\\n\\nroller_coaster.country_id = country.country_id\\n\",\n \"Table circuits (\\n circuits.circuitid (INTEGER),\\n circuits.circuitref (TEXT),\\n circuits.name (TEXT),\\n circuits.location (TEXT),\\n circuits.country (TEXT),\\n circuits.lat (REAL),\\n circuits.lng (REAL),\\n circuits.alt (TEXT),\\n circuits.url (TEXT),\\n)\\n\\nTable constructorresults (\\n constructorresults.constructorresultsid (INTEGER),\\n constructorresults.raceid (INTEGER),\\n constructorresults.constructorid (INTEGER),\\n constructorresults.points (REAL),\\n constructorresults.status (TEXT),\\n)\\n\\nTable constructorstandings (\\n constructorstandings.constructorstandingsid (INTEGER),\\n constructorstandings.raceid (INTEGER),\\n constructorstandings.constructorid (INTEGER),\\n constructorstandings.points (REAL),\\n constructorstandings.position (INTEGER),\\n constructorstandings.positiontext (TEXT),\\n constructorstandings.wins (INTEGER),\\n)\\n\\nTable constructors (\\n constructors.constructorid (INTEGER),\\n constructors.constructorref (TEXT),\\n constructors.name (TEXT),\\n constructors.nationality (TEXT),\\n constructors.url (TEXT),\\n)\\n\\nTable driverstandings (\\n driverstandings.driverstandingsid (INTEGER),\\n driverstandings.raceid (INTEGER),\\n driverstandings.driverid (INTEGER),\\n driverstandings.points (REAL),\\n driverstandings.position (INTEGER),\\n driverstandings.positiontext (TEXT),\\n driverstandings.wins (INTEGER),\\n)\\n\\nTable drivers (\\n drivers.driverid (INTEGER),\\n drivers.driverref (TEXT),\\n drivers.number (TEXT),\\n drivers.code (TEXT),\\n drivers.forename (TEXT),\\n drivers.surname (TEXT),\\n drivers.dob (TEXT),\\n drivers.nationality (TEXT),\\n drivers.url (TEXT),\\n)\\n\\nTable laptimes (\\n laptimes.raceid (INTEGER),\\n laptimes.driverid (INTEGER),\\n laptimes.lap (INTEGER),\\n laptimes.position (INTEGER),\\n laptimes.time (TEXT),\\n laptimes.milliseconds (INTEGER),\\n)\\n\\nTable pitstops (\\n pitstops.raceid (INTEGER),\\n pitstops.driverid (INTEGER),\\n pitstops.stop (INTEGER),\\n pitstops.lap (INTEGER),\\n pitstops.time (TEXT),\\n pitstops.duration (TEXT),\\n pitstops.milliseconds (INTEGER),\\n)\\n\\nTable qualifying (\\n qualifying.qualifyid (INTEGER),\\n qualifying.raceid (INTEGER),\\n qualifying.driverid (INTEGER),\\n qualifying.constructorid (INTEGER),\\n qualifying.number (INTEGER),\\n qualifying.position (INTEGER),\\n qualifying.q1 (TEXT),\\n qualifying.q2 (TEXT),\\n qualifying.q3 (TEXT),\\n)\\n\\nTable races (\\n races.raceid (INTEGER),\\n races.year (INTEGER),\\n races.round (INTEGER),\\n races.circuitid (INTEGER),\\n races.name (TEXT),\\n races.date (TEXT),\\n races.time (TEXT),\\n races.url (TEXT),\\n)\\n\\nTable results (\\n results.resultid (INTEGER),\\n results.raceid (INTEGER),\\n results.driverid (INTEGER),\\n results.constructorid (INTEGER),\\n results.number (INTEGER),\\n results.grid (INTEGER),\\n results.position (TEXT),\\n results.positiontext (TEXT),\\n results.positionorder (INTEGER),\\n results.points (REAL),\\n results.laps (TEXT),\\n results.time (TEXT),\\n results.milliseconds (TEXT),\\n results.fastestlap (TEXT),\\n results.rank (TEXT),\\n results.fastestlaptime (TEXT),\\n results.fastestlapspeed (TEXT),\\n results.statusid (INTEGER),\\n)\\n\\nTable seasons (\\n seasons.year (INTEGER),\\n seasons.url (TEXT),\\n)\\n\\nTable status (\\n status.statusid (INTEGER),\\n status.status (TEXT),\\n)\\n\\n\\nPossible JOINs:\\n\\nconstructorresults.raceid = races.raceid\\nconstructorresults.constructorid = constructors.constructorid\\n\\nconstructorstandings.raceid = races.raceid\\nconstructorstandings.constructorid = constructors.constructorid\\n\\ndriverstandings.raceid = races.raceid\\ndriverstandings.driverid = drivers.driverid\\n\\nlaptimes.raceid = races.raceid\\nlaptimes.driverid = drivers.driverid\\n\\npitstops.raceid = races.raceid\\npitstops.driverid = drivers.driverid\\n\\nqualifying.raceid = races.raceid\\nqualifying.driverid = drivers.driverid\\nqualifying.constructorid = constructors.constructorid\\n\\nraces.circuitid = circuits.circuitid\\n\\nresults.raceid = races.raceid\\nresults.driverid = drivers.driverid\\nresults.constructorid = constructors.constructorid\\n\",\n \"Table customers (\\n customers.customer_id (INTEGER),\\n customers.customer_name (VARCHAR(80)),\\n customers.customer_details (VARCHAR(255)),\\n)\\n\\nTable invoices (\\n invoices.invoice_number (INTEGER),\\n invoices.invoice_date (DATETIME),\\n invoices.invoice_details (VARCHAR(255)),\\n)\\n\\nTable order_items (\\n order_items.order_item_id (INTEGER),\\n order_items.product_id (INTEGER),\\n order_items.order_id (INTEGER),\\n order_items.order_item_status (VARCHAR(10)),\\n order_items.order_item_details (VARCHAR(255)),\\n)\\n\\nTable orders (\\n orders.order_id (INTEGER),\\n orders.customer_id (INTEGER),\\n orders.order_status (VARCHAR(10)),\\n orders.date_order_placed (DATETIME),\\n orders.order_details (VARCHAR(255)),\\n)\\n\\nTable products (\\n products.product_id (INTEGER),\\n products.product_name (VARCHAR(80)),\\n products.product_details (VARCHAR(255)),\\n)\\n\\nTable shipment_items (\\n shipment_items.shipment_id (INTEGER),\\n shipment_items.order_item_id (INTEGER),\\n)\\n\\nTable shipments (\\n shipments.shipment_id (INTEGER),\\n shipments.order_id (INTEGER),\\n shipments.invoice_number (INTEGER),\\n shipments.shipment_tracking_number (VARCHAR(80)),\\n shipments.shipment_date (DATETIME),\\n shipments.other_shipment_details (VARCHAR(255)),\\n)\\n\\n\\nPossible JOINs:\\n\\norder_items.product_id = products.product_id\\norder_items.order_id = orders.order_id\\n\\norders.customer_id = customers.customer_id\\n\\nshipment_items.shipment_id = shipments.shipment_id\\nshipment_items.order_item_id = order_items.order_item_id\\n\\nshipments.order_id = orders.order_id\\nshipments.invoice_number = invoices.invoice_number\\n\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"schema_llm_all_min_ct\",\n \"properties\": {\n \"dtype\": \"category\",\n \"num_unique_values\": 147,\n \"samples\": [\n \"CREATE TABLE country (\\n country.country_id (INT),\\n country.name (TEXT),\\n country.population (INT),\\n country.area (INT),\\n country.languages (TEXT),\\n)\\n\\nCREATE TABLE roller_coaster (\\n roller_coaster.roller_coaster_id (INT),\\n roller_coaster.name (TEXT),\\n roller_coaster.park (TEXT),\\n roller_coaster.country_id (INT),\\n roller_coaster.length (REAL),\\n roller_coaster.height (REAL),\\n roller_coaster.speed (TEXT),\\n roller_coaster.opened (TEXT),\\n roller_coaster.status (TEXT),\\n)\\n\\n\\nPossible JOINs:\\n\\nroller_coaster.country_id = country.country_id\\n\",\n \"CREATE TABLE circuits (\\n circuits.circuitid (INTEGER),\\n circuits.circuitref (TEXT),\\n circuits.name (TEXT),\\n circuits.location (TEXT),\\n circuits.country (TEXT),\\n circuits.lat (REAL),\\n circuits.lng (REAL),\\n circuits.alt (TEXT),\\n circuits.url (TEXT),\\n)\\n\\nCREATE TABLE constructorresults (\\n constructorresults.constructorresultsid (INTEGER),\\n constructorresults.raceid (INTEGER),\\n constructorresults.constructorid (INTEGER),\\n constructorresults.points (REAL),\\n constructorresults.status (TEXT),\\n)\\n\\nCREATE TABLE constructorstandings (\\n constructorstandings.constructorstandingsid (INTEGER),\\n constructorstandings.raceid (INTEGER),\\n constructorstandings.constructorid (INTEGER),\\n constructorstandings.points (REAL),\\n constructorstandings.position (INTEGER),\\n constructorstandings.positiontext (TEXT),\\n constructorstandings.wins (INTEGER),\\n)\\n\\nCREATE TABLE constructors (\\n constructors.constructorid (INTEGER),\\n constructors.constructorref (TEXT),\\n constructors.name (TEXT),\\n constructors.nationality (TEXT),\\n constructors.url (TEXT),\\n)\\n\\nCREATE TABLE driverstandings (\\n driverstandings.driverstandingsid (INTEGER),\\n driverstandings.raceid (INTEGER),\\n driverstandings.driverid (INTEGER),\\n driverstandings.points (REAL),\\n driverstandings.position (INTEGER),\\n driverstandings.positiontext (TEXT),\\n driverstandings.wins (INTEGER),\\n)\\n\\nCREATE TABLE drivers (\\n drivers.driverid (INTEGER),\\n drivers.driverref (TEXT),\\n drivers.number (TEXT),\\n drivers.code (TEXT),\\n drivers.forename (TEXT),\\n drivers.surname (TEXT),\\n drivers.dob (TEXT),\\n drivers.nationality (TEXT),\\n drivers.url (TEXT),\\n)\\n\\nCREATE TABLE laptimes (\\n laptimes.raceid (INTEGER),\\n laptimes.driverid (INTEGER),\\n laptimes.lap (INTEGER),\\n laptimes.position (INTEGER),\\n laptimes.time (TEXT),\\n laptimes.milliseconds (INTEGER),\\n)\\n\\nCREATE TABLE pitstops (\\n pitstops.raceid (INTEGER),\\n pitstops.driverid (INTEGER),\\n pitstops.stop (INTEGER),\\n pitstops.lap (INTEGER),\\n pitstops.time (TEXT),\\n pitstops.duration (TEXT),\\n pitstops.milliseconds (INTEGER),\\n)\\n\\nCREATE TABLE qualifying (\\n qualifying.qualifyid (INTEGER),\\n qualifying.raceid (INTEGER),\\n qualifying.driverid (INTEGER),\\n qualifying.constructorid (INTEGER),\\n qualifying.number (INTEGER),\\n qualifying.position (INTEGER),\\n qualifying.q1 (TEXT),\\n qualifying.q2 (TEXT),\\n qualifying.q3 (TEXT),\\n)\\n\\nCREATE TABLE races (\\n races.raceid (INTEGER),\\n races.year (INTEGER),\\n races.round (INTEGER),\\n races.circuitid (INTEGER),\\n races.name (TEXT),\\n races.date (TEXT),\\n races.time (TEXT),\\n races.url (TEXT),\\n)\\n\\nCREATE TABLE results (\\n results.resultid (INTEGER),\\n results.raceid (INTEGER),\\n results.driverid (INTEGER),\\n results.constructorid (INTEGER),\\n results.number (INTEGER),\\n results.grid (INTEGER),\\n results.position (TEXT),\\n results.positiontext (TEXT),\\n results.positionorder (INTEGER),\\n results.points (REAL),\\n results.laps (TEXT),\\n results.time (TEXT),\\n results.milliseconds (TEXT),\\n results.fastestlap (TEXT),\\n results.rank (TEXT),\\n results.fastestlaptime (TEXT),\\n results.fastestlapspeed (TEXT),\\n results.statusid (INTEGER),\\n)\\n\\nCREATE TABLE seasons (\\n seasons.year (INTEGER),\\n seasons.url (TEXT),\\n)\\n\\nCREATE TABLE status (\\n status.statusid (INTEGER),\\n status.status (TEXT),\\n)\\n\\n\\nPossible JOINs:\\n\\nconstructorresults.raceid = races.raceid\\nconstructorresults.constructorid = constructors.constructorid\\n\\nconstructorstandings.raceid = races.raceid\\nconstructorstandings.constructorid = constructors.constructorid\\n\\ndriverstandings.raceid = races.raceid\\ndriverstandings.driverid = drivers.driverid\\n\\nlaptimes.raceid = races.raceid\\nlaptimes.driverid = drivers.driverid\\n\\npitstops.raceid = races.raceid\\npitstops.driverid = drivers.driverid\\n\\nqualifying.raceid = races.raceid\\nqualifying.driverid = drivers.driverid\\nqualifying.constructorid = constructors.constructorid\\n\\nraces.circuitid = circuits.circuitid\\n\\nresults.raceid = races.raceid\\nresults.driverid = drivers.driverid\\nresults.constructorid = constructors.constructorid\\n\",\n \"CREATE TABLE customers (\\n customers.customer_id (INTEGER),\\n customers.customer_name (VARCHAR(80)),\\n customers.customer_details (VARCHAR(255)),\\n)\\n\\nCREATE TABLE invoices (\\n invoices.invoice_number (INTEGER),\\n invoices.invoice_date (DATETIME),\\n invoices.invoice_details (VARCHAR(255)),\\n)\\n\\nCREATE TABLE order_items (\\n order_items.order_item_id (INTEGER),\\n order_items.product_id (INTEGER),\\n order_items.order_id (INTEGER),\\n order_items.order_item_status (VARCHAR(10)),\\n order_items.order_item_details (VARCHAR(255)),\\n)\\n\\nCREATE TABLE orders (\\n orders.order_id (INTEGER),\\n orders.customer_id (INTEGER),\\n orders.order_status (VARCHAR(10)),\\n orders.date_order_placed (DATETIME),\\n orders.order_details (VARCHAR(255)),\\n)\\n\\nCREATE TABLE products (\\n products.product_id (INTEGER),\\n products.product_name (VARCHAR(80)),\\n products.product_details (VARCHAR(255)),\\n)\\n\\nCREATE TABLE shipment_items (\\n shipment_items.shipment_id (INTEGER),\\n shipment_items.order_item_id (INTEGER),\\n)\\n\\nCREATE TABLE shipments (\\n shipments.shipment_id (INTEGER),\\n shipments.order_id (INTEGER),\\n shipments.invoice_number (INTEGER),\\n shipments.shipment_tracking_number (VARCHAR(80)),\\n shipments.shipment_date (DATETIME),\\n shipments.other_shipment_details (VARCHAR(255)),\\n)\\n\\n\\nPossible JOINs:\\n\\norder_items.product_id = products.product_id\\norder_items.order_id = orders.order_id\\n\\norders.customer_id = customers.customer_id\\n\\nshipment_items.shipment_id = shipments.shipment_id\\nshipment_items.order_item_id = order_items.order_item_id\\n\\nshipments.order_id = orders.order_id\\nshipments.invoice_number = invoices.invoice_number\\n\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"schema_dict\",\n \"properties\": {\n \"dtype\": \"category\",\n \"num_unique_values\": 146,\n \"samples\": [\n \"{\\n 'company': ['Company_ID', 'Rank', 'Company', 'Headquarters', 'Main_Industry', 'Sales_billion', 'Profits_billion', 'Assets_billion', 'Market_Value'],\\n 'gas_station': ['Station_ID', 'Open_Year', 'Location', 'Manager_Name', 'Vice_Manager_Name', 'Representative_Name'],\\n 'station_company': ['Station_ID', 'Company_ID', 'Rank_of_the_Year']\\n}\",\n \"{\\n 'Premises': ['premise_id', 'premises_type', 'premise_details'],\\n 'Products': ['product_id', 'product_category', 'product_name'],\\n 'Customers': ['customer_id', 'payment_method', 'customer_name', 'customer_phone', 'customer_email', 'customer_address', 'customer_login', 'customer_password'],\\n 'Mailshot_Campaigns': ['mailshot_id', 'product_category', 'mailshot_name', 'mailshot_start_date', 'mailshot_end_date'],\\n 'Customer_Addresses': ['customer_id', 'premise_id', 'date_address_from', 'address_type_code', 'date_address_to'],\\n 'Customer_Orders': ['order_id', 'customer_id', 'order_status_code', 'shipping_method_code', 'order_placed_datetime', 'order_delivered_datetime', 'order_shipping_charges'],\\n 'Mailshot_Customers': ['mailshot_id', 'customer_id', 'outcome_code', 'mailshot_customer_date'],\\n 'Order_Items': ['item_id', 'order_item_status_code', 'order_id', 'product_id', 'item_status_code', 'item_delivered_datetime', 'item_order_quantity']\\n}\",\n \"{\\n 'member': ['Member_ID', 'Name', 'Nationality', 'Role'],\\n 'performance': ['Performance_ID', 'Date', 'Host', 'Location', 'Attendance'],\\n 'member_attendance': ['Member_ID', 'Performance_ID', 'Num_of_Pieces']\\n}\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"selector_correct\",\n \"properties\": {\n \"dtype\": \"category\",\n \"num_unique_values\": 3373,\n \"samples\": [\n \"{\\n 'user': ['uid', 'user_id', 'name'],\\n 'review': ['rid', 'user_id', 'rating']\\n}\",\n \"{\\n 'Documents': ['document_id', 'document_status_code', 'document_type_code']\\n}\",\n \"{\\n 'state': ['state_name', 'population'],\\n 'highlow': ['state_name', 'highest_point']\\n}\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"schema_llm_t\",\n \"properties\": {\n \"dtype\": \"category\",\n \"num_unique_values\": 147,\n \"samples\": [\n \"TABLE country (\\n country.Country_ID (INT),\\n country.Name (TEXT),\\n country.Population (INT),\\n country.Area (INT),\\n country.Languages (TEXT),\\n)\\n\\nTABLE roller_coaster (\\n roller_coaster.Roller_Coaster_ID (INT),\\n roller_coaster.Name (TEXT),\\n roller_coaster.Park (TEXT),\\n roller_coaster.Country_ID (INT),\\n roller_coaster.Length (REAL),\\n roller_coaster.Height (REAL),\\n roller_coaster.Speed (TEXT),\\n roller_coaster.Opened (TEXT),\\n roller_coaster.Status (TEXT),\\n)\\n\\n\\nPossible JOINs:\\n\\nroller_coaster.Country_ID = country.Country_ID\\n\",\n \"TABLE circuits (\\n circuits.circuitId (INTEGER),\\n circuits.circuitRef (TEXT),\\n circuits.name (TEXT),\\n circuits.location (TEXT),\\n circuits.country (TEXT),\\n circuits.lat (REAL),\\n circuits.lng (REAL),\\n circuits.alt (TEXT),\\n circuits.url (TEXT),\\n)\\n\\nTABLE constructorResults (\\n constructorResults.constructorResultsId (INTEGER),\\n constructorResults.raceId (INTEGER),\\n constructorResults.constructorId (INTEGER),\\n constructorResults.points (REAL),\\n constructorResults.status (TEXT),\\n)\\n\\nTABLE constructorStandings (\\n constructorStandings.constructorStandingsId (INTEGER),\\n constructorStandings.raceId (INTEGER),\\n constructorStandings.constructorId (INTEGER),\\n constructorStandings.points (REAL),\\n constructorStandings.position (INTEGER),\\n constructorStandings.positionText (TEXT),\\n constructorStandings.wins (INTEGER),\\n)\\n\\nTABLE constructors (\\n constructors.constructorId (INTEGER),\\n constructors.constructorRef (TEXT),\\n constructors.name (TEXT),\\n constructors.nationality (TEXT),\\n constructors.url (TEXT),\\n)\\n\\nTABLE driverStandings (\\n driverStandings.driverStandingsId (INTEGER),\\n driverStandings.raceId (INTEGER),\\n driverStandings.driverId (INTEGER),\\n driverStandings.points (REAL),\\n driverStandings.position (INTEGER),\\n driverStandings.positionText (TEXT),\\n driverStandings.wins (INTEGER),\\n)\\n\\nTABLE drivers (\\n drivers.driverId (INTEGER),\\n drivers.driverRef (TEXT),\\n drivers.number (TEXT),\\n drivers.code (TEXT),\\n drivers.forename (TEXT),\\n drivers.surname (TEXT),\\n drivers.dob (TEXT),\\n drivers.nationality (TEXT),\\n drivers.url (TEXT),\\n)\\n\\nTABLE lapTimes (\\n lapTimes.raceId (INTEGER),\\n lapTimes.driverId (INTEGER),\\n lapTimes.lap (INTEGER),\\n lapTimes.position (INTEGER),\\n lapTimes.time (TEXT),\\n lapTimes.milliseconds (INTEGER),\\n)\\n\\nTABLE pitStops (\\n pitStops.raceId (INTEGER),\\n pitStops.driverId (INTEGER),\\n pitStops.stop (INTEGER),\\n pitStops.lap (INTEGER),\\n pitStops.time (TEXT),\\n pitStops.duration (TEXT),\\n pitStops.milliseconds (INTEGER),\\n)\\n\\nTABLE qualifying (\\n qualifying.qualifyId (INTEGER),\\n qualifying.raceId (INTEGER),\\n qualifying.driverId (INTEGER),\\n qualifying.constructorId (INTEGER),\\n qualifying.number (INTEGER),\\n qualifying.position (INTEGER),\\n qualifying.q1 (TEXT),\\n qualifying.q2 (TEXT),\\n qualifying.q3 (TEXT),\\n)\\n\\nTABLE races (\\n races.raceId (INTEGER),\\n races.year (INTEGER),\\n races.round (INTEGER),\\n races.circuitId (INTEGER),\\n races.name (TEXT),\\n races.date (TEXT),\\n races.time (TEXT),\\n races.url (TEXT),\\n)\\n\\nTABLE results (\\n results.resultId (INTEGER),\\n results.raceId (INTEGER),\\n results.driverId (INTEGER),\\n results.constructorId (INTEGER),\\n results.number (INTEGER),\\n results.grid (INTEGER),\\n results.position (TEXT),\\n results.positionText (TEXT),\\n results.positionOrder (INTEGER),\\n results.points (REAL),\\n results.laps (TEXT),\\n results.time (TEXT),\\n results.milliseconds (TEXT),\\n results.fastestLap (TEXT),\\n results.rank (TEXT),\\n results.fastestLapTime (TEXT),\\n results.fastestLapSpeed (TEXT),\\n results.statusId (INTEGER),\\n)\\n\\nTABLE seasons (\\n seasons.year (INTEGER),\\n seasons.url (TEXT),\\n)\\n\\nTABLE status (\\n status.statusId (INTEGER),\\n status.status (TEXT),\\n)\\n\\n\\nPossible JOINs:\\n\\nconstructorResults.raceId = races.raceId\\nconstructorResults.constructorId = constructors.constructorId\\n\\nconstructorStandings.raceId = races.raceId\\nconstructorStandings.constructorId = constructors.constructorId\\n\\ndriverStandings.raceId = races.raceId\\ndriverStandings.driverId = drivers.driverId\\n\\nlapTimes.raceId = races.raceId\\nlapTimes.driverId = drivers.driverId\\n\\npitStops.raceId = races.raceId\\npitStops.driverId = drivers.driverId\\n\\nqualifying.raceId = races.raceId\\nqualifying.driverId = drivers.driverId\\nqualifying.constructorId = constructors.constructorId\\n\\nraces.circuitId = circuits.circuitId\\n\\nresults.raceId = races.raceId\\nresults.driverId = drivers.driverId\\nresults.constructorId = constructors.constructorId\\n\",\n \"TABLE Customers (\\n Customers.customer_id (INTEGER),\\n Customers.customer_name (VARCHAR(80)),\\n Customers.customer_details (VARCHAR(255)),\\n)\\n\\nTABLE Invoices (\\n Invoices.invoice_number (INTEGER),\\n Invoices.invoice_date (DATETIME),\\n Invoices.invoice_details (VARCHAR(255)),\\n)\\n\\nTABLE Order_Items (\\n Order_Items.order_item_id (INTEGER),\\n Order_Items.product_id (INTEGER),\\n Order_Items.order_id (INTEGER),\\n Order_Items.order_item_status (VARCHAR(10)),\\n Order_Items.order_item_details (VARCHAR(255)),\\n)\\n\\nTABLE Orders (\\n Orders.order_id (INTEGER),\\n Orders.customer_id (INTEGER),\\n Orders.order_status (VARCHAR(10)),\\n Orders.date_order_placed (DATETIME),\\n Orders.order_details (VARCHAR(255)),\\n)\\n\\nTABLE Products (\\n Products.product_id (INTEGER),\\n Products.product_name (VARCHAR(80)),\\n Products.product_details (VARCHAR(255)),\\n)\\n\\nTABLE Shipment_Items (\\n Shipment_Items.shipment_id (INTEGER),\\n Shipment_Items.order_item_id (INTEGER),\\n)\\n\\nTABLE Shipments (\\n Shipments.shipment_id (INTEGER),\\n Shipments.order_id (INTEGER),\\n Shipments.invoice_number (INTEGER),\\n Shipments.shipment_tracking_number (VARCHAR(80)),\\n Shipments.shipment_date (DATETIME),\\n Shipments.other_shipment_details (VARCHAR(255)),\\n)\\n\\n\\nPossible JOINs:\\n\\nOrder_Items.product_id = Products.product_id\\nOrder_Items.order_id = Orders.order_id\\n\\nOrders.customer_id = Customers.customer_id\\n\\nShipment_Items.shipment_id = Shipments.shipment_id\\nShipment_Items.order_item_id = Order_Items.order_item_id\\n\\nShipments.order_id = Orders.order_id\\nShipments.invoice_number = Invoices.invoice_number\\n\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"schema_llm_columns_min_t\",\n \"properties\": {\n \"dtype\": \"category\",\n \"num_unique_values\": 147,\n \"samples\": [\n \"TABLE country (\\n country.country_id (INT),\\n country.name (TEXT),\\n country.population (INT),\\n country.area (INT),\\n country.languages (TEXT),\\n)\\n\\nTABLE roller_coaster (\\n roller_coaster.roller_coaster_id (INT),\\n roller_coaster.name (TEXT),\\n roller_coaster.park (TEXT),\\n roller_coaster.country_id (INT),\\n roller_coaster.length (REAL),\\n roller_coaster.height (REAL),\\n roller_coaster.speed (TEXT),\\n roller_coaster.opened (TEXT),\\n roller_coaster.status (TEXT),\\n)\\n\\n\\nPossible JOINs:\\n\\nroller_coaster.country_id = country.country_id\\n\",\n \"TABLE circuits (\\n circuits.circuitid (INTEGER),\\n circuits.circuitref (TEXT),\\n circuits.name (TEXT),\\n circuits.location (TEXT),\\n circuits.country (TEXT),\\n circuits.lat (REAL),\\n circuits.lng (REAL),\\n circuits.alt (TEXT),\\n circuits.url (TEXT),\\n)\\n\\nTABLE constructorResults (\\n constructorResults.constructorresultsid (INTEGER),\\n constructorResults.raceid (INTEGER),\\n constructorResults.constructorid (INTEGER),\\n constructorResults.points (REAL),\\n constructorResults.status (TEXT),\\n)\\n\\nTABLE constructorStandings (\\n constructorStandings.constructorstandingsid (INTEGER),\\n constructorStandings.raceid (INTEGER),\\n constructorStandings.constructorid (INTEGER),\\n constructorStandings.points (REAL),\\n constructorStandings.position (INTEGER),\\n constructorStandings.positiontext (TEXT),\\n constructorStandings.wins (INTEGER),\\n)\\n\\nTABLE constructors (\\n constructors.constructorid (INTEGER),\\n constructors.constructorref (TEXT),\\n constructors.name (TEXT),\\n constructors.nationality (TEXT),\\n constructors.url (TEXT),\\n)\\n\\nTABLE driverStandings (\\n driverStandings.driverstandingsid (INTEGER),\\n driverStandings.raceid (INTEGER),\\n driverStandings.driverid (INTEGER),\\n driverStandings.points (REAL),\\n driverStandings.position (INTEGER),\\n driverStandings.positiontext (TEXT),\\n driverStandings.wins (INTEGER),\\n)\\n\\nTABLE drivers (\\n drivers.driverid (INTEGER),\\n drivers.driverref (TEXT),\\n drivers.number (TEXT),\\n drivers.code (TEXT),\\n drivers.forename (TEXT),\\n drivers.surname (TEXT),\\n drivers.dob (TEXT),\\n drivers.nationality (TEXT),\\n drivers.url (TEXT),\\n)\\n\\nTABLE lapTimes (\\n lapTimes.raceid (INTEGER),\\n lapTimes.driverid (INTEGER),\\n lapTimes.lap (INTEGER),\\n lapTimes.position (INTEGER),\\n lapTimes.time (TEXT),\\n lapTimes.milliseconds (INTEGER),\\n)\\n\\nTABLE pitStops (\\n pitStops.raceid (INTEGER),\\n pitStops.driverid (INTEGER),\\n pitStops.stop (INTEGER),\\n pitStops.lap (INTEGER),\\n pitStops.time (TEXT),\\n pitStops.duration (TEXT),\\n pitStops.milliseconds (INTEGER),\\n)\\n\\nTABLE qualifying (\\n qualifying.qualifyid (INTEGER),\\n qualifying.raceid (INTEGER),\\n qualifying.driverid (INTEGER),\\n qualifying.constructorid (INTEGER),\\n qualifying.number (INTEGER),\\n qualifying.position (INTEGER),\\n qualifying.q1 (TEXT),\\n qualifying.q2 (TEXT),\\n qualifying.q3 (TEXT),\\n)\\n\\nTABLE races (\\n races.raceid (INTEGER),\\n races.year (INTEGER),\\n races.round (INTEGER),\\n races.circuitid (INTEGER),\\n races.name (TEXT),\\n races.date (TEXT),\\n races.time (TEXT),\\n races.url (TEXT),\\n)\\n\\nTABLE results (\\n results.resultid (INTEGER),\\n results.raceid (INTEGER),\\n results.driverid (INTEGER),\\n results.constructorid (INTEGER),\\n results.number (INTEGER),\\n results.grid (INTEGER),\\n results.position (TEXT),\\n results.positiontext (TEXT),\\n results.positionorder (INTEGER),\\n results.points (REAL),\\n results.laps (TEXT),\\n results.time (TEXT),\\n results.milliseconds (TEXT),\\n results.fastestlap (TEXT),\\n results.rank (TEXT),\\n results.fastestlaptime (TEXT),\\n results.fastestlapspeed (TEXT),\\n results.statusid (INTEGER),\\n)\\n\\nTABLE seasons (\\n seasons.year (INTEGER),\\n seasons.url (TEXT),\\n)\\n\\nTABLE status (\\n status.statusid (INTEGER),\\n status.status (TEXT),\\n)\\n\\n\\nPossible JOINs:\\n\\nconstructorResults.raceid = races.raceid\\nconstructorResults.constructorid = constructors.constructorid\\n\\nconstructorStandings.raceid = races.raceid\\nconstructorStandings.constructorid = constructors.constructorid\\n\\ndriverStandings.raceid = races.raceid\\ndriverStandings.driverid = drivers.driverid\\n\\nlapTimes.raceid = races.raceid\\nlapTimes.driverid = drivers.driverid\\n\\npitStops.raceid = races.raceid\\npitStops.driverid = drivers.driverid\\n\\nqualifying.raceid = races.raceid\\nqualifying.driverid = drivers.driverid\\nqualifying.constructorid = constructors.constructorid\\n\\nraces.circuitid = circuits.circuitid\\n\\nresults.raceid = races.raceid\\nresults.driverid = drivers.driverid\\nresults.constructorid = constructors.constructorid\\n\",\n \"TABLE Customers (\\n Customers.customer_id (INTEGER),\\n Customers.customer_name (VARCHAR(80)),\\n Customers.customer_details (VARCHAR(255)),\\n)\\n\\nTABLE Invoices (\\n Invoices.invoice_number (INTEGER),\\n Invoices.invoice_date (DATETIME),\\n Invoices.invoice_details (VARCHAR(255)),\\n)\\n\\nTABLE Order_Items (\\n Order_Items.order_item_id (INTEGER),\\n Order_Items.product_id (INTEGER),\\n Order_Items.order_id (INTEGER),\\n Order_Items.order_item_status (VARCHAR(10)),\\n Order_Items.order_item_details (VARCHAR(255)),\\n)\\n\\nTABLE Orders (\\n Orders.order_id (INTEGER),\\n Orders.customer_id (INTEGER),\\n Orders.order_status (VARCHAR(10)),\\n Orders.date_order_placed (DATETIME),\\n Orders.order_details (VARCHAR(255)),\\n)\\n\\nTABLE Products (\\n Products.product_id (INTEGER),\\n Products.product_name (VARCHAR(80)),\\n Products.product_details (VARCHAR(255)),\\n)\\n\\nTABLE Shipment_Items (\\n Shipment_Items.shipment_id (INTEGER),\\n Shipment_Items.order_item_id (INTEGER),\\n)\\n\\nTABLE Shipments (\\n Shipments.shipment_id (INTEGER),\\n Shipments.order_id (INTEGER),\\n Shipments.invoice_number (INTEGER),\\n Shipments.shipment_tracking_number (VARCHAR(80)),\\n Shipments.shipment_date (DATETIME),\\n Shipments.other_shipment_details (VARCHAR(255)),\\n)\\n\\n\\nPossible JOINs:\\n\\nOrder_Items.product_id = Products.product_id\\nOrder_Items.order_id = Orders.order_id\\n\\nOrders.customer_id = Customers.customer_id\\n\\nShipment_Items.shipment_id = Shipments.shipment_id\\nShipment_Items.order_item_id = Order_Items.order_item_id\\n\\nShipments.order_id = Orders.order_id\\nShipments.invoice_number = Invoices.invoice_number\\n\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"schema_llm_all_min_t\",\n \"properties\": {\n \"dtype\": \"category\",\n \"num_unique_values\": 147,\n \"samples\": [\n \"TABLE country (\\n country.country_id (INT),\\n country.name (TEXT),\\n country.population (INT),\\n country.area (INT),\\n country.languages (TEXT),\\n)\\n\\nTABLE roller_coaster (\\n roller_coaster.roller_coaster_id (INT),\\n roller_coaster.name (TEXT),\\n roller_coaster.park (TEXT),\\n roller_coaster.country_id (INT),\\n roller_coaster.length (REAL),\\n roller_coaster.height (REAL),\\n roller_coaster.speed (TEXT),\\n roller_coaster.opened (TEXT),\\n roller_coaster.status (TEXT),\\n)\\n\\n\\nPossible JOINs:\\n\\nroller_coaster.country_id = country.country_id\\n\",\n \"TABLE circuits (\\n circuits.circuitid (INTEGER),\\n circuits.circuitref (TEXT),\\n circuits.name (TEXT),\\n circuits.location (TEXT),\\n circuits.country (TEXT),\\n circuits.lat (REAL),\\n circuits.lng (REAL),\\n circuits.alt (TEXT),\\n circuits.url (TEXT),\\n)\\n\\nTABLE constructorresults (\\n constructorresults.constructorresultsid (INTEGER),\\n constructorresults.raceid (INTEGER),\\n constructorresults.constructorid (INTEGER),\\n constructorresults.points (REAL),\\n constructorresults.status (TEXT),\\n)\\n\\nTABLE constructorstandings (\\n constructorstandings.constructorstandingsid (INTEGER),\\n constructorstandings.raceid (INTEGER),\\n constructorstandings.constructorid (INTEGER),\\n constructorstandings.points (REAL),\\n constructorstandings.position (INTEGER),\\n constructorstandings.positiontext (TEXT),\\n constructorstandings.wins (INTEGER),\\n)\\n\\nTABLE constructors (\\n constructors.constructorid (INTEGER),\\n constructors.constructorref (TEXT),\\n constructors.name (TEXT),\\n constructors.nationality (TEXT),\\n constructors.url (TEXT),\\n)\\n\\nTABLE driverstandings (\\n driverstandings.driverstandingsid (INTEGER),\\n driverstandings.raceid (INTEGER),\\n driverstandings.driverid (INTEGER),\\n driverstandings.points (REAL),\\n driverstandings.position (INTEGER),\\n driverstandings.positiontext (TEXT),\\n driverstandings.wins (INTEGER),\\n)\\n\\nTABLE drivers (\\n drivers.driverid (INTEGER),\\n drivers.driverref (TEXT),\\n drivers.number (TEXT),\\n drivers.code (TEXT),\\n drivers.forename (TEXT),\\n drivers.surname (TEXT),\\n drivers.dob (TEXT),\\n drivers.nationality (TEXT),\\n drivers.url (TEXT),\\n)\\n\\nTABLE laptimes (\\n laptimes.raceid (INTEGER),\\n laptimes.driverid (INTEGER),\\n laptimes.lap (INTEGER),\\n laptimes.position (INTEGER),\\n laptimes.time (TEXT),\\n laptimes.milliseconds (INTEGER),\\n)\\n\\nTABLE pitstops (\\n pitstops.raceid (INTEGER),\\n pitstops.driverid (INTEGER),\\n pitstops.stop (INTEGER),\\n pitstops.lap (INTEGER),\\n pitstops.time (TEXT),\\n pitstops.duration (TEXT),\\n pitstops.milliseconds (INTEGER),\\n)\\n\\nTABLE qualifying (\\n qualifying.qualifyid (INTEGER),\\n qualifying.raceid (INTEGER),\\n qualifying.driverid (INTEGER),\\n qualifying.constructorid (INTEGER),\\n qualifying.number (INTEGER),\\n qualifying.position (INTEGER),\\n qualifying.q1 (TEXT),\\n qualifying.q2 (TEXT),\\n qualifying.q3 (TEXT),\\n)\\n\\nTABLE races (\\n races.raceid (INTEGER),\\n races.year (INTEGER),\\n races.round (INTEGER),\\n races.circuitid (INTEGER),\\n races.name (TEXT),\\n races.date (TEXT),\\n races.time (TEXT),\\n races.url (TEXT),\\n)\\n\\nTABLE results (\\n results.resultid (INTEGER),\\n results.raceid (INTEGER),\\n results.driverid (INTEGER),\\n results.constructorid (INTEGER),\\n results.number (INTEGER),\\n results.grid (INTEGER),\\n results.position (TEXT),\\n results.positiontext (TEXT),\\n results.positionorder (INTEGER),\\n results.points (REAL),\\n results.laps (TEXT),\\n results.time (TEXT),\\n results.milliseconds (TEXT),\\n results.fastestlap (TEXT),\\n results.rank (TEXT),\\n results.fastestlaptime (TEXT),\\n results.fastestlapspeed (TEXT),\\n results.statusid (INTEGER),\\n)\\n\\nTABLE seasons (\\n seasons.year (INTEGER),\\n seasons.url (TEXT),\\n)\\n\\nTABLE status (\\n status.statusid (INTEGER),\\n status.status (TEXT),\\n)\\n\\n\\nPossible JOINs:\\n\\nconstructorresults.raceid = races.raceid\\nconstructorresults.constructorid = constructors.constructorid\\n\\nconstructorstandings.raceid = races.raceid\\nconstructorstandings.constructorid = constructors.constructorid\\n\\ndriverstandings.raceid = races.raceid\\ndriverstandings.driverid = drivers.driverid\\n\\nlaptimes.raceid = races.raceid\\nlaptimes.driverid = drivers.driverid\\n\\npitstops.raceid = races.raceid\\npitstops.driverid = drivers.driverid\\n\\nqualifying.raceid = races.raceid\\nqualifying.driverid = drivers.driverid\\nqualifying.constructorid = constructors.constructorid\\n\\nraces.circuitid = circuits.circuitid\\n\\nresults.raceid = races.raceid\\nresults.driverid = drivers.driverid\\nresults.constructorid = constructors.constructorid\\n\",\n \"TABLE customers (\\n customers.customer_id (INTEGER),\\n customers.customer_name (VARCHAR(80)),\\n customers.customer_details (VARCHAR(255)),\\n)\\n\\nTABLE invoices (\\n invoices.invoice_number (INTEGER),\\n invoices.invoice_date (DATETIME),\\n invoices.invoice_details (VARCHAR(255)),\\n)\\n\\nTABLE order_items (\\n order_items.order_item_id (INTEGER),\\n order_items.product_id (INTEGER),\\n order_items.order_id (INTEGER),\\n order_items.order_item_status (VARCHAR(10)),\\n order_items.order_item_details (VARCHAR(255)),\\n)\\n\\nTABLE orders (\\n orders.order_id (INTEGER),\\n orders.customer_id (INTEGER),\\n orders.order_status (VARCHAR(10)),\\n orders.date_order_placed (DATETIME),\\n orders.order_details (VARCHAR(255)),\\n)\\n\\nTABLE products (\\n products.product_id (INTEGER),\\n products.product_name (VARCHAR(80)),\\n products.product_details (VARCHAR(255)),\\n)\\n\\nTABLE shipment_items (\\n shipment_items.shipment_id (INTEGER),\\n shipment_items.order_item_id (INTEGER),\\n)\\n\\nTABLE shipments (\\n shipments.shipment_id (INTEGER),\\n shipments.order_id (INTEGER),\\n shipments.invoice_number (INTEGER),\\n shipments.shipment_tracking_number (VARCHAR(80)),\\n shipments.shipment_date (DATETIME),\\n shipments.other_shipment_details (VARCHAR(255)),\\n)\\n\\n\\nPossible JOINs:\\n\\norder_items.product_id = products.product_id\\norder_items.order_id = orders.order_id\\n\\norders.customer_id = customers.customer_id\\n\\nshipment_items.shipment_id = shipments.shipment_id\\nshipment_items.order_item_id = order_items.order_item_id\\n\\nshipments.order_id = orders.order_id\\nshipments.invoice_number = invoices.invoice_number\\n\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"text\",\n \"properties\": {\n \"dtype\": \"string\",\n \"num_unique_values\": 8647,\n \"samples\": [\n \"<|begin_of_text|><|start_header_id|>system<|end_header_id|>\\n\\nCutting Knowledge Date: December 2023\\nToday Date: 06 Oct 2024\\n\\n<|eot_id|><|start_header_id|>user<|end_header_id|>\\n\\n# System:\\nGiven a user question and the schema of a database, your task is to generate an JSON with the the names of tables and columns of the schema that the question is referring to.\\n\\n# Schema:\\n```sql\\nTABLE event (\\n event.ID (INT),\\n event.Name (TEXT),\\n event.Stadium_ID (INT),\\n event.Year (TEXT),\\n)\\n\\nTABLE record (\\n record.ID (INT),\\n record.Result (TEXT),\\n record.Swimmer_ID (INT),\\n record.Event_ID (INT),\\n)\\n\\nTABLE stadium (\\n stadium.ID (INT),\\n stadium.name (TEXT),\\n stadium.Capacity (INT),\\n stadium.City (TEXT),\\n stadium.Country (TEXT),\\n stadium.Opening_year (INT),\\n)\\n\\nTABLE swimmer (\\n swimmer.ID (INT),\\n swimmer.name (TEXT),\\n swimmer.Nationality (TEXT),\\n swimmer.meter_100 (REAL),\\n swimmer.meter_200 (TEXT),\\n swimmer.meter_300 (TEXT),\\n swimmer.meter_400 (TEXT),\\n swimmer.meter_500 (TEXT),\\n swimmer.meter_600 (TEXT),\\n swimmer.meter_700 (TEXT),\\n swimmer.Time (TEXT),\\n)\\n\\n\\nPossible JOINs:\\n\\nevent.Stadium_ID = stadium.ID\\n\\nrecord.Swimmer_ID = swimmer.ID\\nrecord.Event_ID = event.ID\\n\\n```\\n\\n# Question: Which countries do not have a stadium that was opened after 2006?<|eot_id|><|start_header_id|>assistant<|end_header_id|>\\n\\n```json\\n{ 'stadium': ['ID', 'Country', 'Opening_year'] }\\n```<|eot_id|>\",\n \"<|begin_of_text|><|start_header_id|>system<|end_header_id|>\\n\\nCutting Knowledge Date: December 2023\\nToday Date: 06 Oct 2024\\n\\n<|eot_id|><|start_header_id|>user<|end_header_id|>\\n\\n# System:\\nGiven a user question and the schema of a database, your task is to generate an JSON with the the names of tables and columns of the schema that the question is referring to.\\n\\n# Schema:\\n```sql\\nTABLE film (\\n film.Film_ID (INT),\\n film.Title (TEXT),\\n film.Studio (TEXT),\\n film.Director (TEXT),\\n film.Gross_in_dollar (INT),\\n)\\n\\nTABLE film_market_estimation (\\n film_market_estimation.Estimation_ID (INT),\\n film_market_estimation.Low_Estimate (REAL),\\n film_market_estimation.High_Estimate (REAL),\\n film_market_estimation.Film_ID (INT),\\n film_market_estimation.Type (TEXT),\\n film_market_estimation.Market_ID (INT),\\n film_market_estimation.Year (INT),\\n)\\n\\nTABLE market (\\n market.Market_ID (INT),\\n market.Country (TEXT),\\n market.Number_cities (INT),\\n)\\n\\n\\nPossible JOINs:\\n\\nfilm_market_estimation.Film_ID = film.Film_ID\\nfilm_market_estimation.Market_ID = market.Market_ID\\n\\n```\\n\\n# Question: How many film are there?<|eot_id|><|start_header_id|>assistant<|end_header_id|>\\n\\n```json\\n{ 'film': ['Film_ID'] }\\n```<|eot_id|>\",\n \"<|begin_of_text|><|start_header_id|>system<|end_header_id|>\\n\\nCutting Knowledge Date: December 2023\\nToday Date: 06 Oct 2024\\n\\n<|eot_id|><|start_header_id|>user<|end_header_id|>\\n\\n# System:\\nGiven a user question and the schema of a database, your task is to generate an JSON with the the names of tables and columns of the schema that the question is referring to.\\n\\n# Schema:\\n```sql\\nTABLE book (\\n book.Book_ID (INT),\\n book.Title (TEXT),\\n book.Issues (REAL),\\n book.Writer (TEXT),\\n)\\n\\nTABLE publication (\\n publication.Publication_ID (INT),\\n publication.Book_ID (INT),\\n publication.Publisher (TEXT),\\n publication.Publication_Date (TEXT),\\n publication.Price (REAL),\\n)\\n\\n\\nPossible JOINs:\\n\\npublication.Book_ID = book.Book_ID\\n\\n```\\n\\n# Question: Show the title and publication dates of books.<|eot_id|><|start_header_id|>assistant<|end_header_id|>\\n\\n```json\\n{ 'book': ['Book_ID', 'Title'],\\n 'publication': ['Publication_ID', 'Book_ID', 'Publication_Date'] }\\n```<|eot_id|>\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n }\n ]\n}"
+ }
+ },
+ "metadata": {},
+ "execution_count": 14
+ }
+ ]
+ },
+ {
+ "cell_type": "code",
+ "source": [
+ "# df['n_tokens'] = df['text'].apply(lambda x: len(tokenizer.encode(x)))"
+ ],
+ "metadata": {
+ "id": "-8OByl30hBp7"
+ },
+ "execution_count": null,
+ "outputs": []
+ },
+ {
+ "cell_type": "code",
+ "source": [
+ "# import seaborn as sns\n",
+ "# sns.histplot(df['n_tokens'])"
+ ],
+ "metadata": {
+ "id": "kFMVR-l6hRmx"
+ },
+ "execution_count": null,
+ "outputs": []
+ },
+ {
+ "cell_type": "code",
+ "execution_count": null,
+ "metadata": {
+ "id": "TxrNQ8OGvToc",
+ "colab": {
+ "base_uri": "https://localhost:8080/"
+ },
+ "outputId": "6ba5348c-6d3f-46ff-eed1-2eed5563f39d"
+ },
+ "outputs": [
+ {
+ "output_type": "stream",
+ "name": "stdout",
+ "text": [
+ "<|begin_of_text|><|start_header_id|>system<|end_header_id|>\n",
+ "\n",
+ "Cutting Knowledge Date: December 2023\n",
+ "Today Date: 06 Oct 2024\n",
+ "\n",
+ "<|eot_id|><|start_header_id|>user<|end_header_id|>\n",
+ "\n",
+ "# System:\n",
+ "Given a user question and the schema of a database, your task is to generate an JSON with the the names of tables and columns of the schema that the question is referring to.\n",
+ "\n",
+ "# Schema:\n",
+ "```sql\n",
+ "TABLE city (\n",
+ " city.City_ID (INT),\n",
+ " city.Official_Name (TEXT),\n",
+ " city.Status (TEXT),\n",
+ " city.Area_km_2 (REAL),\n",
+ " city.Population (REAL),\n",
+ " city.Census_Ranking (TEXT),\n",
+ ")\n",
+ "\n",
+ "TABLE competition_record (\n",
+ " competition_record.Competition_ID (INT),\n",
+ " competition_record.Farm_ID (INT),\n",
+ " competition_record.Rank (INT),\n",
+ ")\n",
+ "\n",
+ "TABLE farm (\n",
+ " farm.Farm_ID (INT),\n",
+ " farm.Year (INT),\n",
+ " farm.Total_Horses (REAL),\n",
+ " farm.Working_Horses (REAL),\n",
+ " farm.Total_Cattle (REAL),\n",
+ " farm.Oxen (REAL),\n",
+ " farm.Bulls (REAL),\n",
+ " farm.Cows (REAL),\n",
+ " farm.Pigs (REAL),\n",
+ " farm.Sheep_and_Goats (REAL),\n",
+ ")\n",
+ "\n",
+ "TABLE farm_competition (\n",
+ " farm_competition.Competition_ID (INT),\n",
+ " farm_competition.Year (INT),\n",
+ " farm_competition.Theme (TEXT),\n",
+ " farm_competition.Host_city_ID (INT),\n",
+ " farm_competition.Hosts (TEXT),\n",
+ ")\n",
+ "\n",
+ "\n",
+ "Possible JOINs:\n",
+ "\n",
+ "competition_record.Competition_ID = farm_competition.Competition_ID\n",
+ "competition_record.Farm_ID = farm.Farm_ID\n",
+ "\n",
+ "farm_competition.Host_city_ID = city.City_ID\n",
+ "\n",
+ "```\n",
+ "\n",
+ "# Question: Show the status shared by cities with population bigger than 1500 and smaller than 500.<|eot_id|><|start_header_id|>assistant<|end_header_id|>\n",
+ "\n",
+ "```json\n",
+ "{ 'city': ['City_ID', 'Status', 'Population'] }\n",
+ "```<|eot_id|>\n"
+ ]
+ }
+ ],
+ "source": [
+ "print(df['text'][df.index[50]])"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": null,
+ "metadata": {
+ "id": "jgNv1q3IA4J2"
+ },
+ "outputs": [],
+ "source": [
+ "_df = pd.DataFrame(columns=['text'])\n",
+ "_df['text'] = df.sample(frac=1, random_state=14).reset_index(drop=True)['text']\n",
+ "_df = Dataset.from_pandas(_df)\n",
+ "_df = _df.train_test_split(test_size=0.01, shuffle=True, seed=14)\n",
+ "train_dataset, valid_dataset = _df[\"train\"], _df[\"test\"]"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "source": [
+ "# dataset = Dataset.from_pandas(df)\n",
+ "\n",
+ "# dataset_filtrado_tokens = dataset_easy_and_medium.filter(lambda example: len(tokenizer.tokenize(example['text'])) < 2048)\n",
+ "# dataset_filtrado_tokens\n",
+ "\n",
+ "# train_dataset = dataset_filtrado_tokens.train_test_split(test_size=0.01, shuffle=False, seed=42)[\"train\"]\n",
+ "# valid_dataset = dataset_filtrado_tokens.train_test_split(test_size=0.01, shuffle=False, seed=42)[\"test\"]"
+ ],
+ "metadata": {
+ "id": "h_ntoKppKjZ7"
+ },
+ "execution_count": null,
+ "outputs": []
+ },
+ {
+ "cell_type": "markdown",
+ "metadata": {
+ "id": "_I7-bFfm5gqS"
+ },
+ "source": [
+ "#### Chat Template - Gerar SQL"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "source": [
+ "# tokenizer.chat_template = \"\"\"\n",
+ "# {% if messages[0]['role'] == 'system' %}\n",
+ "# {% set loop_messages = messages[1:] %}\n",
+ "# {% set system_message = messages[0]['content'] %}\n",
+ "# {% else %}\n",
+ "# {% set loop_messages = messages %}\n",
+ "# {% set system_message = 'Given a user question and the schema of a database, your task is to generate an SQL query that accurately answers the question based on the provided schema.' %}\n",
+ "# {% endif %}\n",
+ "# {{ '# <|system|>/n/' + system_message + '/n//n/' }}\n",
+ "# {% if messages|selectattr(\"role\", \"equalto\", \"example\")|list %}\n",
+ "# Below are some examples of question and their corresponding SQL queries:/n//n/\n",
+ "# {% else %}\n",
+ "# /n/\n",
+ "# {% endif %}\n",
+ "# {% for message in loop_messages %}\n",
+ "# {% if message['role'] == 'example' %}\n",
+ "# {{ message['content'] }}/n//n/\n",
+ "# {% elif message['role'] == 'schema' %}\n",
+ "# # <|schema|>/n/The query will run on a database with the following schema:/n/{{ message['content'] }}/n//n/\n",
+ "# {% elif message['role'] == 'user' %}\n",
+ "# # <|user|>/n/[QUESTION]{{ message['content'] }}[/QUESTION]/n//n/\n",
+ "# {% elif message['role'] == 'assistant' %}\n",
+ "# # <|assistant|>/n/[SQL]{{ message['content'] }}[/SQL]\n",
+ "# {% endif %}\n",
+ "# {% endfor %}\n",
+ "# {% if add_generation_prompt %}\n",
+ "# # <|assistant|>/n/[SQL]\n",
+ "# {% endif %}\n",
+ "# \"\"\".replace(\"\\n\",\"\").replace(\" \", \"\").replace(\"/n/\", \"\\n\")"
+ ],
+ "metadata": {
+ "id": "cYVA3Q7ZCzHi"
+ },
+ "execution_count": null,
+ "outputs": []
+ },
+ {
+ "cell_type": "code",
+ "source": [
+ "import re\n",
+ "\n",
+ "def replace_alias_with_table(query):\n",
+ " # Expressão regular para encontrar tabelas com alias, capturando o nome da tabela e o alias\n",
+ " alias_pattern = re.compile(r'(\\bFROM\\b|\\bJOIN\\b)\\s+(\\w+)\\s+AS\\s+(\\w+)', re.IGNORECASE)\n",
+ "\n",
+ " # Substituições de aliases encontrados no padrão\n",
+ " aliases = {match.group(3): match.group(2) for match in alias_pattern.finditer(query)}\n",
+ "\n",
+ " # Substituir cada alias pelo nome da tabela correspondente\n",
+ " for alias, table in aliases.items():\n",
+ " query = re.sub(r'\\b' + alias + r'\\b', table, query)\n",
+ "\n",
+ " # Remover 'AS' e alias das cláusulas 'FROM' e 'JOIN'\n",
+ " query = re.sub(r'\\bAS\\s+\\w+', '', query, flags=re.IGNORECASE)\n",
+ " return query"
+ ],
+ "metadata": {
+ "id": "LTvflkdTJ1XB"
+ },
+ "execution_count": 10,
+ "outputs": []
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 11,
+ "metadata": {
+ "id": "6RDDdVgP5gqT"
+ },
+ "outputs": [],
+ "source": [
+ "def to_sql(query):\n",
+ " return sqlparse.format(replace_alias_with_table(query), reindent=True, keyword_case='upper')\n",
+ "\n",
+ "def apply_template(row, tokenizer=tokenizer, n_examplea=0):\n",
+ " question = row['question_en']\n",
+ " schema = row['schema_SQLDatabase_reduzido_tabelas']\n",
+ " sql = to_sql(row['query'])\n",
+ "\n",
+ " system = \"Given a user question and the schema of a database, your task is to generate an SQL query that accurately answers the question based on the provided schema.\"\n",
+ "\n",
+ " chat = [\n",
+ " {'role': 'system', 'content': system},\n",
+ " {'role': 'user', 'content': f\"# Schema:\\n```sql\\n{schema}\\n```\\n\\n# Question: {question}\"},\n",
+ " {'role': 'assistant', 'content': f\"```sql\\n{sql}\\n```\\n\"}\n",
+ " ]\n",
+ "\n",
+ " # chat = [\n",
+ " # {\"role\": \"schema\", \"content\": schema},\n",
+ " # {\"role\": \"user\", \"content\": question},\n",
+ " # {\"role\": \"assistant\", \"content\": sql},\n",
+ " # ]\n",
+ "\n",
+ " row['text'] = tokenizer.apply_chat_template(chat, tokenize=False, add_generation_prompt=False)\n",
+ "\n",
+ " return row"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": null,
+ "metadata": {
+ "id": "2trHEegL5gqU"
+ },
+ "outputs": [],
+ "source": [
+ "# spider_chain = json.load(open(\"/content/drive/Shareddrives/LLMs/Datasets/spider/spider_chain_of_thought.json\", \"r\"))\n",
+ "# bird_chain = json.load(open(\"/content/drive/Shareddrives/LLMs/Datasets/bird/bird_chain_of_thought.json\", \"r\"))"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": null,
+ "metadata": {
+ "id": "N4jWrC7s5gqU"
+ },
+ "outputs": [],
+ "source": [
+ "# df['CoT'] = spider_chain + bird_chain"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 12,
+ "metadata": {
+ "id": "bTF0pBsw5gqU"
+ },
+ "outputs": [],
+ "source": [
+ "df = df.apply(apply_template, axis=1)"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": null,
+ "metadata": {
+ "id": "L4tjUv7o5gqV"
+ },
+ "outputs": [],
+ "source": [
+ "df.head()"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": null,
+ "metadata": {
+ "id": "DfJvLaGR5gqV"
+ },
+ "outputs": [],
+ "source": [
+ "# df['n_tokens'] = df['text'].apply(lambda x: len(tokenizer.encode(x)))"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": null,
+ "metadata": {
+ "id": "vJseOHIu5gqW"
+ },
+ "outputs": [],
+ "source": [
+ "# import seaborn as sns\n",
+ "# sns.histplot(df['n_tokens'])"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 14,
+ "metadata": {
+ "colab": {
+ "base_uri": "https://localhost:8080/"
+ },
+ "outputId": "285b7e4f-3f82-4beb-b33e-b13bddffc8a3",
+ "id": "PIvSnr6Y5gqW"
+ },
+ "outputs": [
+ {
+ "output_type": "stream",
+ "name": "stdout",
+ "text": [
+ "<|im_start|>system\n",
+ "Given a user question and the schema of a database, your task is to generate an SQL query that accurately answers the question based on the provided schema.<|im_end|>\n",
+ "<|im_start|>user\n",
+ "# Schema:\n",
+ "```sql\n",
+ "CREATE TABLE city (\n",
+ " City_ID INT,\n",
+ " Official_Name TEXT,\n",
+ " Status TEXT,\n",
+ " Area_km_2 REAL,\n",
+ " Population REAL,\n",
+ " Census_Ranking TEXT,\n",
+ " PRIMARY KEY (City_ID)\n",
+ ");\n",
+ "```\n",
+ "\n",
+ "# Question: Show the status shared by cities with population bigger than 1500 and smaller than 500.<|im_end|>\n",
+ "<|im_start|>assistant\n",
+ "```sql\n",
+ "SELECT Status\n",
+ "FROM city\n",
+ "WHERE Population > 1500 INTERSECT\n",
+ " SELECT Status\n",
+ " FROM city WHERE Population < 500\n",
+ "```\n",
+ "<|im_end|>\n",
+ "\n"
+ ]
+ }
+ ],
+ "source": [
+ "print(df['text'][df.index[50]])"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 15,
+ "metadata": {
+ "id": "roZzKNOj5gqW"
+ },
+ "outputs": [],
+ "source": [
+ "_df = pd.DataFrame(columns=['text'])\n",
+ "_df['text'] = df.sample(frac=1, random_state=14).reset_index(drop=True)['text']\n",
+ "_df = Dataset.from_pandas(_df)\n",
+ "_df = _df.train_test_split(test_size=0.01, shuffle=True, seed=14)\n",
+ "train_dataset, valid_dataset = _df[\"train\"], _df[\"test\"]"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "metadata": {
+ "id": "DWpXeuO_KlLS"
+ },
+ "source": [
+ "### Finetuning"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 17,
+ "metadata": {
+ "id": "0oVpZDj1AXY9",
+ "colab": {
+ "base_uri": "https://localhost:8080/"
+ },
+ "outputId": "1d313c21-2dbc-4170-c05a-7f9631dd6116"
+ },
+ "outputs": [
+ {
+ "output_type": "stream",
+ "name": "stdout",
+ "text": [
+ "The token has not been saved to the git credentials helper. Pass `add_to_git_credential=True` in this function directly or `--add-to-git-credential` if using via `huggingface-cli` if you want to set the git credential as well.\n",
+ "Token is valid (permission: write).\n",
+ "Your token has been saved to /root/.cache/huggingface/token\n",
+ "Login successful\n"
+ ]
+ }
+ ],
+ "source": [
+ "from huggingface_hub import login, create_repo\n",
+ "from google.colab import userdata\n",
+ "import os\n",
+ "\n",
+ "#token = userdata.get('hf_write')\n",
+ "token = WRITE_TOKEN\n",
+ "login(token=token)\n",
+ "set_seed(1234)"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 18,
+ "metadata": {
+ "id": "KRhO7UJ-Q4Y8"
+ },
+ "outputs": [],
+ "source": [
+ "def find_all_linear_names(model, new_tokens=False):\n",
+ " lora_module_names = set()\n",
+ " for name, module in model.named_modules():\n",
+ " if isinstance(module, bnb.nn.Linear4bit) or isinstance(module, bnb.nn.Linear8bitLt):\n",
+ " names = name.split(\".\")\n",
+ " lora_module_names.add(names[0] if len(names) == 1 else names[-1])\n",
+ " if(new_tokens):\n",
+ " lora_module_names.add(\"lm_head\")\n",
+ " return list(lora_module_names)"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 19,
+ "metadata": {
+ "id": "L0qqP5Y9PtRh",
+ "colab": {
+ "base_uri": "https://localhost:8080/"
+ },
+ "outputId": "038fbb67-16cc-4d7f-9199-9694451ee801"
+ },
+ "outputs": [
+ {
+ "output_type": "stream",
+ "name": "stdout",
+ "text": [
+ "Found 7 modules to quantize: ['o_proj', 'up_proj', 'v_proj', 'gate_proj', 'q_proj', 'down_proj', 'k_proj']\n"
+ ]
+ }
+ ],
+ "source": [
+ "modules = find_all_linear_names(model)\n",
+ "print(f\"Found {len(modules)} modules to quantize: {modules}\")"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 20,
+ "metadata": {
+ "id": "uFUnJrbjPwAT"
+ },
+ "outputs": [],
+ "source": [
+ "peft_config = LoraConfig(\n",
+ " lora_alpha=128, #primeira versão = 16\n",
+ " lora_dropout=0.1,\n",
+ " r=64,\n",
+ " # bias=\"none\",\n",
+ " # task_type=\"CAUSAL_LM\",\n",
+ " target_modules=modules,\n",
+ " # modules_to_save=[\"embed_tokens\"], #quando adicionar tokens speciais\n",
+ ")"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 21,
+ "metadata": {
+ "id": "buh0o2P2jwbx"
+ },
+ "outputs": [],
+ "source": [
+ "torch.cuda.empty_cache()"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 22,
+ "metadata": {
+ "id": "9bD7ea0F-GQn",
+ "colab": {
+ "base_uri": "https://localhost:8080/",
+ "height": 1000,
+ "referenced_widgets": [
+ "780c1ae797ee48cb97e2530eb2a8a49f",
+ "651fc5f1f3384c77a96380a2e35a9ac4",
+ "9a37ef338ef74693ba6547b246e432a3",
+ "1ef299925fa7408a9374be0b740a9e95",
+ "ff9bfd5baa2e496dbe4d8c2a7cad3b93",
+ "35597aaf146943999889a889041a2363",
+ "396417cb735d4e879e3592274563377d",
+ "920d3a1046604736a4adea3d06c91c46",
+ "38f10f50c1de4041a647c36051439196",
+ "bd73e52a62554625a6ffa35de8b1fcb4",
+ "b2bf77031dbb4704a7c5db2092e96b79",
+ "b412f8a8fba5467cb11facd8ec1aedf4",
+ "844556f6f4f5414f8cb94a05ba81e5f3",
+ "16402df70c754eacacf0e2c75790248b",
+ "9923bcd6780044cbb60d110320cb3fa3",
+ "35761e009c8d4882b6a2fb40c363f372",
+ "897879b0d7dd44498eb3dd9b882e943c",
+ "c59dbd844df0496b811ff3793d4827c6",
+ "4ab4dd1eb03547bc9631ea18caf21881",
+ "6fff8b423cb84d03b68049989a4f1174",
+ "376c9b894ccb4c8aa00e06adba02ad9a",
+ "c65ff75932ad45ffb417949562c68332"
+ ]
+ },
+ "outputId": "6ac1c196-d654-4f49-fe2c-164ba72903b8"
+ },
+ "outputs": [
+ {
+ "metadata": {
+ "tags": null
+ },
+ "name": "stderr",
+ "output_type": "stream",
+ "text": [
+ "/usr/local/lib/python3.10/dist-packages/huggingface_hub/utils/_deprecation.py:100: FutureWarning: Deprecated argument(s) used in '__init__': dataset_text_field, max_seq_length. Will not be supported from version '0.13.0'.\n",
+ "\n",
+ "Deprecated positional argument(s) used in SFTTrainer, please use the SFTConfig to set these arguments instead.\n",
+ " warnings.warn(message, FutureWarning)\n",
+ "/usr/local/lib/python3.10/dist-packages/trl/trainer/sft_trainer.py:300: UserWarning: You passed a `max_seq_length` argument to the SFTTrainer, the value you passed will override the one in the `SFTConfig`.\n",
+ " warnings.warn(\n",
+ "/usr/local/lib/python3.10/dist-packages/trl/trainer/sft_trainer.py:328: UserWarning: You passed a `dataset_text_field` argument to the SFTTrainer, the value you passed will override the one in the `SFTConfig`.\n",
+ " warnings.warn(\n"
+ ]
+ },
+ {
+ "data": {
+ "application/vnd.jupyter.widget-view+json": {
+ "model_id": "780c1ae797ee48cb97e2530eb2a8a49f",
+ "version_major": 2,
+ "version_minor": 0
+ },
+ "text/plain": [
+ "Map: 0%| | 0/8569 [00:00, ? examples/s]"
+ ]
+ },
+ "metadata": {},
+ "output_type": "display_data"
+ },
+ {
+ "data": {
+ "application/vnd.jupyter.widget-view+json": {
+ "model_id": "b412f8a8fba5467cb11facd8ec1aedf4",
+ "version_major": 2,
+ "version_minor": 0
+ },
+ "text/plain": [
+ "Map: 0%| | 0/87 [00:00, ? examples/s]"
+ ]
+ },
+ "metadata": {},
+ "output_type": "display_data"
+ },
+ {
+ "metadata": {
+ "tags": null
+ },
+ "name": "stderr",
+ "output_type": "stream",
+ "text": [
+ "/usr/local/lib/python3.10/dist-packages/accelerate/accelerator.py:494: FutureWarning: `torch.cuda.amp.GradScaler(args...)` is deprecated. Please use `torch.amp.GradScaler('cuda', args...)` instead.\n",
+ " self.scaler = torch.cuda.amp.GradScaler(**kwargs)\n",
+ "/usr/local/lib/python3.10/dist-packages/torch/_dynamo/eval_frame.py:600: UserWarning: torch.utils.checkpoint: the use_reentrant parameter should be passed explicitly. In version 2.4 we will raise an exception if use_reentrant is not passed. use_reentrant=False is recommended, but if you need to preserve the current default behavior, you can pass use_reentrant=True. Refer to docs for more details on the differences between the two variants.\n",
+ " return fn(*args, **kwargs)\n",
+ "/usr/local/lib/python3.10/dist-packages/torch/utils/checkpoint.py:295: FutureWarning: `torch.cpu.amp.autocast(args...)` is deprecated. Please use `torch.amp.autocast('cpu', args...)` instead.\n",
+ " with torch.enable_grad(), device_autocast_ctx, torch.cpu.amp.autocast(**ctx.cpu_autocast_kwargs): # type: ignore[attr-defined]\n"
+ ]
+ },
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ " \n",
+ " \n",
+ "
\n",
+ " [ 526/1071 1:08:50 < 1:11:35, 0.13 it/s, Epoch 0.49/1]\n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " Step | \n",
+ " Training Loss | \n",
+ " Validation Loss | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " 250 | \n",
+ " 0.454300 | \n",
+ " 0.294916 | \n",
+ "
\n",
+ " \n",
+ " 500 | \n",
+ " 0.248900 | \n",
+ " 0.247413 | \n",
+ "
\n",
+ " \n",
+ "
"
+ ],
+ "text/plain": [
+ ""
+ ]
+ },
+ "metadata": {},
+ "output_type": "display_data"
+ },
+ {
+ "metadata": {
+ "tags": null
+ },
+ "name": "stderr",
+ "output_type": "stream",
+ "text": [
+ "Trainer.tokenizer is now deprecated. You should use Trainer.processing_class instead.\n",
+ "Trainer.tokenizer is now deprecated. You should use Trainer.processing_class instead.\n",
+ "/usr/local/lib/python3.10/dist-packages/torch/_dynamo/eval_frame.py:600: UserWarning: torch.utils.checkpoint: the use_reentrant parameter should be passed explicitly. In version 2.4 we will raise an exception if use_reentrant is not passed. use_reentrant=False is recommended, but if you need to preserve the current default behavior, you can pass use_reentrant=True. Refer to docs for more details on the differences between the two variants.\n",
+ " return fn(*args, **kwargs)\n",
+ "/usr/local/lib/python3.10/dist-packages/torch/utils/checkpoint.py:295: FutureWarning: `torch.cpu.amp.autocast(args...)` is deprecated. Please use `torch.amp.autocast('cpu', args...)` instead.\n",
+ " with torch.enable_grad(), device_autocast_ctx, torch.cpu.amp.autocast(**ctx.cpu_autocast_kwargs): # type: ignore[attr-defined]\n",
+ "Trainer.tokenizer is now deprecated. You should use Trainer.processing_class instead.\n",
+ "Trainer.tokenizer is now deprecated. You should use Trainer.processing_class instead.\n",
+ "/usr/local/lib/python3.10/dist-packages/torch/_dynamo/eval_frame.py:600: UserWarning: torch.utils.checkpoint: the use_reentrant parameter should be passed explicitly. In version 2.4 we will raise an exception if use_reentrant is not passed. use_reentrant=False is recommended, but if you need to preserve the current default behavior, you can pass use_reentrant=True. Refer to docs for more details on the differences between the two variants.\n",
+ " return fn(*args, **kwargs)\n",
+ "/usr/local/lib/python3.10/dist-packages/torch/utils/checkpoint.py:295: FutureWarning: `torch.cpu.amp.autocast(args...)` is deprecated. Please use `torch.amp.autocast('cpu', args...)` instead.\n",
+ " with torch.enable_grad(), device_autocast_ctx, torch.cpu.amp.autocast(**ctx.cpu_autocast_kwargs): # type: ignore[attr-defined]\n"
+ ]
+ },
+ {
+ "output_type": "display_data",
+ "data": {
+ "text/plain": [
+ ""
+ ],
+ "text/html": [
+ "\n",
+ " \n",
+ " \n",
+ "
\n",
+ " [1071/1071 2:20:02, Epoch 0/1]\n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " Step | \n",
+ " Training Loss | \n",
+ " Validation Loss | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " 250 | \n",
+ " 0.454300 | \n",
+ " 0.294916 | \n",
+ "
\n",
+ " \n",
+ " 500 | \n",
+ " 0.248900 | \n",
+ " 0.247413 | \n",
+ "
\n",
+ " \n",
+ " 750 | \n",
+ " 0.220500 | \n",
+ " 0.221026 | \n",
+ "
\n",
+ " \n",
+ " 1000 | \n",
+ " 0.204900 | \n",
+ " 0.212971 | \n",
+ "
\n",
+ " \n",
+ "
"
+ ]
+ },
+ "metadata": {}
+ },
+ {
+ "output_type": "stream",
+ "name": "stderr",
+ "text": [
+ "Trainer.tokenizer is now deprecated. You should use Trainer.processing_class instead.\n",
+ "Trainer.tokenizer is now deprecated. You should use Trainer.processing_class instead.\n",
+ "/usr/local/lib/python3.10/dist-packages/torch/_dynamo/eval_frame.py:600: UserWarning: torch.utils.checkpoint: the use_reentrant parameter should be passed explicitly. In version 2.4 we will raise an exception if use_reentrant is not passed. use_reentrant=False is recommended, but if you need to preserve the current default behavior, you can pass use_reentrant=True. Refer to docs for more details on the differences between the two variants.\n",
+ " return fn(*args, **kwargs)\n",
+ "/usr/local/lib/python3.10/dist-packages/torch/utils/checkpoint.py:295: FutureWarning: `torch.cpu.amp.autocast(args...)` is deprecated. Please use `torch.amp.autocast('cpu', args...)` instead.\n",
+ " with torch.enable_grad(), device_autocast_ctx, torch.cpu.amp.autocast(**ctx.cpu_autocast_kwargs): # type: ignore[attr-defined]\n",
+ "Trainer.tokenizer is now deprecated. You should use Trainer.processing_class instead.\n",
+ "Trainer.tokenizer is now deprecated. You should use Trainer.processing_class instead.\n",
+ "/usr/local/lib/python3.10/dist-packages/torch/_dynamo/eval_frame.py:600: UserWarning: torch.utils.checkpoint: the use_reentrant parameter should be passed explicitly. In version 2.4 we will raise an exception if use_reentrant is not passed. use_reentrant=False is recommended, but if you need to preserve the current default behavior, you can pass use_reentrant=True. Refer to docs for more details on the differences between the two variants.\n",
+ " return fn(*args, **kwargs)\n",
+ "/usr/local/lib/python3.10/dist-packages/torch/utils/checkpoint.py:295: FutureWarning: `torch.cpu.amp.autocast(args...)` is deprecated. Please use `torch.amp.autocast('cpu', args...)` instead.\n",
+ " with torch.enable_grad(), device_autocast_ctx, torch.cpu.amp.autocast(**ctx.cpu_autocast_kwargs): # type: ignore[attr-defined]\n"
+ ]
+ }
+ ],
+ "source": [
+ "steps=250\n",
+ "strategy=\"steps\"\n",
+ "\n",
+ "trainer = SFTTrainer(\n",
+ " model= model,\n",
+ " tokenizer=tokenizer,\n",
+ "\n",
+ " train_dataset=train_dataset,\n",
+ " eval_dataset=valid_dataset,\n",
+ "\n",
+ " peft_config=peft_config,\n",
+ "\n",
+ " dataset_text_field=\"text\",\n",
+ " max_seq_length=2048,\n",
+ " args= TrainingArguments(\n",
+ " output_dir=\"out\",\n",
+ "\n",
+ " save_strategy=strategy,\n",
+ " save_steps= steps,\n",
+ "\n",
+ " logging_strategy=strategy,\n",
+ " logging_steps=steps,\n",
+ " logging_dir=\"out/logs\",\n",
+ "\n",
+ " eval_strategy=strategy,\n",
+ " eval_steps=steps,\n",
+ "\n",
+ " num_train_epochs=1,\n",
+ " per_device_train_batch_size=1,\n",
+ " per_device_eval_batch_size=1,\n",
+ " gradient_accumulation_steps=8, #primeira versão era 1\n",
+ " gradient_checkpointing=True,\n",
+ " fp16=True,\n",
+ " bf16=False,\n",
+ "\n",
+ " optim=\"paged_adamw_8bit\",\n",
+ " learning_rate=1e-4, #primeira versão era 2e-4,\n",
+ " weight_decay=0.001,\n",
+ " max_grad_norm=0.3,\n",
+ " max_steps=-1,\n",
+ " warmup_ratio=0.03,\n",
+ " group_by_length=True,\n",
+ " lr_scheduler_type=\"cosine\", #primeira versão era linear\n",
+ " seed= seed,\n",
+ "\n",
+ "\n",
+ " report_to=[\"tensorboard\"],\n",
+ " push_to_hub=True,\n",
+ " hub_strategy=\"all_checkpoints\",\n",
+ " hub_model_id=out_name,\n",
+ "\n",
+ " label_names=[\"labels\"]\n",
+ " )\n",
+ "\n",
+ ")\n",
+ "if(prev_checkpoint != None):\n",
+ " trainer.train(f\"out/{prev_checkpoint}\")\n",
+ "else:\n",
+ " trainer.train()"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 23,
+ "metadata": {
+ "id": "i39Ov4dsGv77",
+ "colab": {
+ "base_uri": "https://localhost:8080/",
+ "height": 52
+ },
+ "outputId": "d7c5f985-a1e4-426e-db42-6049ea4f59dc"
+ },
+ "outputs": [
+ {
+ "output_type": "execute_result",
+ "data": {
+ "text/plain": [
+ "CommitInfo(commit_url='https://huggingface.co/lleticiasilvaa/StableCode-text2SQL-schemaReduzidoTabelas/commit/5796bc794767f39348649736c8a9b7c88f12421d', commit_message='End of training', commit_description='', oid='5796bc794767f39348649736c8a9b7c88f12421d', pr_url=None, pr_revision=None, pr_num=None)"
+ ],
+ "application/vnd.google.colaboratory.intrinsic+json": {
+ "type": "string"
+ }
+ },
+ "metadata": {},
+ "execution_count": 23
+ }
+ ],
+ "source": [
+ "trainer.push_to_hub()"
+ ]
+ }
+ ],
+ "metadata": {
+ "accelerator": "GPU",
+ "colab": {
+ "gpuType": "T4",
+ "provenance": [],
+ "collapsed_sections": [
+ "leGEqxURAL4r"
+ ]
+ },
+ "kernelspec": {
+ "display_name": "default:Python",
+ "language": "python",
+ "name": "conda-env-default-py"
+ },
+ "language_info": {
+ "codemirror_mode": {
+ "name": "ipython",
+ "version": 3
+ },
+ "file_extension": ".py",
+ "mimetype": "text/x-python",
+ "name": "python",
+ "nbconvert_exporter": "python",
+ "pygments_lexer": "ipython3",
+ "version": "3.9.16"
+ },
+ "widgets": {
+ "application/vnd.jupyter.widget-state+json": {
+ "62b5a4803207499da82677b9b146b97b": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "HBoxModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "HBoxModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "HBoxView",
+ "box_style": "",
+ "children": [
+ "IPY_MODEL_1c006910a42e40728867969135b6d848",
+ "IPY_MODEL_1a5af1ef864e41d99a79d5b94d982711",
+ "IPY_MODEL_a84dab2f85094fb3997adb2d3c2ecd0a"
+ ],
+ "layout": "IPY_MODEL_bcc0fee091bb4a308e9c39e2ae091acd"
+ }
+ },
+ "1c006910a42e40728867969135b6d848": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "HTMLModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "HTMLModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "HTMLView",
+ "description": "",
+ "description_tooltip": null,
+ "layout": "IPY_MODEL_349dd7e2bfd141a583b8ec25b786cae3",
+ "placeholder": "",
+ "style": "IPY_MODEL_29717b10d1bd45cba1a785123bd2a0b4",
+ "value": "README.md: 100%"
+ }
+ },
+ "1a5af1ef864e41d99a79d5b94d982711": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "FloatProgressModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "FloatProgressModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "ProgressView",
+ "bar_style": "success",
+ "description": "",
+ "description_tooltip": null,
+ "layout": "IPY_MODEL_319f0c7c10c546b3a1be237d93ebf5ae",
+ "max": 885,
+ "min": 0,
+ "orientation": "horizontal",
+ "style": "IPY_MODEL_7c0a09f10b59412ba4271ba77a1378f0",
+ "value": 885
+ }
+ },
+ "a84dab2f85094fb3997adb2d3c2ecd0a": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "HTMLModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "HTMLModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "HTMLView",
+ "description": "",
+ "description_tooltip": null,
+ "layout": "IPY_MODEL_ba00c487942a4c50ad032aad072a6f7b",
+ "placeholder": "",
+ "style": "IPY_MODEL_11d0433884ca4e46b7cb033b5e546ad4",
+ "value": " 885/885 [00:00<00:00, 37.2kB/s]"
+ }
+ },
+ "bcc0fee091bb4a308e9c39e2ae091acd": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "349dd7e2bfd141a583b8ec25b786cae3": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "29717b10d1bd45cba1a785123bd2a0b4": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "DescriptionStyleModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "DescriptionStyleModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "StyleView",
+ "description_width": ""
+ }
+ },
+ "319f0c7c10c546b3a1be237d93ebf5ae": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "7c0a09f10b59412ba4271ba77a1378f0": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "ProgressStyleModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "ProgressStyleModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "StyleView",
+ "bar_color": null,
+ "description_width": ""
+ }
+ },
+ "ba00c487942a4c50ad032aad072a6f7b": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "11d0433884ca4e46b7cb033b5e546ad4": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "DescriptionStyleModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "DescriptionStyleModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "StyleView",
+ "description_width": ""
+ }
+ },
+ "eb2518b1c019478daec2d2c058898096": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "HBoxModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "HBoxModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "HBoxView",
+ "box_style": "",
+ "children": [
+ "IPY_MODEL_c25c3c6ca8f343c2b7519abca165c779",
+ "IPY_MODEL_207cc561423a413c975d54acfdfd73a4",
+ "IPY_MODEL_d86de6918ba94a159b0c48b33bc9d90c"
+ ],
+ "layout": "IPY_MODEL_22531ea2c5fe493ca2a87b8432424371"
+ }
+ },
+ "c25c3c6ca8f343c2b7519abca165c779": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "HTMLModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "HTMLModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "HTMLView",
+ "description": "",
+ "description_tooltip": null,
+ "layout": "IPY_MODEL_964dfefdf21648a6a2ab33a935efb4e7",
+ "placeholder": "",
+ "style": "IPY_MODEL_6d9d4727e4734795a65a12306e1db3e9",
+ "value": "dev-00000-of-00001.parquet: 100%"
+ }
+ },
+ "207cc561423a413c975d54acfdfd73a4": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "FloatProgressModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "FloatProgressModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "ProgressView",
+ "bar_style": "success",
+ "description": "",
+ "description_tooltip": null,
+ "layout": "IPY_MODEL_cfa5cebbda604836bfb3daf1a0a9eb5b",
+ "max": 368731,
+ "min": 0,
+ "orientation": "horizontal",
+ "style": "IPY_MODEL_bf0121739fac4cab8a6a56f607e99067",
+ "value": 368731
+ }
+ },
+ "d86de6918ba94a159b0c48b33bc9d90c": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "HTMLModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "HTMLModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "HTMLView",
+ "description": "",
+ "description_tooltip": null,
+ "layout": "IPY_MODEL_2cf8d94d40d14f9ab02389fe857a44e7",
+ "placeholder": "",
+ "style": "IPY_MODEL_ca3279d8e8d14ae3958efd4990d760f5",
+ "value": " 369k/369k [00:00<00:00, 12.1MB/s]"
+ }
+ },
+ "22531ea2c5fe493ca2a87b8432424371": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "964dfefdf21648a6a2ab33a935efb4e7": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "6d9d4727e4734795a65a12306e1db3e9": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "DescriptionStyleModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "DescriptionStyleModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "StyleView",
+ "description_width": ""
+ }
+ },
+ "cfa5cebbda604836bfb3daf1a0a9eb5b": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "bf0121739fac4cab8a6a56f607e99067": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "ProgressStyleModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "ProgressStyleModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "StyleView",
+ "bar_color": null,
+ "description_width": ""
+ }
+ },
+ "2cf8d94d40d14f9ab02389fe857a44e7": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "ca3279d8e8d14ae3958efd4990d760f5": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "DescriptionStyleModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "DescriptionStyleModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "StyleView",
+ "description_width": ""
+ }
+ },
+ "3b861b5eb85a4eb1a5800dd33e199b88": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "HBoxModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "HBoxModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "HBoxView",
+ "box_style": "",
+ "children": [
+ "IPY_MODEL_f60ecb97d13d4056a7295306b4a726f3",
+ "IPY_MODEL_7ed9c3225ff34256bb3d105a541a2dbb",
+ "IPY_MODEL_8ed8b8ef97fd4b4cbb03f6954fa70367"
+ ],
+ "layout": "IPY_MODEL_4651ad7190a047f98bbf3817e529f9f8"
+ }
+ },
+ "f60ecb97d13d4056a7295306b4a726f3": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "HTMLModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "HTMLModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "HTMLView",
+ "description": "",
+ "description_tooltip": null,
+ "layout": "IPY_MODEL_22d3f097275c42869bc2bc07b70b99f4",
+ "placeholder": "",
+ "style": "IPY_MODEL_82b145ecd4994698b56223f44c695054",
+ "value": "train-00000-of-00001.parquet: 100%"
+ }
+ },
+ "7ed9c3225ff34256bb3d105a541a2dbb": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "FloatProgressModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "FloatProgressModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "ProgressView",
+ "bar_style": "success",
+ "description": "",
+ "description_tooltip": null,
+ "layout": "IPY_MODEL_ec2be65f2cdb476ea1717ef7040f839a",
+ "max": 2699654,
+ "min": 0,
+ "orientation": "horizontal",
+ "style": "IPY_MODEL_35c2672c5c8542dd80d92167dd9d9163",
+ "value": 2699654
+ }
+ },
+ "8ed8b8ef97fd4b4cbb03f6954fa70367": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "HTMLModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "HTMLModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "HTMLView",
+ "description": "",
+ "description_tooltip": null,
+ "layout": "IPY_MODEL_aa21408da1eb4d1bb1a2aa00eedc9412",
+ "placeholder": "",
+ "style": "IPY_MODEL_938befa273d944d6932eafd292376a7b",
+ "value": " 2.70M/2.70M [00:00<00:00, 10.3MB/s]"
+ }
+ },
+ "4651ad7190a047f98bbf3817e529f9f8": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "22d3f097275c42869bc2bc07b70b99f4": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "82b145ecd4994698b56223f44c695054": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "DescriptionStyleModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "DescriptionStyleModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "StyleView",
+ "description_width": ""
+ }
+ },
+ "ec2be65f2cdb476ea1717ef7040f839a": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "35c2672c5c8542dd80d92167dd9d9163": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "ProgressStyleModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "ProgressStyleModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "StyleView",
+ "bar_color": null,
+ "description_width": ""
+ }
+ },
+ "aa21408da1eb4d1bb1a2aa00eedc9412": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "938befa273d944d6932eafd292376a7b": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "DescriptionStyleModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "DescriptionStyleModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "StyleView",
+ "description_width": ""
+ }
+ },
+ "d786b4589eaa4a9d8dd1a17beb71a42c": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "HBoxModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "HBoxModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "HBoxView",
+ "box_style": "",
+ "children": [
+ "IPY_MODEL_3f0ddb4d9e5346b8b6d46e3dd1f5a848",
+ "IPY_MODEL_0ec766ee8a12493492e591aae846821e",
+ "IPY_MODEL_ee72b1d5917e4377b4140d04b6238961"
+ ],
+ "layout": "IPY_MODEL_1a9cdc5f9aa84a3abe8a93d51bda8cf4"
+ }
+ },
+ "3f0ddb4d9e5346b8b6d46e3dd1f5a848": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "HTMLModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "HTMLModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "HTMLView",
+ "description": "",
+ "description_tooltip": null,
+ "layout": "IPY_MODEL_8ba0c5c19e7b40e3b1987a274f04e780",
+ "placeholder": "",
+ "style": "IPY_MODEL_cad63d5f62d04a0987898969ec0bc4fb",
+ "value": "Generating dev split: 100%"
+ }
+ },
+ "0ec766ee8a12493492e591aae846821e": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "FloatProgressModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "FloatProgressModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "ProgressView",
+ "bar_style": "success",
+ "description": "",
+ "description_tooltip": null,
+ "layout": "IPY_MODEL_30a5dcee7cc142ec8a8f6b2888853fab",
+ "max": 1034,
+ "min": 0,
+ "orientation": "horizontal",
+ "style": "IPY_MODEL_69f97bec934b444993afa7056655ee4d",
+ "value": 1034
+ }
+ },
+ "ee72b1d5917e4377b4140d04b6238961": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "HTMLModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "HTMLModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "HTMLView",
+ "description": "",
+ "description_tooltip": null,
+ "layout": "IPY_MODEL_485a0a650475469686655c0326849223",
+ "placeholder": "",
+ "style": "IPY_MODEL_bd7f555c54e84745b3ee0bf5d3bbe65f",
+ "value": " 1034/1034 [00:00<00:00, 14987.27 examples/s]"
+ }
+ },
+ "1a9cdc5f9aa84a3abe8a93d51bda8cf4": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "8ba0c5c19e7b40e3b1987a274f04e780": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "cad63d5f62d04a0987898969ec0bc4fb": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "DescriptionStyleModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "DescriptionStyleModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "StyleView",
+ "description_width": ""
+ }
+ },
+ "30a5dcee7cc142ec8a8f6b2888853fab": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "69f97bec934b444993afa7056655ee4d": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "ProgressStyleModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "ProgressStyleModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "StyleView",
+ "bar_color": null,
+ "description_width": ""
+ }
+ },
+ "485a0a650475469686655c0326849223": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "bd7f555c54e84745b3ee0bf5d3bbe65f": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "DescriptionStyleModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "DescriptionStyleModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "StyleView",
+ "description_width": ""
+ }
+ },
+ "5abd0ad065d74e5090902ca9420e9eda": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "HBoxModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "HBoxModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "HBoxView",
+ "box_style": "",
+ "children": [
+ "IPY_MODEL_8dd111f5c4c84ef0b1213a7cf20db429",
+ "IPY_MODEL_563de63f39af4f949944c2bcc79e2f62",
+ "IPY_MODEL_279032b33e64433d8c5ac7d7a1bf4b2b"
+ ],
+ "layout": "IPY_MODEL_a7f20c1db6014748b1c9d567b29bdb76"
+ }
+ },
+ "8dd111f5c4c84ef0b1213a7cf20db429": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "HTMLModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "HTMLModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "HTMLView",
+ "description": "",
+ "description_tooltip": null,
+ "layout": "IPY_MODEL_7f1157ebb5a04a4bb3c7b83df53fd206",
+ "placeholder": "",
+ "style": "IPY_MODEL_1c54e6b541dc40038b3d176af7949ee2",
+ "value": "Generating train split: 100%"
+ }
+ },
+ "563de63f39af4f949944c2bcc79e2f62": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "FloatProgressModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "FloatProgressModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "ProgressView",
+ "bar_style": "success",
+ "description": "",
+ "description_tooltip": null,
+ "layout": "IPY_MODEL_5562393293ea45c1972f520b5740cb08",
+ "max": 8656,
+ "min": 0,
+ "orientation": "horizontal",
+ "style": "IPY_MODEL_42199373c5e747b1a59973878319f8e5",
+ "value": 8656
+ }
+ },
+ "279032b33e64433d8c5ac7d7a1bf4b2b": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "HTMLModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "HTMLModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "HTMLView",
+ "description": "",
+ "description_tooltip": null,
+ "layout": "IPY_MODEL_48ba0bcad819498282222df452525e9e",
+ "placeholder": "",
+ "style": "IPY_MODEL_3f2265210736450d93657b7e2a6b2785",
+ "value": " 8656/8656 [00:00<00:00, 61417.89 examples/s]"
+ }
+ },
+ "a7f20c1db6014748b1c9d567b29bdb76": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "7f1157ebb5a04a4bb3c7b83df53fd206": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "1c54e6b541dc40038b3d176af7949ee2": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "DescriptionStyleModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "DescriptionStyleModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "StyleView",
+ "description_width": ""
+ }
+ },
+ "5562393293ea45c1972f520b5740cb08": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "42199373c5e747b1a59973878319f8e5": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "ProgressStyleModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "ProgressStyleModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "StyleView",
+ "bar_color": null,
+ "description_width": ""
+ }
+ },
+ "48ba0bcad819498282222df452525e9e": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "3f2265210736450d93657b7e2a6b2785": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "DescriptionStyleModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "DescriptionStyleModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "StyleView",
+ "description_width": ""
+ }
+ },
+ "cf7e01f9046d4c22962a648618ad5f7c": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "HBoxModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "HBoxModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "HBoxView",
+ "box_style": "",
+ "children": [
+ "IPY_MODEL_84c68e15eddf448198c54a22175a6d9f",
+ "IPY_MODEL_ab1cd082922948358849b31b0b692fe8",
+ "IPY_MODEL_5f39764fc13c4a7faf40d12323cfc576"
+ ],
+ "layout": "IPY_MODEL_24a43873ea4a4475aa032f163cc32822"
+ }
+ },
+ "84c68e15eddf448198c54a22175a6d9f": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "HTMLModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "HTMLModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "HTMLView",
+ "description": "",
+ "description_tooltip": null,
+ "layout": "IPY_MODEL_97bb8763995744c6afc3a93010f7bf26",
+ "placeholder": "",
+ "style": "IPY_MODEL_81b8562116614219b51c3dfa404f3684",
+ "value": "tokenizer_config.json: 100%"
+ }
+ },
+ "ab1cd082922948358849b31b0b692fe8": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "FloatProgressModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "FloatProgressModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "ProgressView",
+ "bar_style": "success",
+ "description": "",
+ "description_tooltip": null,
+ "layout": "IPY_MODEL_0458f04bba74415fb420e5f4e50dd80b",
+ "max": 9354,
+ "min": 0,
+ "orientation": "horizontal",
+ "style": "IPY_MODEL_71cc2397a4704f8486624917e47f8c99",
+ "value": 9354
+ }
+ },
+ "5f39764fc13c4a7faf40d12323cfc576": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "HTMLModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "HTMLModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "HTMLView",
+ "description": "",
+ "description_tooltip": null,
+ "layout": "IPY_MODEL_0a7c233068d5420e8fbe3a7bdc749825",
+ "placeholder": "",
+ "style": "IPY_MODEL_dcbb0e372cdd460b8284e3cce24437ef",
+ "value": " 9.35k/9.35k [00:00<00:00, 419kB/s]"
+ }
+ },
+ "24a43873ea4a4475aa032f163cc32822": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "97bb8763995744c6afc3a93010f7bf26": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "81b8562116614219b51c3dfa404f3684": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "DescriptionStyleModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "DescriptionStyleModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "StyleView",
+ "description_width": ""
+ }
+ },
+ "0458f04bba74415fb420e5f4e50dd80b": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "71cc2397a4704f8486624917e47f8c99": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "ProgressStyleModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "ProgressStyleModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "StyleView",
+ "bar_color": null,
+ "description_width": ""
+ }
+ },
+ "0a7c233068d5420e8fbe3a7bdc749825": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "dcbb0e372cdd460b8284e3cce24437ef": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "DescriptionStyleModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "DescriptionStyleModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "StyleView",
+ "description_width": ""
+ }
+ },
+ "37be9d87487f4a65bb3a553e054a9b9f": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "HBoxModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "HBoxModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "HBoxView",
+ "box_style": "",
+ "children": [
+ "IPY_MODEL_af62d0e253db43e4a5f8fc0399134e33",
+ "IPY_MODEL_45e6842e357d466b88547e967afbce15",
+ "IPY_MODEL_41caf3b8544243ee8080990bcc37f202"
+ ],
+ "layout": "IPY_MODEL_94fabb6c25b140b08dd87fec35836d17"
+ }
+ },
+ "af62d0e253db43e4a5f8fc0399134e33": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "HTMLModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "HTMLModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "HTMLView",
+ "description": "",
+ "description_tooltip": null,
+ "layout": "IPY_MODEL_4b615c1e58ed42238a6ebfefec23914b",
+ "placeholder": "",
+ "style": "IPY_MODEL_af2d34bfc6994559b9c524f7963a4623",
+ "value": "tokenizer.json: 100%"
+ }
+ },
+ "45e6842e357d466b88547e967afbce15": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "FloatProgressModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "FloatProgressModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "ProgressView",
+ "bar_style": "success",
+ "description": "",
+ "description_tooltip": null,
+ "layout": "IPY_MODEL_bdf850ca809641568d696016eb893909",
+ "max": 2117889,
+ "min": 0,
+ "orientation": "horizontal",
+ "style": "IPY_MODEL_3ee1870576a747ffa1c87688e45f3e73",
+ "value": 2117889
+ }
+ },
+ "41caf3b8544243ee8080990bcc37f202": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "HTMLModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "HTMLModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "HTMLView",
+ "description": "",
+ "description_tooltip": null,
+ "layout": "IPY_MODEL_c3b5bb9e533f4e39aff22756d9437f88",
+ "placeholder": "",
+ "style": "IPY_MODEL_891d8fe057e046f18654f34fe15f097f",
+ "value": " 2.12M/2.12M [00:04<00:00, 472kB/s]"
+ }
+ },
+ "94fabb6c25b140b08dd87fec35836d17": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "4b615c1e58ed42238a6ebfefec23914b": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "af2d34bfc6994559b9c524f7963a4623": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "DescriptionStyleModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "DescriptionStyleModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "StyleView",
+ "description_width": ""
+ }
+ },
+ "bdf850ca809641568d696016eb893909": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "3ee1870576a747ffa1c87688e45f3e73": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "ProgressStyleModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "ProgressStyleModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "StyleView",
+ "bar_color": null,
+ "description_width": ""
+ }
+ },
+ "c3b5bb9e533f4e39aff22756d9437f88": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "891d8fe057e046f18654f34fe15f097f": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "DescriptionStyleModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "DescriptionStyleModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "StyleView",
+ "description_width": ""
+ }
+ },
+ "2c3628d3032f43f1a5698b863422be9c": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "HBoxModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "HBoxModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "HBoxView",
+ "box_style": "",
+ "children": [
+ "IPY_MODEL_14a14a1fac1544cb921ef83b10dfad26",
+ "IPY_MODEL_9b726ac9cd324096a730c57a9e306db3",
+ "IPY_MODEL_01059ed672f942b3a11810fd7d990853"
+ ],
+ "layout": "IPY_MODEL_c14ef71f64a240ca913aafc077f3f4b4"
+ }
+ },
+ "14a14a1fac1544cb921ef83b10dfad26": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "HTMLModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "HTMLModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "HTMLView",
+ "description": "",
+ "description_tooltip": null,
+ "layout": "IPY_MODEL_87112b2495a648ca98145db2f05fd164",
+ "placeholder": "",
+ "style": "IPY_MODEL_0475ba7ffbe54055aecd6e0b62a41eea",
+ "value": "special_tokens_map.json: 100%"
+ }
+ },
+ "9b726ac9cd324096a730c57a9e306db3": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "FloatProgressModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "FloatProgressModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "ProgressView",
+ "bar_style": "success",
+ "description": "",
+ "description_tooltip": null,
+ "layout": "IPY_MODEL_c0240edf852948608aba0016c26fc1cc",
+ "max": 587,
+ "min": 0,
+ "orientation": "horizontal",
+ "style": "IPY_MODEL_332f7aafae624667896b6ae037033e65",
+ "value": 587
+ }
+ },
+ "01059ed672f942b3a11810fd7d990853": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "HTMLModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "HTMLModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "HTMLView",
+ "description": "",
+ "description_tooltip": null,
+ "layout": "IPY_MODEL_0ba5fc5f0fed4f2a92e570763fe9514c",
+ "placeholder": "",
+ "style": "IPY_MODEL_c571fd0656fc4a2292b0496b86f07a36",
+ "value": " 587/587 [00:00<00:00, 34.6kB/s]"
+ }
+ },
+ "c14ef71f64a240ca913aafc077f3f4b4": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "87112b2495a648ca98145db2f05fd164": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "0475ba7ffbe54055aecd6e0b62a41eea": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "DescriptionStyleModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "DescriptionStyleModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "StyleView",
+ "description_width": ""
+ }
+ },
+ "c0240edf852948608aba0016c26fc1cc": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "332f7aafae624667896b6ae037033e65": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "ProgressStyleModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "ProgressStyleModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "StyleView",
+ "bar_color": null,
+ "description_width": ""
+ }
+ },
+ "0ba5fc5f0fed4f2a92e570763fe9514c": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "c571fd0656fc4a2292b0496b86f07a36": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "DescriptionStyleModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "DescriptionStyleModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "StyleView",
+ "description_width": ""
+ }
+ },
+ "a0cb3fa115ef4c2e90618a9fd9249e9c": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "HBoxModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "HBoxModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "HBoxView",
+ "box_style": "",
+ "children": [
+ "IPY_MODEL_f293ba1eea304c43bdd509fe0cc8ec2d",
+ "IPY_MODEL_584d189f4dd142a2a7c3b918b1931317",
+ "IPY_MODEL_0fce315e9869484282dc65a57683326d"
+ ],
+ "layout": "IPY_MODEL_45c356d16449493fba9c25b6b2e1c98c"
+ }
+ },
+ "f293ba1eea304c43bdd509fe0cc8ec2d": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "HTMLModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "HTMLModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "HTMLView",
+ "description": "",
+ "description_tooltip": null,
+ "layout": "IPY_MODEL_9dc83ec606f74b95b830483b7b83e6ab",
+ "placeholder": "",
+ "style": "IPY_MODEL_d993a4247cb94b1db6df1d285566c8d2",
+ "value": "config.json: 100%"
+ }
+ },
+ "584d189f4dd142a2a7c3b918b1931317": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "FloatProgressModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "FloatProgressModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "ProgressView",
+ "bar_style": "success",
+ "description": "",
+ "description_tooltip": null,
+ "layout": "IPY_MODEL_d860e096167848d0b094c4bd0ba64736",
+ "max": 738,
+ "min": 0,
+ "orientation": "horizontal",
+ "style": "IPY_MODEL_f15be96d251b486798e6b14b40ae11ec",
+ "value": 738
+ }
+ },
+ "0fce315e9869484282dc65a57683326d": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "HTMLModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "HTMLModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "HTMLView",
+ "description": "",
+ "description_tooltip": null,
+ "layout": "IPY_MODEL_b6959704534e47f893acb1680f78de96",
+ "placeholder": "",
+ "style": "IPY_MODEL_1b8b35c3d62d48c49b1bbdfe3bbece99",
+ "value": " 738/738 [00:00<00:00, 46.0kB/s]"
+ }
+ },
+ "45c356d16449493fba9c25b6b2e1c98c": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "9dc83ec606f74b95b830483b7b83e6ab": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "d993a4247cb94b1db6df1d285566c8d2": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "DescriptionStyleModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "DescriptionStyleModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "StyleView",
+ "description_width": ""
+ }
+ },
+ "d860e096167848d0b094c4bd0ba64736": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "f15be96d251b486798e6b14b40ae11ec": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "ProgressStyleModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "ProgressStyleModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "StyleView",
+ "bar_color": null,
+ "description_width": ""
+ }
+ },
+ "b6959704534e47f893acb1680f78de96": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "1b8b35c3d62d48c49b1bbdfe3bbece99": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "DescriptionStyleModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "DescriptionStyleModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "StyleView",
+ "description_width": ""
+ }
+ },
+ "67185d66e50e4578bdabd94304bb673b": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "HBoxModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "HBoxModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "HBoxView",
+ "box_style": "",
+ "children": [
+ "IPY_MODEL_0c8f9ab0f09a4cb2be56c75597b38a0a",
+ "IPY_MODEL_9a3828a9c40e4daba6578feb3cb0a35b",
+ "IPY_MODEL_3f45fde4bd4545ffbdbd1ddbef2ce73e"
+ ],
+ "layout": "IPY_MODEL_4f82b90d6ca945bcb18dac112bc8db7a"
+ }
+ },
+ "0c8f9ab0f09a4cb2be56c75597b38a0a": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "HTMLModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "HTMLModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "HTMLView",
+ "description": "",
+ "description_tooltip": null,
+ "layout": "IPY_MODEL_12398d8c1ffb4d74bfdd994048680dd5",
+ "placeholder": "",
+ "style": "IPY_MODEL_0b0fc0706a9a4f72a20eb8f8eade3193",
+ "value": "model.safetensors.index.json: 100%"
+ }
+ },
+ "9a3828a9c40e4daba6578feb3cb0a35b": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "FloatProgressModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "FloatProgressModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "ProgressView",
+ "bar_style": "success",
+ "description": "",
+ "description_tooltip": null,
+ "layout": "IPY_MODEL_740d7936fe2e4bf48d4920a5382087d7",
+ "max": 29396,
+ "min": 0,
+ "orientation": "horizontal",
+ "style": "IPY_MODEL_b8776171b87e47e1a2212377ee796fdd",
+ "value": 29396
+ }
+ },
+ "3f45fde4bd4545ffbdbd1ddbef2ce73e": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "HTMLModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "HTMLModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "HTMLView",
+ "description": "",
+ "description_tooltip": null,
+ "layout": "IPY_MODEL_ce431e3b540c4b59ac4f8bcc5b7078b6",
+ "placeholder": "",
+ "style": "IPY_MODEL_b276a81e7a2b4e668381f920c11e8dc9",
+ "value": " 29.4k/29.4k [00:00<00:00, 1.69MB/s]"
+ }
+ },
+ "4f82b90d6ca945bcb18dac112bc8db7a": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "12398d8c1ffb4d74bfdd994048680dd5": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "0b0fc0706a9a4f72a20eb8f8eade3193": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "DescriptionStyleModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "DescriptionStyleModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "StyleView",
+ "description_width": ""
+ }
+ },
+ "740d7936fe2e4bf48d4920a5382087d7": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "b8776171b87e47e1a2212377ee796fdd": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "ProgressStyleModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "ProgressStyleModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "StyleView",
+ "bar_color": null,
+ "description_width": ""
+ }
+ },
+ "ce431e3b540c4b59ac4f8bcc5b7078b6": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "b276a81e7a2b4e668381f920c11e8dc9": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "DescriptionStyleModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "DescriptionStyleModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "StyleView",
+ "description_width": ""
+ }
+ },
+ "1562cb138c5a413c859a701ed5b70dba": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "HBoxModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "HBoxModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "HBoxView",
+ "box_style": "",
+ "children": [
+ "IPY_MODEL_ce568bd1899d4fe7abe491fef73e65a4",
+ "IPY_MODEL_161024aa2e3448e79ba1ba526d92a5ea",
+ "IPY_MODEL_150d10024dea40719982531fcf59d331"
+ ],
+ "layout": "IPY_MODEL_1ffd6a8ce6a94bdc93a0a380facb573e"
+ }
+ },
+ "ce568bd1899d4fe7abe491fef73e65a4": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "HTMLModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "HTMLModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "HTMLView",
+ "description": "",
+ "description_tooltip": null,
+ "layout": "IPY_MODEL_8cf991e531204a56a5af81ea2898f704",
+ "placeholder": "",
+ "style": "IPY_MODEL_c3360cc53a6e42d9af6e2262cf86d051",
+ "value": "Downloading shards: 100%"
+ }
+ },
+ "161024aa2e3448e79ba1ba526d92a5ea": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "FloatProgressModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "FloatProgressModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "ProgressView",
+ "bar_style": "success",
+ "description": "",
+ "description_tooltip": null,
+ "layout": "IPY_MODEL_c9eec2a0fc6b4edc9c19f231b055ec9b",
+ "max": 2,
+ "min": 0,
+ "orientation": "horizontal",
+ "style": "IPY_MODEL_44b44e629a0c43199ffa6eee0882c091",
+ "value": 2
+ }
+ },
+ "150d10024dea40719982531fcf59d331": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "HTMLModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "HTMLModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "HTMLView",
+ "description": "",
+ "description_tooltip": null,
+ "layout": "IPY_MODEL_74ba3634127e4b9185b25e48ba7ebe3a",
+ "placeholder": "",
+ "style": "IPY_MODEL_dbf30f5fe7214c129d324bdca133973a",
+ "value": " 2/2 [02:20<00:00, 60.52s/it]"
+ }
+ },
+ "1ffd6a8ce6a94bdc93a0a380facb573e": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "8cf991e531204a56a5af81ea2898f704": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "c3360cc53a6e42d9af6e2262cf86d051": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "DescriptionStyleModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "DescriptionStyleModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "StyleView",
+ "description_width": ""
+ }
+ },
+ "c9eec2a0fc6b4edc9c19f231b055ec9b": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "44b44e629a0c43199ffa6eee0882c091": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "ProgressStyleModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "ProgressStyleModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "StyleView",
+ "bar_color": null,
+ "description_width": ""
+ }
+ },
+ "74ba3634127e4b9185b25e48ba7ebe3a": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "dbf30f5fe7214c129d324bdca133973a": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "DescriptionStyleModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "DescriptionStyleModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "StyleView",
+ "description_width": ""
+ }
+ },
+ "0631ef1ac59a40dcb194ea0bf2ba94b6": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "HBoxModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "HBoxModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "HBoxView",
+ "box_style": "",
+ "children": [
+ "IPY_MODEL_fcfd184cac4a465cbd14acc875e0aae2",
+ "IPY_MODEL_8b3ee7c84008414797145b48495f4b5a",
+ "IPY_MODEL_5107bfef46f54ed497b67cd94a714487"
+ ],
+ "layout": "IPY_MODEL_d500ad0d5e7b40d8896ce43379326591"
+ }
+ },
+ "fcfd184cac4a465cbd14acc875e0aae2": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "HTMLModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "HTMLModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "HTMLView",
+ "description": "",
+ "description_tooltip": null,
+ "layout": "IPY_MODEL_5ab9e4d9c0b44b8b9a840237e2c01aa3",
+ "placeholder": "",
+ "style": "IPY_MODEL_ffbe40c06c804f18ba8c0558ff9438ba",
+ "value": "model-00001-of-00002.safetensors: 100%"
+ }
+ },
+ "8b3ee7c84008414797145b48495f4b5a": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "FloatProgressModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "FloatProgressModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "ProgressView",
+ "bar_style": "success",
+ "description": "",
+ "description_tooltip": null,
+ "layout": "IPY_MODEL_fdbc178bbc134dbbb10a4b023db47fb5",
+ "max": 4980712216,
+ "min": 0,
+ "orientation": "horizontal",
+ "style": "IPY_MODEL_41bd2e1851684ba0927297ee3319c50a",
+ "value": 4980712216
+ }
+ },
+ "5107bfef46f54ed497b67cd94a714487": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "HTMLModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "HTMLModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "HTMLView",
+ "description": "",
+ "description_tooltip": null,
+ "layout": "IPY_MODEL_20f84060e82842ae96702084c1f8a82b",
+ "placeholder": "",
+ "style": "IPY_MODEL_61a698c2dcba4f07a814ac567d4bc256",
+ "value": " 4.98G/4.98G [02:03<00:00, 42.0MB/s]"
+ }
+ },
+ "d500ad0d5e7b40d8896ce43379326591": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "5ab9e4d9c0b44b8b9a840237e2c01aa3": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "ffbe40c06c804f18ba8c0558ff9438ba": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "DescriptionStyleModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "DescriptionStyleModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "StyleView",
+ "description_width": ""
+ }
+ },
+ "fdbc178bbc134dbbb10a4b023db47fb5": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "41bd2e1851684ba0927297ee3319c50a": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "ProgressStyleModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "ProgressStyleModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "StyleView",
+ "bar_color": null,
+ "description_width": ""
+ }
+ },
+ "20f84060e82842ae96702084c1f8a82b": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "61a698c2dcba4f07a814ac567d4bc256": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "DescriptionStyleModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "DescriptionStyleModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "StyleView",
+ "description_width": ""
+ }
+ },
+ "252f7db506bb41ec986f88ea4d5d4d36": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "HBoxModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "HBoxModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "HBoxView",
+ "box_style": "",
+ "children": [
+ "IPY_MODEL_87b052bf69844867919c0d1de6754046",
+ "IPY_MODEL_ab236cd071364387b3ed3ea97c8e3b4d",
+ "IPY_MODEL_b3a1e5e7bad542f3974e4e067ed76640"
+ ],
+ "layout": "IPY_MODEL_168fac509c8b4b3c9b03e7ee13f8dd52"
+ }
+ },
+ "87b052bf69844867919c0d1de6754046": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "HTMLModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "HTMLModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "HTMLView",
+ "description": "",
+ "description_tooltip": null,
+ "layout": "IPY_MODEL_b32729d9635e406884a8345ce61ad536",
+ "placeholder": "",
+ "style": "IPY_MODEL_a9d45e528eb243ba81124e8641812001",
+ "value": "model-00002-of-00002.safetensors: 100%"
+ }
+ },
+ "ab236cd071364387b3ed3ea97c8e3b4d": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "FloatProgressModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "FloatProgressModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "ProgressView",
+ "bar_style": "success",
+ "description": "",
+ "description_tooltip": null,
+ "layout": "IPY_MODEL_7c99dc6dd7834c7b9c7b96d9e690b49f",
+ "max": 610215224,
+ "min": 0,
+ "orientation": "horizontal",
+ "style": "IPY_MODEL_7ad156904fc54b3187dd7fa260ee40dc",
+ "value": 610215224
+ }
+ },
+ "b3a1e5e7bad542f3974e4e067ed76640": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "HTMLModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "HTMLModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "HTMLView",
+ "description": "",
+ "description_tooltip": null,
+ "layout": "IPY_MODEL_6b4d66c9cc3c4285b24e114fc7a0c5cc",
+ "placeholder": "",
+ "style": "IPY_MODEL_016f278e55e9413e87687c59f27f77dc",
+ "value": " 610M/610M [00:15<00:00, 41.9MB/s]"
+ }
+ },
+ "168fac509c8b4b3c9b03e7ee13f8dd52": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "b32729d9635e406884a8345ce61ad536": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "a9d45e528eb243ba81124e8641812001": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "DescriptionStyleModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "DescriptionStyleModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "StyleView",
+ "description_width": ""
+ }
+ },
+ "7c99dc6dd7834c7b9c7b96d9e690b49f": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "7ad156904fc54b3187dd7fa260ee40dc": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "ProgressStyleModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "ProgressStyleModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "StyleView",
+ "bar_color": null,
+ "description_width": ""
+ }
+ },
+ "6b4d66c9cc3c4285b24e114fc7a0c5cc": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "016f278e55e9413e87687c59f27f77dc": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "DescriptionStyleModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "DescriptionStyleModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "StyleView",
+ "description_width": ""
+ }
+ },
+ "13ccf5e5dd704b958a4b1d81d83bbe45": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "HBoxModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "HBoxModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "HBoxView",
+ "box_style": "",
+ "children": [
+ "IPY_MODEL_c47fe8ba1d674cd4b089230ac211ed1a",
+ "IPY_MODEL_c18447aa88b8466aada1604f62a1e193",
+ "IPY_MODEL_5b332bce2ee14a499e7867fe8f429b2d"
+ ],
+ "layout": "IPY_MODEL_043bf4419e49410cbe5fbcc103b4a17c"
+ }
+ },
+ "c47fe8ba1d674cd4b089230ac211ed1a": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "HTMLModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "HTMLModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "HTMLView",
+ "description": "",
+ "description_tooltip": null,
+ "layout": "IPY_MODEL_36a72fe07d434fd289844abe34a56bb8",
+ "placeholder": "",
+ "style": "IPY_MODEL_52d85fbff5474c4cb25b28cb55a194a6",
+ "value": "Loading checkpoint shards: 100%"
+ }
+ },
+ "c18447aa88b8466aada1604f62a1e193": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "FloatProgressModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "FloatProgressModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "ProgressView",
+ "bar_style": "success",
+ "description": "",
+ "description_tooltip": null,
+ "layout": "IPY_MODEL_ba99479495564a5b9b3693a395828784",
+ "max": 2,
+ "min": 0,
+ "orientation": "horizontal",
+ "style": "IPY_MODEL_7e712c6fb44445a987c858bd8bdd347b",
+ "value": 2
+ }
+ },
+ "5b332bce2ee14a499e7867fe8f429b2d": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "HTMLModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "HTMLModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "HTMLView",
+ "description": "",
+ "description_tooltip": null,
+ "layout": "IPY_MODEL_383aa217c6a848e191b421cc4a0346bf",
+ "placeholder": "",
+ "style": "IPY_MODEL_538ef4577808453d8f3e6f6edc36ee1c",
+ "value": " 2/2 [00:27<00:00, 11.83s/it]"
+ }
+ },
+ "043bf4419e49410cbe5fbcc103b4a17c": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "36a72fe07d434fd289844abe34a56bb8": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "52d85fbff5474c4cb25b28cb55a194a6": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "DescriptionStyleModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "DescriptionStyleModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "StyleView",
+ "description_width": ""
+ }
+ },
+ "ba99479495564a5b9b3693a395828784": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "7e712c6fb44445a987c858bd8bdd347b": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "ProgressStyleModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "ProgressStyleModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "StyleView",
+ "bar_color": null,
+ "description_width": ""
+ }
+ },
+ "383aa217c6a848e191b421cc4a0346bf": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "538ef4577808453d8f3e6f6edc36ee1c": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "DescriptionStyleModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "DescriptionStyleModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "StyleView",
+ "description_width": ""
+ }
+ },
+ "ffc624464e7f44ca9950e17570e70a99": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "HBoxModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "HBoxModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "HBoxView",
+ "box_style": "",
+ "children": [
+ "IPY_MODEL_60d4de86cf364df0935b5e1f19b2c6be",
+ "IPY_MODEL_f7dc91d8904946a780e86ce4f0f4d5ed",
+ "IPY_MODEL_dab01d139ae243cfa0389c5079ed3bfe"
+ ],
+ "layout": "IPY_MODEL_2ae8c5f6175c493cbc8e96552705ba37"
+ }
+ },
+ "60d4de86cf364df0935b5e1f19b2c6be": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "HTMLModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "HTMLModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "HTMLView",
+ "description": "",
+ "description_tooltip": null,
+ "layout": "IPY_MODEL_4a9cdbfe12ac45be984b3a8f73d29dc1",
+ "placeholder": "",
+ "style": "IPY_MODEL_c84f0d47fd3942be964ca7010f13c348",
+ "value": "generation_config.json: 100%"
+ }
+ },
+ "f7dc91d8904946a780e86ce4f0f4d5ed": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "FloatProgressModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "FloatProgressModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "ProgressView",
+ "bar_style": "success",
+ "description": "",
+ "description_tooltip": null,
+ "layout": "IPY_MODEL_eac19f45ccb54329b42bbcb19a1f2fd4",
+ "max": 132,
+ "min": 0,
+ "orientation": "horizontal",
+ "style": "IPY_MODEL_5f353fa6b6f54b5ba9428ce4d8f3f1be",
+ "value": 132
+ }
+ },
+ "dab01d139ae243cfa0389c5079ed3bfe": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "HTMLModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "HTMLModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "HTMLView",
+ "description": "",
+ "description_tooltip": null,
+ "layout": "IPY_MODEL_6465f64833024879b6ca055ceed6ed9d",
+ "placeholder": "",
+ "style": "IPY_MODEL_281ea8998cbf40ee855310d991e979b8",
+ "value": " 132/132 [00:00<00:00, 9.49kB/s]"
+ }
+ },
+ "2ae8c5f6175c493cbc8e96552705ba37": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "4a9cdbfe12ac45be984b3a8f73d29dc1": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "c84f0d47fd3942be964ca7010f13c348": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "DescriptionStyleModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "DescriptionStyleModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "StyleView",
+ "description_width": ""
+ }
+ },
+ "eac19f45ccb54329b42bbcb19a1f2fd4": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "5f353fa6b6f54b5ba9428ce4d8f3f1be": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "ProgressStyleModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "ProgressStyleModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "StyleView",
+ "bar_color": null,
+ "description_width": ""
+ }
+ },
+ "6465f64833024879b6ca055ceed6ed9d": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "281ea8998cbf40ee855310d991e979b8": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "DescriptionStyleModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "DescriptionStyleModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "StyleView",
+ "description_width": ""
+ }
+ },
+ "780c1ae797ee48cb97e2530eb2a8a49f": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "HBoxModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "HBoxModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "HBoxView",
+ "box_style": "",
+ "children": [
+ "IPY_MODEL_651fc5f1f3384c77a96380a2e35a9ac4",
+ "IPY_MODEL_9a37ef338ef74693ba6547b246e432a3",
+ "IPY_MODEL_1ef299925fa7408a9374be0b740a9e95"
+ ],
+ "layout": "IPY_MODEL_ff9bfd5baa2e496dbe4d8c2a7cad3b93"
+ }
+ },
+ "651fc5f1f3384c77a96380a2e35a9ac4": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "HTMLModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "HTMLModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "HTMLView",
+ "description": "",
+ "description_tooltip": null,
+ "layout": "IPY_MODEL_35597aaf146943999889a889041a2363",
+ "placeholder": "",
+ "style": "IPY_MODEL_396417cb735d4e879e3592274563377d",
+ "value": "Map: 100%"
+ }
+ },
+ "9a37ef338ef74693ba6547b246e432a3": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "FloatProgressModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "FloatProgressModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "ProgressView",
+ "bar_style": "success",
+ "description": "",
+ "description_tooltip": null,
+ "layout": "IPY_MODEL_920d3a1046604736a4adea3d06c91c46",
+ "max": 8569,
+ "min": 0,
+ "orientation": "horizontal",
+ "style": "IPY_MODEL_38f10f50c1de4041a647c36051439196",
+ "value": 8569
+ }
+ },
+ "1ef299925fa7408a9374be0b740a9e95": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "HTMLModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "HTMLModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "HTMLView",
+ "description": "",
+ "description_tooltip": null,
+ "layout": "IPY_MODEL_bd73e52a62554625a6ffa35de8b1fcb4",
+ "placeholder": "",
+ "style": "IPY_MODEL_b2bf77031dbb4704a7c5db2092e96b79",
+ "value": " 8569/8569 [00:10<00:00, 614.96 examples/s]"
+ }
+ },
+ "ff9bfd5baa2e496dbe4d8c2a7cad3b93": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "35597aaf146943999889a889041a2363": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "396417cb735d4e879e3592274563377d": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "DescriptionStyleModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "DescriptionStyleModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "StyleView",
+ "description_width": ""
+ }
+ },
+ "920d3a1046604736a4adea3d06c91c46": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "38f10f50c1de4041a647c36051439196": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "ProgressStyleModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "ProgressStyleModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "StyleView",
+ "bar_color": null,
+ "description_width": ""
+ }
+ },
+ "bd73e52a62554625a6ffa35de8b1fcb4": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "b2bf77031dbb4704a7c5db2092e96b79": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "DescriptionStyleModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "DescriptionStyleModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "StyleView",
+ "description_width": ""
+ }
+ },
+ "b412f8a8fba5467cb11facd8ec1aedf4": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "HBoxModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "HBoxModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "HBoxView",
+ "box_style": "",
+ "children": [
+ "IPY_MODEL_844556f6f4f5414f8cb94a05ba81e5f3",
+ "IPY_MODEL_16402df70c754eacacf0e2c75790248b",
+ "IPY_MODEL_9923bcd6780044cbb60d110320cb3fa3"
+ ],
+ "layout": "IPY_MODEL_35761e009c8d4882b6a2fb40c363f372"
+ }
+ },
+ "844556f6f4f5414f8cb94a05ba81e5f3": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "HTMLModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "HTMLModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "HTMLView",
+ "description": "",
+ "description_tooltip": null,
+ "layout": "IPY_MODEL_897879b0d7dd44498eb3dd9b882e943c",
+ "placeholder": "",
+ "style": "IPY_MODEL_c59dbd844df0496b811ff3793d4827c6",
+ "value": "Map: 100%"
+ }
+ },
+ "16402df70c754eacacf0e2c75790248b": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "FloatProgressModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "FloatProgressModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "ProgressView",
+ "bar_style": "success",
+ "description": "",
+ "description_tooltip": null,
+ "layout": "IPY_MODEL_4ab4dd1eb03547bc9631ea18caf21881",
+ "max": 87,
+ "min": 0,
+ "orientation": "horizontal",
+ "style": "IPY_MODEL_6fff8b423cb84d03b68049989a4f1174",
+ "value": 87
+ }
+ },
+ "9923bcd6780044cbb60d110320cb3fa3": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "HTMLModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_dom_classes": [],
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "HTMLModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/controls",
+ "_view_module_version": "1.5.0",
+ "_view_name": "HTMLView",
+ "description": "",
+ "description_tooltip": null,
+ "layout": "IPY_MODEL_376c9b894ccb4c8aa00e06adba02ad9a",
+ "placeholder": "",
+ "style": "IPY_MODEL_c65ff75932ad45ffb417949562c68332",
+ "value": " 87/87 [00:00<00:00, 392.42 examples/s]"
+ }
+ },
+ "35761e009c8d4882b6a2fb40c363f372": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "897879b0d7dd44498eb3dd9b882e943c": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "c59dbd844df0496b811ff3793d4827c6": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "DescriptionStyleModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "DescriptionStyleModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "StyleView",
+ "description_width": ""
+ }
+ },
+ "4ab4dd1eb03547bc9631ea18caf21881": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "6fff8b423cb84d03b68049989a4f1174": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "ProgressStyleModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "ProgressStyleModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "StyleView",
+ "bar_color": null,
+ "description_width": ""
+ }
+ },
+ "376c9b894ccb4c8aa00e06adba02ad9a": {
+ "model_module": "@jupyter-widgets/base",
+ "model_name": "LayoutModel",
+ "model_module_version": "1.2.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/base",
+ "_model_module_version": "1.2.0",
+ "_model_name": "LayoutModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "LayoutView",
+ "align_content": null,
+ "align_items": null,
+ "align_self": null,
+ "border": null,
+ "bottom": null,
+ "display": null,
+ "flex": null,
+ "flex_flow": null,
+ "grid_area": null,
+ "grid_auto_columns": null,
+ "grid_auto_flow": null,
+ "grid_auto_rows": null,
+ "grid_column": null,
+ "grid_gap": null,
+ "grid_row": null,
+ "grid_template_areas": null,
+ "grid_template_columns": null,
+ "grid_template_rows": null,
+ "height": null,
+ "justify_content": null,
+ "justify_items": null,
+ "left": null,
+ "margin": null,
+ "max_height": null,
+ "max_width": null,
+ "min_height": null,
+ "min_width": null,
+ "object_fit": null,
+ "object_position": null,
+ "order": null,
+ "overflow": null,
+ "overflow_x": null,
+ "overflow_y": null,
+ "padding": null,
+ "right": null,
+ "top": null,
+ "visibility": null,
+ "width": null
+ }
+ },
+ "c65ff75932ad45ffb417949562c68332": {
+ "model_module": "@jupyter-widgets/controls",
+ "model_name": "DescriptionStyleModel",
+ "model_module_version": "1.5.0",
+ "state": {
+ "_model_module": "@jupyter-widgets/controls",
+ "_model_module_version": "1.5.0",
+ "_model_name": "DescriptionStyleModel",
+ "_view_count": null,
+ "_view_module": "@jupyter-widgets/base",
+ "_view_module_version": "1.2.0",
+ "_view_name": "StyleView",
+ "description_width": ""
+ }
+ }
+ }
+ }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 0
+}
\ No newline at end of file