{ "cells": [ { "cell_type": "code", "execution_count": 13, "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "8_v2Zzbc_WRt", "outputId": "50b46b10-01f9-4ed7-8278-3413f87bd7c6" }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "Requirement already satisfied: datasets in /usr/local/lib/python3.10/dist-packages (2.20.0)\n", "Requirement already satisfied: filelock in /usr/local/lib/python3.10/dist-packages (from datasets) (3.15.1)\n", "Requirement already satisfied: numpy>=1.17 in /usr/local/lib/python3.10/dist-packages (from datasets) (1.25.2)\n", "Requirement already satisfied: pyarrow>=15.0.0 in /usr/local/lib/python3.10/dist-packages (from datasets) (16.1.0)\n", "Requirement already satisfied: pyarrow-hotfix in /usr/local/lib/python3.10/dist-packages (from datasets) (0.6)\n", "Requirement already satisfied: dill<0.3.9,>=0.3.0 in /usr/local/lib/python3.10/dist-packages (from datasets) (0.3.8)\n", "Requirement already satisfied: pandas in /usr/local/lib/python3.10/dist-packages (from datasets) (2.0.3)\n", "Requirement already satisfied: requests>=2.32.2 in /usr/local/lib/python3.10/dist-packages (from datasets) (2.32.3)\n", "Requirement already satisfied: tqdm>=4.66.3 in /usr/local/lib/python3.10/dist-packages (from datasets) (4.66.4)\n", "Requirement already satisfied: xxhash in /usr/local/lib/python3.10/dist-packages (from datasets) (3.4.1)\n", "Requirement already satisfied: multiprocess in /usr/local/lib/python3.10/dist-packages (from datasets) (0.70.16)\n", "Requirement already satisfied: fsspec[http]<=2024.5.0,>=2023.1.0 in /usr/local/lib/python3.10/dist-packages (from datasets) (2023.6.0)\n", "Requirement already satisfied: aiohttp in /usr/local/lib/python3.10/dist-packages (from datasets) (3.9.5)\n", "Requirement already satisfied: huggingface-hub>=0.21.2 in /usr/local/lib/python3.10/dist-packages (from datasets) (0.23.4)\n", "Requirement already satisfied: packaging in /usr/local/lib/python3.10/dist-packages (from datasets) (24.1)\n", "Requirement already satisfied: pyyaml>=5.1 in /usr/local/lib/python3.10/dist-packages (from datasets) (6.0.1)\n", "Requirement already satisfied: aiosignal>=1.1.2 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets) (1.3.1)\n", "Requirement already satisfied: attrs>=17.3.0 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets) (23.2.0)\n", "Requirement already satisfied: frozenlist>=1.1.1 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets) (1.4.1)\n", "Requirement already satisfied: multidict<7.0,>=4.5 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets) (6.0.5)\n", "Requirement already satisfied: yarl<2.0,>=1.0 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets) (1.9.4)\n", "Requirement already satisfied: async-timeout<5.0,>=4.0 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets) (4.0.3)\n", "Requirement already satisfied: typing-extensions>=3.7.4.3 in /usr/local/lib/python3.10/dist-packages (from huggingface-hub>=0.21.2->datasets) (4.12.2)\n", "Requirement already satisfied: charset-normalizer<4,>=2 in /usr/local/lib/python3.10/dist-packages (from requests>=2.32.2->datasets) (3.3.2)\n", "Requirement already satisfied: idna<4,>=2.5 in /usr/local/lib/python3.10/dist-packages (from requests>=2.32.2->datasets) (3.7)\n", "Requirement already satisfied: urllib3<3,>=1.21.1 in /usr/local/lib/python3.10/dist-packages (from requests>=2.32.2->datasets) (2.0.7)\n", "Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.10/dist-packages (from requests>=2.32.2->datasets) (2024.6.2)\n", "Requirement already satisfied: python-dateutil>=2.8.2 in /usr/local/lib/python3.10/dist-packages (from pandas->datasets) (2.8.2)\n", "Requirement already satisfied: pytz>=2020.1 in /usr/local/lib/python3.10/dist-packages (from pandas->datasets) (2023.4)\n", "Requirement already satisfied: tzdata>=2022.1 in /usr/local/lib/python3.10/dist-packages (from pandas->datasets) (2024.1)\n", "Requirement already satisfied: six>=1.5 in /usr/local/lib/python3.10/dist-packages (from python-dateutil>=2.8.2->pandas->datasets) (1.16.0)\n" ] } ], "source": [ "!pip install datasets" ] }, { "cell_type": "code", "execution_count": 1, "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "_q2UKXTofuvg", "outputId": "288815a8-fe8f-4ff4-e274-02d0a0542284" }, "outputs": [ { "data": { "text/plain": [ "{'a': 0,\n", " 'b': 1,\n", " 'c': 2,\n", " 'd': 3,\n", " 'e': 4,\n", " 'f': 5,\n", " 'g': 6,\n", " 'h': 7,\n", " 'i': 8,\n", " 'j': 9,\n", " 'k': 10,\n", " 'l': 11,\n", " 'm': 12,\n", " 'n': 13,\n", " 'o': 14,\n", " 'p': 15,\n", " 'q': 16,\n", " 'r': 17,\n", " 's': 18,\n", " 't': 19,\n", " 'u': 20,\n", " 'v': 21,\n", " 'w': 22,\n", " 'x': 23,\n", " 'y': 24,\n", " 'z': 25}" ] }, "execution_count": 1, "metadata": {}, "output_type": "execute_result" } ], "source": [ "import torch\n", "import torch.nn as nn\n", "import torch.nn.functional as F\n", "import string\n", "\n", "# 定义字典\n", "char2indx = {s: i for i, s in enumerate(string.ascii_lowercase)}\n", "char2indx" ] }, { "cell_type": "code", "execution_count": 2, "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "nfJTv6htym9a", "outputId": "f8aa88cb-e100-4737-a5ba-e02aa099fc5c" }, "outputs": [ { "data": { "text/plain": [ "tensor([11, 14, 21, 4])" ] }, "execution_count": 2, "metadata": {}, "output_type": "execute_result" } ], "source": [ "example = 'love'\n", "idx = []\n", "\n", "for i in example:\n", " idx.append(char2indx[i])\n", "\n", "idx = torch.tensor(idx)\n", "idx" ] }, { "cell_type": "code", "execution_count": 3, "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "QQPzr1v3y8k4", "outputId": "056054db-d375-46f4-d838-9dfa34b21483" }, "outputs": [ { "data": { "text/plain": [ "(tensor([[0., 0., 0., 0., 0., 0., 0., 0., 0., 0., 0., 1., 0., 0., 0., 0., 0., 0.,\n", " 0., 0., 0., 0., 0., 0., 0., 0.],\n", " [0., 0., 0., 0., 0., 0., 0., 0., 0., 0., 0., 0., 0., 0., 1., 0., 0., 0.,\n", " 0., 0., 0., 0., 0., 0., 0., 0.],\n", " [0., 0., 0., 0., 0., 0., 0., 0., 0., 0., 0., 0., 0., 0., 0., 0., 0., 0.,\n", " 0., 0., 0., 1., 0., 0., 0., 0.],\n", " [0., 0., 0., 0., 1., 0., 0., 0., 0., 0., 0., 0., 0., 0., 0., 0., 0., 0.,\n", " 0., 0., 0., 0., 0., 0., 0., 0.]]),\n", " torch.Size([4, 26]))" ] }, "execution_count": 3, "metadata": {}, "output_type": "execute_result" } ], "source": [ "# 使用独热编码,将文本转换为二维张量\n", "num_claz = len(char2indx.keys())\n", "x = F.one_hot(idx, num_classes=num_claz).float()\n", "x, x.shape" ] }, { "cell_type": "code", "execution_count": 6, "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "XLFzlIiPzlFP", "outputId": "001f5b4c-cd25-4e37-9503-b515b27f6271" }, "outputs": [ { "data": { "text/plain": [ "(tensor([[ 0.3965, -0.3958, -1.2064, -0.6724, -0.4768],\n", " [ 0.9620, 0.5876, 0.8376, -0.4350, -0.3379],\n", " [-2.5578, -0.0305, -0.2124, -0.5916, 0.1987],\n", " [-0.0834, 0.4715, 1.7552, -0.3915, 1.9801]]),\n", " torch.Size([4, 5]))" ] }, "execution_count": 6, "metadata": {}, "output_type": "execute_result" } ], "source": [ "dims = 5\n", "num_claz = len(char2indx.keys())\n", "x = F.one_hot(idx, num_classes=num_claz).float()\n", "w = torch.randn(num_claz, dims)\n", "(x @ w), (x @ w).shape" ] }, { "cell_type": "code", "execution_count": 7, "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "fI9sMtsr0FxX", "outputId": "bf610d5d-a303-48ce-ad3b-b669aab8e166" }, "outputs": [ { "data": { "text/plain": [ "(tensor([[ 0.3965, -0.3958, -1.2064, -0.6724, -0.4768],\n", " [ 0.9620, 0.5876, 0.8376, -0.4350, -0.3379],\n", " [-2.5578, -0.0305, -0.2124, -0.5916, 0.1987],\n", " [-0.0834, 0.4715, 1.7552, -0.3915, 1.9801]]),\n", " torch.Size([4, 5]))" ] }, "execution_count": 7, "metadata": {}, "output_type": "execute_result" } ], "source": [ "w[idx], w[idx].shape" ] }, { "cell_type": "code", "execution_count": 8, "metadata": { "id": "MXIyfigQ0aL0" }, "outputs": [], "source": [ "class Embedding:\n", "\n", " def __init__(self, num_embeddings, embedding_dims):\n", " self.weight = torch.randn((num_embeddings, embedding_dims), requires_grad=True)\n", "\n", " def __call__(self, x):\n", " self.out = self.weight[x]\n", " return self.out\n", "\n", " def parameters(self):\n", " return [self.weight]" ] }, { "cell_type": "code", "execution_count": 9, "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "np2OATD71FOo", "outputId": "363f16ce-13cc-4e67-a6e3-675d40df60ec" }, "outputs": [ { "data": { "text/plain": [ "torch.Size([10, 5])" ] }, "execution_count": 9, "metadata": {}, "output_type": "execute_result" } ], "source": [ "em = Embedding(num_claz, 5)\n", "x = torch.randint(0, num_claz, (10, ))\n", "em(x).shape" ] }, { "cell_type": "code", "execution_count": 10, "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "5IYT4WkO1YPG", "outputId": "e7c2ac1e-777a-442b-9037-00f2583e9f78" }, "outputs": [ { "data": { "text/plain": [ "torch.Size([20, 10, 5])" ] }, "execution_count": 10, "metadata": {}, "output_type": "execute_result" } ], "source": [ "x = torch.randint(0, num_claz, (20, 10))\n", "em(x).shape" ] }, { "cell_type": "code", "execution_count": 11, "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "s12aaPrT1ijj", "outputId": "3cccacd6-9e3f-4288-8df0-9a0df443ba70" }, "outputs": [ { "data": { "text/plain": [ "True" ] }, "execution_count": 11, "metadata": {}, "output_type": "execute_result" } ], "source": [ "torch.cuda.is_available()" ] }, { "cell_type": "code", "execution_count": 12, "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "Qu238sYE_Gq_", "outputId": "4662e23b-3bc4-4140-d28b-e5f622559212" }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "_CudaDeviceProperties(name='Tesla T4', major=7, minor=5, total_memory=15102MB, multi_processor_count=40)\n" ] } ], "source": [ "for i in range(torch.cuda.device_count()):\n", " print(torch.cuda.get_device_properties(i))" ] }, { "cell_type": "code", "execution_count": 14, "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "K0acVkVI_P14", "outputId": "31d1785f-9c74-4b61-f355-4591b957bdfc" }, "outputs": [ { "data": { "text/plain": [ "" ] }, "execution_count": 14, "metadata": {}, "output_type": "execute_result" } ], "source": [ "import torch.optim as optim\n", "from torch.utils.data import DataLoader\n", "from datasets import load_dataset\n", "import matplotlib.pyplot as plt\n", "\n", "torch.manual_seed(12046)" ] }, { "cell_type": "code", "execution_count": 48, "metadata": { "id": "O7eABnOnJBXy" }, "outputs": [], "source": [ "device = 'cuda' if torch.cuda.is_available else 'cpu'\n", "batch_size = 1000\n", "learning_rate = 0.01\n", "eval_iters = 10" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "感谢Wanghaha(xufengnian-bei)的贡献,如果在下载过程中遇到网络问题,请使用下面的步骤进行处理。\n", "\n", "* 访问 Hugging Face 数据集页面: https://huggingface.co/datasets/code_search_net\n", "* 在页面上找到 \"Files and versions\" 部分。\n", "* 点击data文件夹,下载对应的python.zip\n", "\n", "修改对应下载文件代码:\n", "\n", "datasets = load_dataset('json', data_files='data/python/python/final/jsonl/train/*.jsonl.gz') # 更换为自己的目录\n", "datasets = datasets['train'].filter(lambda x: 'apache/spark' in x['repo']) # 这里repository_name 更换为 repo\n", "\n", "print(datasets[8]['original_string']) # whole_func_string 更换为 original_string" ] }, { "cell_type": "code", "execution_count": 15, "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 440, "referenced_widgets": [ "2bed0a97406e46b9bf1c07e66be77dd5", "0dc5926e3ba0499a918a1c3cbfe862f3", "b704286c3f2c4fa7bcbbc6e6d4b57fb6", "49c33407cf8649bd95f63cf1ee22751b", "e62ac2ea2f8448ee8232dd70eb9850d8", "e2feea769fc14391bb944122c2e808e1", "5cb0d5f4438749eb9f24fe4aa50ab6b7", "a245080a91284641900af30ffbb70577", "1b5de35016af4f5686c1a09c3bcf88cd", "f5b190ba8db74c789b25bf8869d44f6b", "5a4d6fbda05e45f4b78368d4f02c6c38", "7dd2552a36ca4819a20c96cdbeed3e36", "26dfd6520e8049038e69114766b9a0ff", "bbbd5b6f8f44455faf0a031466b2702f", "6c6403ef2e0f482599d0e54d58481f39", "b35467fc4f9041fd9ce882eecd2a6021", "a60bb837834b44378e178e4d9b1a52d4", "b70d024a38864d6bb557bff17ae95d88", "50b76f3d1f3b4bebab396b6bca23e48b", "5d410efac6014533bc1ba839a05d0aaa", "c5453de040db461dae54c65cfadb8d39", "b0f0fc0e102a4acc995a8cc1641074d9", "7ab21750b1a0415d80f9f6f5aea4c13d", "8ef34aff5e9f4096add539f7f6ae29f2", "25e19856014d44c9b762cd7a1f8dc319", "5504bb59eb6e47f79d3b91d42db65911", "bab3bf9895a04dfdbdc76dc642311197", "a3cda732dbfb4a2f9768203548af20f5", "77efb896627947cfa3bdf21f9414cb8a", "4ab8ec295f644193b088d95a3a9b3ec5", "3298fe74f69146bbbbe364c2c4fe5332", "3c5b9b565db14586a40a4a8e54ebe7d3", "89502573192842bd8070a3d3120da01b", "4cbe13efb5dc40b0a7eebd9f7defffc6", "b9b6cf9874544468879f3302cbafdd0f", "09da2bb790a54c179f481d531d3405eb", "d5965607686242799233b3d462319eed", "2387b751d5d6472d8d8f8e7c030338af", "3f3463f177334349836d9cdc25fea796", "142b9dcdc4514ea684c2d0522746e0af", "179ba1b4b8b24b9eadc81a645ed702c8", "1d61f57335364ca0b02a0bd32b56fec6", "6b7f47c502144cafb10942d2f1987e78", "00bb3ff456444b0397816f21490a90f2", "afeb10d4301f44ae9728fc2ef77291a2", "df2c621d9afd438482ea96e8803d56c7", "d312591650f940e797746320007f3ef2", "57706c85ad7a44f4927b7f4e9c6fca75", "6f9585f9022c4360bcc6b5610b33600a", "f492252b9930497fb55837093a9d130f", "94bfa0c5b77e4bd2b17ff94739b457fe", "7d7c7114ff6041e7ae8b48624bba47fa", "08ac8d7ac893490f8cd625568cf4e5d1", "827d8054dfaa49edb71192929b9d6495", "80e437bb9dab47b6b0f4892a21847349", "f402ab9afaa24efda0494e78ba44b3cb", "d35c100aed8743efa1b0df5a7e89308c", "869716edc1fe4dcc99a8880d9033f773", "7c25ae55118e4ec7ae7bffc25a0ae43e", "4d2392c4d43142ca9b8d01b7b2ebb5fd", "81a506124060495d9dc6b59eba2e2490", "2c794c7d98024cbdb38a1ec3e5ccb31a", "3742bf06e2f540fb9d8786d7d2c8f317", "f441707f8fad401883c1220b2e360ff4", "23f6fe5d77c647c5b2c546b82b03667b", "82b0e10b205e48a8832bb8e8fbbb8160", "8fa918d042164c879da4bd580192fdad", "393fa623e36f4be992837c4d901fa23e", "b79a434bbbd44b41b0c2c94d794858ca", "39cc1628e42a4ecebe1e7541416a388d", "c896952f04184bd29b9e796fe0bbfa42", "7a9fb712ced44bf5bc48a4d53c60eeb5", "deb24f274ab3445eb1d02106a6d6e9cf", "4d562acc0dcb490992a549f0d3504627", "7d2ec54cf30c495791e3a338b2168dd1", "53b2163f134f4f9ca0fed9fbc431a4ec", "08d8c742014645279744eff2763845bd" ] }, "id": "KV9eGNEG_f0H", "outputId": "ec85b30d-0af9-46f9-fa73-cca305931016" }, "outputs": [ { "name": "stderr", "output_type": "stream", "text": [ "/usr/local/lib/python3.10/dist-packages/huggingface_hub/utils/_token.py:89: UserWarning: \n", "The secret `HF_TOKEN` does not exist in your Colab secrets.\n", "To authenticate with the Hugging Face Hub, create a token in your settings tab (https://huggingface.co/settings/tokens), set it as secret in your Google Colab and restart your session.\n", "You will be able to reuse this secret in all of your notebooks.\n", "Please note that authentication is recommended but still optional to access public models or datasets.\n", " warnings.warn(\n" ] }, { "data": { "application/vnd.jupyter.widget-view+json": { "model_id": "2bed0a97406e46b9bf1c07e66be77dd5", "version_major": 2, "version_minor": 0 }, "text/plain": [ "Downloading builder script: 0%| | 0.00/8.44k [00:00'] = begin_ind\n", " self.char2ind['<|e|>'] = end_ind\n", " self.ind2char = {v: k for k, v in self.char2ind.items()}\n", " self.begin_ind = begin_ind\n", " self.end_ind = end_ind\n", "\n", " def encode(self, x):\n", " # x: str\n", " return [self.char2ind[i] for i in x]\n", "\n", " def decode(self, x):\n", " # x: int or list[x]\n", " if isinstance(x, int):\n", " return self.ind2char[x]\n", " return [self.ind2char[i] for i in x]" ] }, { "cell_type": "code", "execution_count": 24, "metadata": { "id": "KkRi-pkyE5Ko" }, "outputs": [], "source": [ "tokenizer = CharTokenizer(datasets['whole_func_string'])" ] }, { "cell_type": "code", "execution_count": 25, "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "D0Sd5bVpE_EN", "outputId": "decbfd77-e3f7-4f0a-e93e-7188b082b514" }, "outputs": [ { "data": { "text/plain": [ "[71, 72, 73, 3, 73, 11, 91, 12, 29]" ] }, "execution_count": 25, "metadata": {}, "output_type": "execute_result" } ], "source": [ "test_str = 'def f(x):'\n", "re = tokenizer.encode(test_str)\n", "re" ] }, { "cell_type": "code", "execution_count": 27, "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 35 }, "id": "JlZLjjEpFHTP", "outputId": "58a9bcb9-680e-47e6-af5e-de5546642f23" }, "outputs": [ { "data": { "application/vnd.google.colaboratory.intrinsic+json": { "type": "string" }, "text/plain": [ "'def f(x):'" ] }, "execution_count": 27, "metadata": {}, "output_type": "execute_result" } ], "source": [ "''.join(tokenizer.decode(re))" ] }, { "cell_type": "code", "execution_count": 28, "metadata": { "id": "c5uc4QMPFXKx" }, "outputs": [], "source": [ "def autoregressive_trans(text, tokenizer, context_length=10):\n", " # text: str\n", " inputs, labels = [], []\n", " bind = tokenizer.begin_ind\n", " eind = tokenizer.end_ind\n", " enc = tokenizer.encode(text)\n", " # 增加特殊字符\n", " data = [bind] * context_length + enc + [eind]\n", " for i in range(len(data) - context_length):\n", " inputs.append(data[i: i + context_length])\n", " labels.append(data[i + context_length])\n", " return inputs, labels" ] }, { "cell_type": "code", "execution_count": 31, "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "PwulyuENGUWH", "outputId": "29cb4625-9668-40f5-ee25-6dff7e57eea6" }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "<|b|><|b|><|b|> -----> d\n", "<|b|><|b|>d -----> e\n", "<|b|>de -----> f\n", "def -----> \n", "ef -----> f\n", "f f -----> (\n", " f( -----> x\n", "f(x -----> )\n", "(x) -----> :\n", "x): -----> <|e|>\n" ] } ], "source": [ "inputs, labels = autoregressive_trans(test_str, tokenizer, 3)\n", "for a, b in zip(inputs, labels):\n", " print(f'{\"\".join(tokenizer.decode(a))} -----> {tokenizer.decode(b)}')" ] }, { "cell_type": "code", "execution_count": 32, "metadata": { "id": "75zAbCZVGfG2" }, "outputs": [], "source": [ "def process(data, tokenizer):\n", " text = data['whole_func_string']\n", " # text: str\n", " if isinstance(text, str):\n", " inputs, labels = autoregressive_trans(text, tokenizer)\n", " return {'inputs': inputs, 'labels': labels}\n", " # text: list[str]\n", " inputs, labels = [], []\n", " for t in text:\n", " i, l = autoregressive_trans(t, tokenizer)\n", " inputs += i\n", " labels += l\n", " return {'inputs': inputs, 'labels': labels}" ] }, { "cell_type": "code", "execution_count": 33, "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "Yc9kF5c-ITm9", "outputId": "354ab6df-8681-448e-d33a-bf32fd5d8117" }, "outputs": [ { "data": { "text/plain": [ "{'inputs': [[0, 0, 0, 0, 0, 0, 0, 0, 0, 0],\n", " [0, 0, 0, 0, 0, 0, 0, 0, 0, 71],\n", " [0, 0, 0, 0, 0, 0, 0, 0, 71, 72],\n", " [0, 0, 0, 0, 0, 0, 0, 71, 72, 73],\n", " [0, 0, 0, 0, 0, 0, 71, 72, 73, 3],\n", " [0, 0, 0, 0, 0, 71, 72, 73, 3, 87],\n", " [0, 0, 0, 0, 71, 72, 73, 3, 87, 82],\n", " [0, 0, 0, 71, 72, 73, 3, 87, 82, 66],\n", " [0, 0, 71, 72, 73, 3, 87, 82, 66, 68],\n", " [0, 71, 72, 73, 3, 87, 82, 66, 68, 85],\n", " [71, 72, 73, 3, 87, 82, 66, 68, 85, 85],\n", " [72, 73, 3, 87, 82, 66, 68, 85, 85, 82],\n", " [73, 3, 87, 82, 66, 68, 85, 85, 82, 90],\n", " [3, 87, 82, 66, 68, 85, 85, 82, 90, 66],\n", " [87, 82, 66, 68, 85, 85, 82, 90, 66, 86],\n", " [82, 66, 68, 85, 85, 82, 90, 66, 86, 70],\n", " [66, 68, 85, 85, 82, 90, 66, 86, 70, 75],\n", " [68, 85, 85, 82, 90, 66, 86, 70, 75, 72],\n", " [85, 85, 82, 90, 66, 86, 70, 75, 72, 80],\n", " [85, 82, 90, 66, 86, 70, 75, 72, 80, 68],\n", " [82, 90, 66, 86, 70, 75, 72, 80, 68, 11],\n", " [90, 66, 86, 70, 75, 72, 80, 68, 11, 86],\n", " [66, 86, 70, 75, 72, 80, 68, 11, 86, 70],\n", " [86, 70, 75, 72, 80, 68, 11, 86, 70, 75],\n", " [70, 75, 72, 80, 68, 11, 86, 70, 75, 72],\n", " [75, 72, 80, 68, 11, 86, 70, 75, 72, 80],\n", " [72, 80, 68, 11, 86, 70, 75, 72, 80, 68],\n", " [80, 68, 11, 86, 70, 75, 72, 80, 68, 12],\n", " [68, 11, 86, 70, 75, 72, 80, 68, 12, 29],\n", " [11, 86, 70, 75, 72, 80, 68, 12, 29, 2],\n", " [86, 70, 75, 72, 80, 68, 12, 29, 2, 3],\n", " [70, 75, 72, 80, 68, 12, 29, 2, 3, 3],\n", " [75, 72, 80, 68, 12, 29, 2, 3, 3, 3],\n", " [72, 80, 68, 12, 29, 2, 3, 3, 3, 3],\n", " [80, 68, 12, 29, 2, 3, 3, 3, 3, 5],\n", " [68, 12, 29, 2, 3, 3, 3, 3, 5, 5],\n", " [12, 29, 2, 3, 3, 3, 3, 5, 5, 5],\n", " [29, 2, 3, 3, 3, 3, 5, 5, 5, 3],\n", " [2, 3, 3, 3, 3, 5, 5, 5, 3, 38],\n", " [3, 3, 3, 3, 5, 5, 5, 3, 38, 82],\n", " [3, 3, 3, 5, 5, 5, 3, 38, 82, 81],\n", " [3, 3, 5, 5, 5, 3, 38, 82, 81, 89],\n", " [3, 5, 5, 5, 3, 38, 82, 81, 89, 72],\n", " [5, 5, 5, 3, 38, 82, 81, 89, 72, 85],\n", " [5, 5, 3, 38, 82, 81, 89, 72, 85, 87],\n", " [5, 3, 38, 82, 81, 89, 72, 85, 87, 3],\n", " [3, 38, 82, 81, 89, 72, 85, 87, 3, 68],\n", " [38, 82, 81, 89, 72, 85, 87, 3, 68, 3],\n", " [82, 81, 89, 72, 85, 87, 3, 68, 3, 86],\n", " [81, 89, 72, 85, 87, 3, 68, 3, 86, 70],\n", " [89, 72, 85, 87, 3, 68, 3, 86, 70, 75],\n", " [72, 85, 87, 3, 68, 3, 86, 70, 75, 72],\n", " [85, 87, 3, 68, 3, 86, 70, 75, 72, 80],\n", " [87, 3, 68, 3, 86, 70, 75, 72, 80, 68],\n", " [3, 68, 3, 86, 70, 75, 72, 80, 68, 3],\n", " [68, 3, 86, 70, 75, 72, 80, 68, 3, 73],\n", " [3, 86, 70, 75, 72, 80, 68, 3, 73, 85],\n", " [86, 70, 75, 72, 80, 68, 3, 73, 85, 82],\n", " [70, 75, 72, 80, 68, 3, 73, 85, 82, 80],\n", " [75, 72, 80, 68, 3, 73, 85, 82, 80, 3],\n", " [72, 80, 68, 3, 73, 85, 82, 80, 3, 54],\n", " [80, 68, 3, 73, 85, 82, 80, 3, 54, 83],\n", " [68, 3, 73, 85, 82, 80, 3, 54, 83, 68],\n", " [3, 73, 85, 82, 80, 3, 54, 83, 68, 85],\n", " [73, 85, 82, 80, 3, 54, 83, 68, 85, 78],\n", " [85, 82, 80, 3, 54, 83, 68, 85, 78, 3],\n", " [82, 80, 3, 54, 83, 68, 85, 78, 3, 87],\n", " [80, 3, 54, 83, 68, 85, 78, 3, 87, 82],\n", " [3, 54, 83, 68, 85, 78, 3, 87, 82, 3],\n", " [54, 83, 68, 85, 78, 3, 87, 82, 3, 36],\n", " [83, 68, 85, 78, 3, 87, 82, 3, 36, 85],\n", " [68, 85, 78, 3, 87, 82, 3, 36, 85, 85],\n", " [85, 78, 3, 87, 82, 3, 36, 85, 85, 82],\n", " [78, 3, 87, 82, 3, 36, 85, 85, 82, 90],\n", " [3, 87, 82, 3, 36, 85, 85, 82, 90, 2],\n", " [87, 82, 3, 36, 85, 85, 82, 90, 2, 3],\n", " [82, 3, 36, 85, 85, 82, 90, 2, 3, 3],\n", " [3, 36, 85, 85, 82, 90, 2, 3, 3, 3],\n", " [36, 85, 85, 82, 90, 2, 3, 3, 3, 3],\n", " [85, 85, 82, 90, 2, 3, 3, 3, 3, 5],\n", " [85, 82, 90, 2, 3, 3, 3, 3, 5, 5],\n", " [82, 90, 2, 3, 3, 3, 3, 5, 5, 5],\n", " [90, 2, 3, 3, 3, 3, 5, 5, 5, 2],\n", " [2, 3, 3, 3, 3, 5, 5, 5, 2, 3],\n", " [3, 3, 3, 3, 5, 5, 5, 2, 3, 3],\n", " [3, 3, 3, 5, 5, 5, 2, 3, 3, 3],\n", " [3, 3, 5, 5, 5, 2, 3, 3, 3, 3],\n", " [3, 5, 5, 5, 2, 3, 3, 3, 3, 76],\n", " [5, 5, 5, 2, 3, 3, 3, 3, 76, 80],\n", " [5, 5, 2, 3, 3, 3, 3, 76, 80, 83],\n", " [5, 2, 3, 3, 3, 3, 76, 80, 83, 82],\n", " [2, 3, 3, 3, 3, 76, 80, 83, 82, 85],\n", " [3, 3, 3, 3, 76, 80, 83, 82, 85, 87],\n", " [3, 3, 3, 76, 80, 83, 82, 85, 87, 3],\n", " [3, 3, 76, 80, 83, 82, 85, 87, 3, 83],\n", " [3, 76, 80, 83, 82, 85, 87, 3, 83, 92],\n", " [76, 80, 83, 82, 85, 87, 3, 83, 92, 68],\n", " [80, 83, 82, 85, 87, 3, 83, 92, 68, 85],\n", " [83, 82, 85, 87, 3, 83, 92, 68, 85, 85],\n", " [82, 85, 87, 3, 83, 92, 68, 85, 85, 82],\n", " [85, 87, 3, 83, 92, 68, 85, 85, 82, 90],\n", " [87, 3, 83, 92, 68, 85, 85, 82, 90, 3],\n", " [3, 83, 92, 68, 85, 85, 82, 90, 3, 68],\n", " [83, 92, 68, 85, 85, 82, 90, 3, 68, 86],\n", " [92, 68, 85, 85, 82, 90, 3, 68, 86, 3],\n", " [68, 85, 85, 82, 90, 3, 68, 86, 3, 83],\n", " [85, 85, 82, 90, 3, 68, 86, 3, 83, 68],\n", " [85, 82, 90, 3, 68, 86, 3, 83, 68, 2],\n", " [82, 90, 3, 68, 86, 3, 83, 68, 2, 3],\n", " [90, 3, 68, 86, 3, 83, 68, 2, 3, 3],\n", " [3, 68, 86, 3, 83, 68, 2, 3, 3, 3],\n", " [68, 86, 3, 83, 68, 2, 3, 3, 3, 3],\n", " [86, 3, 83, 68, 2, 3, 3, 3, 3, 73],\n", " [3, 83, 68, 2, 3, 3, 3, 3, 73, 76],\n", " [83, 68, 2, 3, 3, 3, 3, 73, 76, 72],\n", " [68, 2, 3, 3, 3, 3, 73, 76, 72, 79],\n", " [2, 3, 3, 3, 3, 73, 76, 72, 79, 71],\n", " [3, 3, 3, 3, 73, 76, 72, 79, 71, 86],\n", " [3, 3, 3, 73, 76, 72, 79, 71, 86, 3],\n", " [3, 3, 73, 76, 72, 79, 71, 86, 3, 32],\n", " [3, 73, 76, 72, 79, 71, 86, 3, 32, 3],\n", " [73, 76, 72, 79, 71, 86, 3, 32, 3, 62],\n", " [76, 72, 79, 71, 86, 3, 32, 3, 62, 83],\n", " [72, 79, 71, 86, 3, 32, 3, 62, 83, 68],\n", " [79, 71, 86, 3, 32, 3, 62, 83, 68, 17],\n", " [71, 86, 3, 32, 3, 62, 83, 68, 17, 73],\n", " [86, 3, 32, 3, 62, 83, 68, 17, 73, 76],\n", " [3, 32, 3, 62, 83, 68, 17, 73, 76, 72],\n", " [32, 3, 62, 83, 68, 17, 73, 76, 72, 79],\n", " [3, 62, 83, 68, 17, 73, 76, 72, 79, 71],\n", " [62, 83, 68, 17, 73, 76, 72, 79, 71, 11],\n", " [83, 68, 17, 73, 76, 72, 79, 71, 11, 73],\n", " [68, 17, 73, 76, 72, 79, 71, 11, 73, 76],\n", " [17, 73, 76, 72, 79, 71, 11, 73, 76, 72],\n", " [73, 76, 72, 79, 71, 11, 73, 76, 72, 79],\n", " [76, 72, 79, 71, 11, 73, 76, 72, 79, 71],\n", " [72, 79, 71, 11, 73, 76, 72, 79, 71, 17],\n", " [79, 71, 11, 73, 76, 72, 79, 71, 17, 81],\n", " [71, 11, 73, 76, 72, 79, 71, 17, 81, 68],\n", " [11, 73, 76, 72, 79, 71, 17, 81, 68, 80],\n", " [73, 76, 72, 79, 71, 17, 81, 68, 80, 72],\n", " [76, 72, 79, 71, 17, 81, 68, 80, 72, 15],\n", " [72, 79, 71, 17, 81, 68, 80, 72, 15, 3],\n", " [79, 71, 17, 81, 68, 80, 72, 15, 3, 87],\n", " [71, 17, 81, 68, 80, 72, 15, 3, 87, 82],\n", " [17, 81, 68, 80, 72, 15, 3, 87, 82, 66],\n", " [81, 68, 80, 72, 15, 3, 87, 82, 66, 68],\n", " [68, 80, 72, 15, 3, 87, 82, 66, 68, 85],\n", " [80, 72, 15, 3, 87, 82, 66, 68, 85, 85],\n", " [72, 15, 3, 87, 82, 66, 68, 85, 85, 82],\n", " [15, 3, 87, 82, 66, 68, 85, 85, 82, 90],\n", " [3, 87, 82, 66, 68, 85, 85, 82, 90, 66],\n", " [87, 82, 66, 68, 85, 85, 82, 90, 66, 87],\n", " [82, 66, 68, 85, 85, 82, 90, 66, 87, 92],\n", " [66, 68, 85, 85, 82, 90, 66, 87, 92, 83],\n", " [68, 85, 85, 82, 90, 66, 87, 92, 83, 72],\n", " [85, 85, 82, 90, 66, 87, 92, 83, 72, 11],\n", " [85, 82, 90, 66, 87, 92, 83, 72, 11, 73],\n", " [82, 90, 66, 87, 92, 83, 72, 11, 73, 76],\n", " [90, 66, 87, 92, 83, 72, 11, 73, 76, 72],\n", " [66, 87, 92, 83, 72, 11, 73, 76, 72, 79],\n", " [87, 92, 83, 72, 11, 73, 76, 72, 79, 71],\n", " [92, 83, 72, 11, 73, 76, 72, 79, 71, 17],\n", " [83, 72, 11, 73, 76, 72, 79, 71, 17, 71],\n", " [72, 11, 73, 76, 72, 79, 71, 17, 71, 68],\n", " [11, 73, 76, 72, 79, 71, 17, 71, 68, 87],\n", " [73, 76, 72, 79, 71, 17, 71, 68, 87, 68],\n", " [76, 72, 79, 71, 17, 71, 68, 87, 68, 55],\n", " [72, 79, 71, 17, 71, 68, 87, 68, 55, 92],\n", " [79, 71, 17, 71, 68, 87, 68, 55, 92, 83],\n", " [71, 17, 71, 68, 87, 68, 55, 92, 83, 72],\n", " [17, 71, 68, 87, 68, 55, 92, 83, 72, 12],\n", " [71, 68, 87, 68, 55, 92, 83, 72, 12, 15],\n", " [68, 87, 68, 55, 92, 83, 72, 12, 15, 3],\n", " [87, 68, 55, 92, 83, 72, 12, 15, 3, 81],\n", " [68, 55, 92, 83, 72, 12, 15, 3, 81, 88],\n", " [55, 92, 83, 72, 12, 15, 3, 81, 88, 79],\n", " [92, 83, 72, 12, 15, 3, 81, 88, 79, 79],\n", " [83, 72, 12, 15, 3, 81, 88, 79, 79, 68],\n", " [72, 12, 15, 3, 81, 88, 79, 79, 68, 69],\n", " [12, 15, 3, 81, 88, 79, 79, 68, 69, 79],\n", " [15, 3, 81, 88, 79, 79, 68, 69, 79, 72],\n", " [3, 81, 88, 79, 79, 68, 69, 79, 72, 32],\n", " [81, 88, 79, 79, 68, 69, 79, 72, 32, 73],\n", " [88, 79, 79, 68, 69, 79, 72, 32, 73, 76],\n", " [79, 79, 68, 69, 79, 72, 32, 73, 76, 72],\n", " [79, 68, 69, 79, 72, 32, 73, 76, 72, 79],\n", " [68, 69, 79, 72, 32, 73, 76, 72, 79, 71],\n", " [69, 79, 72, 32, 73, 76, 72, 79, 71, 17],\n", " [79, 72, 32, 73, 76, 72, 79, 71, 17, 81],\n", " [72, 32, 73, 76, 72, 79, 71, 17, 81, 88],\n", " [32, 73, 76, 72, 79, 71, 17, 81, 88, 79],\n", " [73, 76, 72, 79, 71, 17, 81, 88, 79, 79],\n", " [76, 72, 79, 71, 17, 81, 88, 79, 79, 68],\n", " [72, 79, 71, 17, 81, 88, 79, 79, 68, 69],\n", " [79, 71, 17, 81, 88, 79, 79, 68, 69, 79],\n", " [71, 17, 81, 88, 79, 79, 68, 69, 79, 72],\n", " [17, 81, 88, 79, 79, 68, 69, 79, 72, 12],\n", " [81, 88, 79, 79, 68, 69, 79, 72, 12, 2],\n", " [88, 79, 79, 68, 69, 79, 72, 12, 2, 3],\n", " [79, 79, 68, 69, 79, 72, 12, 2, 3, 3],\n", " [79, 68, 69, 79, 72, 12, 2, 3, 3, 3],\n", " [68, 69, 79, 72, 12, 2, 3, 3, 3, 3],\n", " [69, 79, 72, 12, 2, 3, 3, 3, 3, 3],\n", " [79, 72, 12, 2, 3, 3, 3, 3, 3, 3],\n", " [72, 12, 2, 3, 3, 3, 3, 3, 3, 3],\n", " [12, 2, 3, 3, 3, 3, 3, 3, 3, 3],\n", " [2, 3, 3, 3, 3, 3, 3, 3, 3, 3],\n", " [3, 3, 3, 3, 3, 3, 3, 3, 3, 3],\n", " [3, 3, 3, 3, 3, 3, 3, 3, 3, 3],\n", " [3, 3, 3, 3, 3, 3, 3, 3, 3, 3],\n", " [3, 3, 3, 3, 3, 3, 3, 3, 3, 3],\n", " [3, 3, 3, 3, 3, 3, 3, 3, 3, 3],\n", " [3, 3, 3, 3, 3, 3, 3, 3, 3, 73],\n", " [3, 3, 3, 3, 3, 3, 3, 3, 73, 82],\n", " [3, 3, 3, 3, 3, 3, 3, 73, 82, 85],\n", " [3, 3, 3, 3, 3, 3, 73, 82, 85, 3],\n", " [3, 3, 3, 3, 3, 73, 82, 85, 3, 73],\n", " [3, 3, 3, 3, 73, 82, 85, 3, 73, 76],\n", " [3, 3, 3, 73, 82, 85, 3, 73, 76, 72],\n", " [3, 3, 73, 82, 85, 3, 73, 76, 72, 79],\n", " [3, 73, 82, 85, 3, 73, 76, 72, 79, 71],\n", " [73, 82, 85, 3, 73, 76, 72, 79, 71, 3],\n", " [82, 85, 3, 73, 76, 72, 79, 71, 3, 76],\n", " [85, 3, 73, 76, 72, 79, 71, 3, 76, 81],\n", " [3, 73, 76, 72, 79, 71, 3, 76, 81, 3],\n", " [73, 76, 72, 79, 71, 3, 76, 81, 3, 86],\n", " [76, 72, 79, 71, 3, 76, 81, 3, 86, 70],\n", " [72, 79, 71, 3, 76, 81, 3, 86, 70, 75],\n", " [79, 71, 3, 76, 81, 3, 86, 70, 75, 72],\n", " [71, 3, 76, 81, 3, 86, 70, 75, 72, 80],\n", " [3, 76, 81, 3, 86, 70, 75, 72, 80, 68],\n", " [76, 81, 3, 86, 70, 75, 72, 80, 68, 64],\n", " [81, 3, 86, 70, 75, 72, 80, 68, 64, 2],\n", " [3, 86, 70, 75, 72, 80, 68, 64, 2, 3],\n", " [86, 70, 75, 72, 80, 68, 64, 2, 3, 3],\n", " [70, 75, 72, 80, 68, 64, 2, 3, 3, 3],\n", " [75, 72, 80, 68, 64, 2, 3, 3, 3, 3],\n", " [72, 80, 68, 64, 2, 3, 3, 3, 3, 85],\n", " [80, 68, 64, 2, 3, 3, 3, 3, 85, 72],\n", " [68, 64, 2, 3, 3, 3, 3, 85, 72, 87],\n", " [64, 2, 3, 3, 3, 3, 85, 72, 87, 88],\n", " [2, 3, 3, 3, 3, 85, 72, 87, 88, 85],\n", " [3, 3, 3, 3, 85, 72, 87, 88, 85, 81],\n", " [3, 3, 3, 85, 72, 87, 88, 85, 81, 3],\n", " [3, 3, 85, 72, 87, 88, 85, 81, 3, 83],\n", " [3, 85, 72, 87, 88, 85, 81, 3, 83, 68],\n", " [85, 72, 87, 88, 85, 81, 3, 83, 68, 17],\n", " [72, 87, 88, 85, 81, 3, 83, 68, 17, 86],\n", " [87, 88, 85, 81, 3, 83, 68, 17, 86, 70],\n", " [88, 85, 81, 3, 83, 68, 17, 86, 70, 75],\n", " [85, 81, 3, 83, 68, 17, 86, 70, 75, 72],\n", " [81, 3, 83, 68, 17, 86, 70, 75, 72, 80],\n", " [3, 83, 68, 17, 86, 70, 75, 72, 80, 68],\n", " [83, 68, 17, 86, 70, 75, 72, 80, 68, 11],\n", " [68, 17, 86, 70, 75, 72, 80, 68, 11, 73],\n", " [17, 86, 70, 75, 72, 80, 68, 11, 73, 76],\n", " [86, 70, 75, 72, 80, 68, 11, 73, 76, 72],\n", " [70, 75, 72, 80, 68, 11, 73, 76, 72, 79],\n", " [75, 72, 80, 68, 11, 73, 76, 72, 79, 71],\n", " [72, 80, 68, 11, 73, 76, 72, 79, 71, 86],\n", " [80, 68, 11, 73, 76, 72, 79, 71, 86, 12]],\n", " 'labels': [71,\n", " 72,\n", " 73,\n", " 3,\n", " 87,\n", " 82,\n", " 66,\n", " 68,\n", " 85,\n", " 85,\n", " 82,\n", " 90,\n", " 66,\n", " 86,\n", " 70,\n", " 75,\n", " 72,\n", " 80,\n", " 68,\n", " 11,\n", " 86,\n", " 70,\n", " 75,\n", " 72,\n", " 80,\n", " 68,\n", " 12,\n", " 29,\n", " 2,\n", " 3,\n", " 3,\n", " 3,\n", " 3,\n", " 5,\n", " 5,\n", " 5,\n", " 3,\n", " 38,\n", " 82,\n", " 81,\n", " 89,\n", " 72,\n", " 85,\n", " 87,\n", " 3,\n", " 68,\n", " 3,\n", " 86,\n", " 70,\n", " 75,\n", " 72,\n", " 80,\n", " 68,\n", " 3,\n", " 73,\n", " 85,\n", " 82,\n", " 80,\n", " 3,\n", " 54,\n", " 83,\n", " 68,\n", " 85,\n", " 78,\n", " 3,\n", " 87,\n", " 82,\n", " 3,\n", " 36,\n", " 85,\n", " 85,\n", " 82,\n", " 90,\n", " 2,\n", " 3,\n", " 3,\n", " 3,\n", " 3,\n", " 5,\n", " 5,\n", " 5,\n", " 2,\n", " 3,\n", " 3,\n", " 3,\n", " 3,\n", " 76,\n", " 80,\n", " 83,\n", " 82,\n", " 85,\n", " 87,\n", " 3,\n", " 83,\n", " 92,\n", " 68,\n", " 85,\n", " 85,\n", " 82,\n", " 90,\n", " 3,\n", " 68,\n", " 86,\n", " 3,\n", " 83,\n", " 68,\n", " 2,\n", " 3,\n", " 3,\n", " 3,\n", " 3,\n", " 73,\n", " 76,\n", " 72,\n", " 79,\n", " 71,\n", " 86,\n", " 3,\n", " 32,\n", " 3,\n", " 62,\n", " 83,\n", " 68,\n", " 17,\n", " 73,\n", " 76,\n", " 72,\n", " 79,\n", " 71,\n", " 11,\n", " 73,\n", " 76,\n", " 72,\n", " 79,\n", " 71,\n", " 17,\n", " 81,\n", " 68,\n", " 80,\n", " 72,\n", " 15,\n", " 3,\n", " 87,\n", " 82,\n", " 66,\n", " 68,\n", " 85,\n", " 85,\n", " 82,\n", " 90,\n", " 66,\n", " 87,\n", " 92,\n", " 83,\n", " 72,\n", " 11,\n", " 73,\n", " 76,\n", " 72,\n", " 79,\n", " 71,\n", " 17,\n", " 71,\n", " 68,\n", " 87,\n", " 68,\n", " 55,\n", " 92,\n", " 83,\n", " 72,\n", " 12,\n", " 15,\n", " 3,\n", " 81,\n", " 88,\n", " 79,\n", " 79,\n", " 68,\n", " 69,\n", " 79,\n", " 72,\n", " 32,\n", " 73,\n", " 76,\n", " 72,\n", " 79,\n", " 71,\n", " 17,\n", " 81,\n", " 88,\n", " 79,\n", " 79,\n", " 68,\n", " 69,\n", " 79,\n", " 72,\n", " 12,\n", " 2,\n", " 3,\n", " 3,\n", " 3,\n", " 3,\n", " 3,\n", " 3,\n", " 3,\n", " 3,\n", " 3,\n", " 3,\n", " 3,\n", " 3,\n", " 3,\n", " 3,\n", " 73,\n", " 82,\n", " 85,\n", " 3,\n", " 73,\n", " 76,\n", " 72,\n", " 79,\n", " 71,\n", " 3,\n", " 76,\n", " 81,\n", " 3,\n", " 86,\n", " 70,\n", " 75,\n", " 72,\n", " 80,\n", " 68,\n", " 64,\n", " 2,\n", " 3,\n", " 3,\n", " 3,\n", " 3,\n", " 85,\n", " 72,\n", " 87,\n", " 88,\n", " 85,\n", " 81,\n", " 3,\n", " 83,\n", " 68,\n", " 17,\n", " 86,\n", " 70,\n", " 75,\n", " 72,\n", " 80,\n", " 68,\n", " 11,\n", " 73,\n", " 76,\n", " 72,\n", " 79,\n", " 71,\n", " 86,\n", " 12,\n", " 1]}" ] }, "execution_count": 33, "metadata": {}, "output_type": "execute_result" } ], "source": [ "process(datasets[8], tokenizer)" ] }, { "cell_type": "code", "execution_count": 34, "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "oZ_T1eCWIW8u", "outputId": "f013cf74-0655-44e6-b11d-db2d7e04cedc" }, "outputs": [ { "data": { "text/plain": [ "{'inputs': [[0, 0, 0, 0, 0, 0, 0, 0, 0, 0],\n", " [0, 0, 0, 0, 0, 0, 0, 0, 0, 71],\n", " [0, 0, 0, 0, 0, 0, 0, 0, 71, 72],\n", " [0, 0, 0, 0, 0, 0, 0, 71, 72, 73],\n", " [0, 0, 0, 0, 0, 0, 71, 72, 73, 3],\n", " [0, 0, 0, 0, 0, 71, 72, 73, 3, 87],\n", " [0, 0, 0, 0, 71, 72, 73, 3, 87, 82],\n", " [0, 0, 0, 71, 72, 73, 3, 87, 82, 66],\n", " [0, 0, 71, 72, 73, 3, 87, 82, 66, 68],\n", " [0, 71, 72, 73, 3, 87, 82, 66, 68, 85],\n", " [71, 72, 73, 3, 87, 82, 66, 68, 85, 85],\n", " [72, 73, 3, 87, 82, 66, 68, 85, 85, 82],\n", " [73, 3, 87, 82, 66, 68, 85, 85, 82, 90],\n", " [3, 87, 82, 66, 68, 85, 85, 82, 90, 66],\n", " [87, 82, 66, 68, 85, 85, 82, 90, 66, 86],\n", " [82, 66, 68, 85, 85, 82, 90, 66, 86, 70],\n", " [66, 68, 85, 85, 82, 90, 66, 86, 70, 75],\n", " [68, 85, 85, 82, 90, 66, 86, 70, 75, 72],\n", " [85, 85, 82, 90, 66, 86, 70, 75, 72, 80],\n", " [85, 82, 90, 66, 86, 70, 75, 72, 80, 68],\n", " [82, 90, 66, 86, 70, 75, 72, 80, 68, 11],\n", " [90, 66, 86, 70, 75, 72, 80, 68, 11, 86],\n", " [66, 86, 70, 75, 72, 80, 68, 11, 86, 70],\n", " [86, 70, 75, 72, 80, 68, 11, 86, 70, 75],\n", " [70, 75, 72, 80, 68, 11, 86, 70, 75, 72],\n", " [75, 72, 80, 68, 11, 86, 70, 75, 72, 80],\n", " [72, 80, 68, 11, 86, 70, 75, 72, 80, 68],\n", " [80, 68, 11, 86, 70, 75, 72, 80, 68, 12],\n", " [68, 11, 86, 70, 75, 72, 80, 68, 12, 29],\n", " [11, 86, 70, 75, 72, 80, 68, 12, 29, 2],\n", " [86, 70, 75, 72, 80, 68, 12, 29, 2, 3],\n", " [70, 75, 72, 80, 68, 12, 29, 2, 3, 3],\n", " [75, 72, 80, 68, 12, 29, 2, 3, 3, 3],\n", " [72, 80, 68, 12, 29, 2, 3, 3, 3, 3],\n", " [80, 68, 12, 29, 2, 3, 3, 3, 3, 5],\n", " [68, 12, 29, 2, 3, 3, 3, 3, 5, 5],\n", " [12, 29, 2, 3, 3, 3, 3, 5, 5, 5],\n", " [29, 2, 3, 3, 3, 3, 5, 5, 5, 3],\n", " [2, 3, 3, 3, 3, 5, 5, 5, 3, 38],\n", " [3, 3, 3, 3, 5, 5, 5, 3, 38, 82],\n", " [3, 3, 3, 5, 5, 5, 3, 38, 82, 81],\n", " [3, 3, 5, 5, 5, 3, 38, 82, 81, 89],\n", " [3, 5, 5, 5, 3, 38, 82, 81, 89, 72],\n", " [5, 5, 5, 3, 38, 82, 81, 89, 72, 85],\n", " [5, 5, 3, 38, 82, 81, 89, 72, 85, 87],\n", " [5, 3, 38, 82, 81, 89, 72, 85, 87, 3],\n", " [3, 38, 82, 81, 89, 72, 85, 87, 3, 68],\n", " [38, 82, 81, 89, 72, 85, 87, 3, 68, 3],\n", " [82, 81, 89, 72, 85, 87, 3, 68, 3, 86],\n", " [81, 89, 72, 85, 87, 3, 68, 3, 86, 70],\n", " [89, 72, 85, 87, 3, 68, 3, 86, 70, 75],\n", " [72, 85, 87, 3, 68, 3, 86, 70, 75, 72],\n", " [85, 87, 3, 68, 3, 86, 70, 75, 72, 80],\n", " [87, 3, 68, 3, 86, 70, 75, 72, 80, 68],\n", " [3, 68, 3, 86, 70, 75, 72, 80, 68, 3],\n", " [68, 3, 86, 70, 75, 72, 80, 68, 3, 73],\n", " [3, 86, 70, 75, 72, 80, 68, 3, 73, 85],\n", " [86, 70, 75, 72, 80, 68, 3, 73, 85, 82],\n", " [70, 75, 72, 80, 68, 3, 73, 85, 82, 80],\n", " [75, 72, 80, 68, 3, 73, 85, 82, 80, 3],\n", " [72, 80, 68, 3, 73, 85, 82, 80, 3, 54],\n", " [80, 68, 3, 73, 85, 82, 80, 3, 54, 83],\n", " [68, 3, 73, 85, 82, 80, 3, 54, 83, 68],\n", " [3, 73, 85, 82, 80, 3, 54, 83, 68, 85],\n", " [73, 85, 82, 80, 3, 54, 83, 68, 85, 78],\n", " [85, 82, 80, 3, 54, 83, 68, 85, 78, 3],\n", " [82, 80, 3, 54, 83, 68, 85, 78, 3, 87],\n", " [80, 3, 54, 83, 68, 85, 78, 3, 87, 82],\n", " [3, 54, 83, 68, 85, 78, 3, 87, 82, 3],\n", " [54, 83, 68, 85, 78, 3, 87, 82, 3, 36],\n", " [83, 68, 85, 78, 3, 87, 82, 3, 36, 85],\n", " [68, 85, 78, 3, 87, 82, 3, 36, 85, 85],\n", " [85, 78, 3, 87, 82, 3, 36, 85, 85, 82],\n", " [78, 3, 87, 82, 3, 36, 85, 85, 82, 90],\n", " [3, 87, 82, 3, 36, 85, 85, 82, 90, 2],\n", " [87, 82, 3, 36, 85, 85, 82, 90, 2, 3],\n", " [82, 3, 36, 85, 85, 82, 90, 2, 3, 3],\n", " [3, 36, 85, 85, 82, 90, 2, 3, 3, 3],\n", " [36, 85, 85, 82, 90, 2, 3, 3, 3, 3],\n", " [85, 85, 82, 90, 2, 3, 3, 3, 3, 5],\n", " [85, 82, 90, 2, 3, 3, 3, 3, 5, 5],\n", " [82, 90, 2, 3, 3, 3, 3, 5, 5, 5],\n", " [90, 2, 3, 3, 3, 3, 5, 5, 5, 2],\n", " [2, 3, 3, 3, 3, 5, 5, 5, 2, 3],\n", " [3, 3, 3, 3, 5, 5, 5, 2, 3, 3],\n", " [3, 3, 3, 5, 5, 5, 2, 3, 3, 3],\n", " [3, 3, 5, 5, 5, 2, 3, 3, 3, 3],\n", " [3, 5, 5, 5, 2, 3, 3, 3, 3, 76],\n", " [5, 5, 5, 2, 3, 3, 3, 3, 76, 80],\n", " [5, 5, 2, 3, 3, 3, 3, 76, 80, 83],\n", " [5, 2, 3, 3, 3, 3, 76, 80, 83, 82],\n", " [2, 3, 3, 3, 3, 76, 80, 83, 82, 85],\n", " [3, 3, 3, 3, 76, 80, 83, 82, 85, 87],\n", " [3, 3, 3, 76, 80, 83, 82, 85, 87, 3],\n", " [3, 3, 76, 80, 83, 82, 85, 87, 3, 83],\n", " [3, 76, 80, 83, 82, 85, 87, 3, 83, 92],\n", " [76, 80, 83, 82, 85, 87, 3, 83, 92, 68],\n", " [80, 83, 82, 85, 87, 3, 83, 92, 68, 85],\n", " [83, 82, 85, 87, 3, 83, 92, 68, 85, 85],\n", " [82, 85, 87, 3, 83, 92, 68, 85, 85, 82],\n", " [85, 87, 3, 83, 92, 68, 85, 85, 82, 90],\n", " [87, 3, 83, 92, 68, 85, 85, 82, 90, 3],\n", " [3, 83, 92, 68, 85, 85, 82, 90, 3, 68],\n", " [83, 92, 68, 85, 85, 82, 90, 3, 68, 86],\n", " [92, 68, 85, 85, 82, 90, 3, 68, 86, 3],\n", " [68, 85, 85, 82, 90, 3, 68, 86, 3, 83],\n", " [85, 85, 82, 90, 3, 68, 86, 3, 83, 68],\n", " [85, 82, 90, 3, 68, 86, 3, 83, 68, 2],\n", " [82, 90, 3, 68, 86, 3, 83, 68, 2, 3],\n", " [90, 3, 68, 86, 3, 83, 68, 2, 3, 3],\n", " [3, 68, 86, 3, 83, 68, 2, 3, 3, 3],\n", " [68, 86, 3, 83, 68, 2, 3, 3, 3, 3],\n", " [86, 3, 83, 68, 2, 3, 3, 3, 3, 73],\n", " [3, 83, 68, 2, 3, 3, 3, 3, 73, 76],\n", " [83, 68, 2, 3, 3, 3, 3, 73, 76, 72],\n", " [68, 2, 3, 3, 3, 3, 73, 76, 72, 79],\n", " [2, 3, 3, 3, 3, 73, 76, 72, 79, 71],\n", " [3, 3, 3, 3, 73, 76, 72, 79, 71, 86],\n", " [3, 3, 3, 73, 76, 72, 79, 71, 86, 3],\n", " [3, 3, 73, 76, 72, 79, 71, 86, 3, 32],\n", " [3, 73, 76, 72, 79, 71, 86, 3, 32, 3],\n", " [73, 76, 72, 79, 71, 86, 3, 32, 3, 62],\n", " [76, 72, 79, 71, 86, 3, 32, 3, 62, 83],\n", " [72, 79, 71, 86, 3, 32, 3, 62, 83, 68],\n", " [79, 71, 86, 3, 32, 3, 62, 83, 68, 17],\n", " [71, 86, 3, 32, 3, 62, 83, 68, 17, 73],\n", " [86, 3, 32, 3, 62, 83, 68, 17, 73, 76],\n", " [3, 32, 3, 62, 83, 68, 17, 73, 76, 72],\n", " [32, 3, 62, 83, 68, 17, 73, 76, 72, 79],\n", " [3, 62, 83, 68, 17, 73, 76, 72, 79, 71],\n", " [62, 83, 68, 17, 73, 76, 72, 79, 71, 11],\n", " [83, 68, 17, 73, 76, 72, 79, 71, 11, 73],\n", " [68, 17, 73, 76, 72, 79, 71, 11, 73, 76],\n", " [17, 73, 76, 72, 79, 71, 11, 73, 76, 72],\n", " [73, 76, 72, 79, 71, 11, 73, 76, 72, 79],\n", " [76, 72, 79, 71, 11, 73, 76, 72, 79, 71],\n", " [72, 79, 71, 11, 73, 76, 72, 79, 71, 17],\n", " [79, 71, 11, 73, 76, 72, 79, 71, 17, 81],\n", " [71, 11, 73, 76, 72, 79, 71, 17, 81, 68],\n", " [11, 73, 76, 72, 79, 71, 17, 81, 68, 80],\n", " [73, 76, 72, 79, 71, 17, 81, 68, 80, 72],\n", " [76, 72, 79, 71, 17, 81, 68, 80, 72, 15],\n", " [72, 79, 71, 17, 81, 68, 80, 72, 15, 3],\n", " [79, 71, 17, 81, 68, 80, 72, 15, 3, 87],\n", " [71, 17, 81, 68, 80, 72, 15, 3, 87, 82],\n", " [17, 81, 68, 80, 72, 15, 3, 87, 82, 66],\n", " [81, 68, 80, 72, 15, 3, 87, 82, 66, 68],\n", " [68, 80, 72, 15, 3, 87, 82, 66, 68, 85],\n", " [80, 72, 15, 3, 87, 82, 66, 68, 85, 85],\n", " [72, 15, 3, 87, 82, 66, 68, 85, 85, 82],\n", " [15, 3, 87, 82, 66, 68, 85, 85, 82, 90],\n", " [3, 87, 82, 66, 68, 85, 85, 82, 90, 66],\n", " [87, 82, 66, 68, 85, 85, 82, 90, 66, 87],\n", " [82, 66, 68, 85, 85, 82, 90, 66, 87, 92],\n", " [66, 68, 85, 85, 82, 90, 66, 87, 92, 83],\n", " [68, 85, 85, 82, 90, 66, 87, 92, 83, 72],\n", " [85, 85, 82, 90, 66, 87, 92, 83, 72, 11],\n", " [85, 82, 90, 66, 87, 92, 83, 72, 11, 73],\n", " [82, 90, 66, 87, 92, 83, 72, 11, 73, 76],\n", " [90, 66, 87, 92, 83, 72, 11, 73, 76, 72],\n", " [66, 87, 92, 83, 72, 11, 73, 76, 72, 79],\n", " [87, 92, 83, 72, 11, 73, 76, 72, 79, 71],\n", " [92, 83, 72, 11, 73, 76, 72, 79, 71, 17],\n", " [83, 72, 11, 73, 76, 72, 79, 71, 17, 71],\n", " [72, 11, 73, 76, 72, 79, 71, 17, 71, 68],\n", " [11, 73, 76, 72, 79, 71, 17, 71, 68, 87],\n", " [73, 76, 72, 79, 71, 17, 71, 68, 87, 68],\n", " [76, 72, 79, 71, 17, 71, 68, 87, 68, 55],\n", " [72, 79, 71, 17, 71, 68, 87, 68, 55, 92],\n", " [79, 71, 17, 71, 68, 87, 68, 55, 92, 83],\n", " [71, 17, 71, 68, 87, 68, 55, 92, 83, 72],\n", " [17, 71, 68, 87, 68, 55, 92, 83, 72, 12],\n", " [71, 68, 87, 68, 55, 92, 83, 72, 12, 15],\n", " [68, 87, 68, 55, 92, 83, 72, 12, 15, 3],\n", " [87, 68, 55, 92, 83, 72, 12, 15, 3, 81],\n", " [68, 55, 92, 83, 72, 12, 15, 3, 81, 88],\n", " [55, 92, 83, 72, 12, 15, 3, 81, 88, 79],\n", " [92, 83, 72, 12, 15, 3, 81, 88, 79, 79],\n", " [83, 72, 12, 15, 3, 81, 88, 79, 79, 68],\n", " [72, 12, 15, 3, 81, 88, 79, 79, 68, 69],\n", " [12, 15, 3, 81, 88, 79, 79, 68, 69, 79],\n", " [15, 3, 81, 88, 79, 79, 68, 69, 79, 72],\n", " [3, 81, 88, 79, 79, 68, 69, 79, 72, 32],\n", " [81, 88, 79, 79, 68, 69, 79, 72, 32, 73],\n", " [88, 79, 79, 68, 69, 79, 72, 32, 73, 76],\n", " [79, 79, 68, 69, 79, 72, 32, 73, 76, 72],\n", " [79, 68, 69, 79, 72, 32, 73, 76, 72, 79],\n", " [68, 69, 79, 72, 32, 73, 76, 72, 79, 71],\n", " [69, 79, 72, 32, 73, 76, 72, 79, 71, 17],\n", " [79, 72, 32, 73, 76, 72, 79, 71, 17, 81],\n", " [72, 32, 73, 76, 72, 79, 71, 17, 81, 88],\n", " [32, 73, 76, 72, 79, 71, 17, 81, 88, 79],\n", " [73, 76, 72, 79, 71, 17, 81, 88, 79, 79],\n", " [76, 72, 79, 71, 17, 81, 88, 79, 79, 68],\n", " [72, 79, 71, 17, 81, 88, 79, 79, 68, 69],\n", " [79, 71, 17, 81, 88, 79, 79, 68, 69, 79],\n", " [71, 17, 81, 88, 79, 79, 68, 69, 79, 72],\n", " [17, 81, 88, 79, 79, 68, 69, 79, 72, 12],\n", " [81, 88, 79, 79, 68, 69, 79, 72, 12, 2],\n", " [88, 79, 79, 68, 69, 79, 72, 12, 2, 3],\n", " [79, 79, 68, 69, 79, 72, 12, 2, 3, 3],\n", " [79, 68, 69, 79, 72, 12, 2, 3, 3, 3],\n", " [68, 69, 79, 72, 12, 2, 3, 3, 3, 3],\n", " [69, 79, 72, 12, 2, 3, 3, 3, 3, 3],\n", " [79, 72, 12, 2, 3, 3, 3, 3, 3, 3],\n", " [72, 12, 2, 3, 3, 3, 3, 3, 3, 3],\n", " [12, 2, 3, 3, 3, 3, 3, 3, 3, 3],\n", " [2, 3, 3, 3, 3, 3, 3, 3, 3, 3],\n", " [3, 3, 3, 3, 3, 3, 3, 3, 3, 3],\n", " [3, 3, 3, 3, 3, 3, 3, 3, 3, 3],\n", " [3, 3, 3, 3, 3, 3, 3, 3, 3, 3],\n", " [3, 3, 3, 3, 3, 3, 3, 3, 3, 3],\n", " [3, 3, 3, 3, 3, 3, 3, 3, 3, 3],\n", " [3, 3, 3, 3, 3, 3, 3, 3, 3, 73],\n", " [3, 3, 3, 3, 3, 3, 3, 3, 73, 82],\n", " [3, 3, 3, 3, 3, 3, 3, 73, 82, 85],\n", " [3, 3, 3, 3, 3, 3, 73, 82, 85, 3],\n", " [3, 3, 3, 3, 3, 73, 82, 85, 3, 73],\n", " [3, 3, 3, 3, 73, 82, 85, 3, 73, 76],\n", " [3, 3, 3, 73, 82, 85, 3, 73, 76, 72],\n", " [3, 3, 73, 82, 85, 3, 73, 76, 72, 79],\n", " [3, 73, 82, 85, 3, 73, 76, 72, 79, 71],\n", " [73, 82, 85, 3, 73, 76, 72, 79, 71, 3],\n", " [82, 85, 3, 73, 76, 72, 79, 71, 3, 76],\n", " [85, 3, 73, 76, 72, 79, 71, 3, 76, 81],\n", " [3, 73, 76, 72, 79, 71, 3, 76, 81, 3],\n", " [73, 76, 72, 79, 71, 3, 76, 81, 3, 86],\n", " [76, 72, 79, 71, 3, 76, 81, 3, 86, 70],\n", " [72, 79, 71, 3, 76, 81, 3, 86, 70, 75],\n", " [79, 71, 3, 76, 81, 3, 86, 70, 75, 72],\n", " [71, 3, 76, 81, 3, 86, 70, 75, 72, 80],\n", " [3, 76, 81, 3, 86, 70, 75, 72, 80, 68],\n", " [76, 81, 3, 86, 70, 75, 72, 80, 68, 64],\n", " [81, 3, 86, 70, 75, 72, 80, 68, 64, 2],\n", " [3, 86, 70, 75, 72, 80, 68, 64, 2, 3],\n", " [86, 70, 75, 72, 80, 68, 64, 2, 3, 3],\n", " [70, 75, 72, 80, 68, 64, 2, 3, 3, 3],\n", " [75, 72, 80, 68, 64, 2, 3, 3, 3, 3],\n", " [72, 80, 68, 64, 2, 3, 3, 3, 3, 85],\n", " [80, 68, 64, 2, 3, 3, 3, 3, 85, 72],\n", " [68, 64, 2, 3, 3, 3, 3, 85, 72, 87],\n", " [64, 2, 3, 3, 3, 3, 85, 72, 87, 88],\n", " [2, 3, 3, 3, 3, 85, 72, 87, 88, 85],\n", " [3, 3, 3, 3, 85, 72, 87, 88, 85, 81],\n", " [3, 3, 3, 85, 72, 87, 88, 85, 81, 3],\n", " [3, 3, 85, 72, 87, 88, 85, 81, 3, 83],\n", " [3, 85, 72, 87, 88, 85, 81, 3, 83, 68],\n", " [85, 72, 87, 88, 85, 81, 3, 83, 68, 17],\n", " [72, 87, 88, 85, 81, 3, 83, 68, 17, 86],\n", " [87, 88, 85, 81, 3, 83, 68, 17, 86, 70],\n", " [88, 85, 81, 3, 83, 68, 17, 86, 70, 75],\n", " [85, 81, 3, 83, 68, 17, 86, 70, 75, 72],\n", " [81, 3, 83, 68, 17, 86, 70, 75, 72, 80],\n", " [3, 83, 68, 17, 86, 70, 75, 72, 80, 68],\n", " [83, 68, 17, 86, 70, 75, 72, 80, 68, 11],\n", " [68, 17, 86, 70, 75, 72, 80, 68, 11, 73],\n", " [17, 86, 70, 75, 72, 80, 68, 11, 73, 76],\n", " [86, 70, 75, 72, 80, 68, 11, 73, 76, 72],\n", " [70, 75, 72, 80, 68, 11, 73, 76, 72, 79],\n", " [75, 72, 80, 68, 11, 73, 76, 72, 79, 71],\n", " [72, 80, 68, 11, 73, 76, 72, 79, 71, 86],\n", " [80, 68, 11, 73, 76, 72, 79, 71, 86, 12]],\n", " 'labels': [71,\n", " 72,\n", " 73,\n", " 3,\n", " 87,\n", " 82,\n", " 66,\n", " 68,\n", " 85,\n", " 85,\n", " 82,\n", " 90,\n", " 66,\n", " 86,\n", " 70,\n", " 75,\n", " 72,\n", " 80,\n", " 68,\n", " 11,\n", " 86,\n", " 70,\n", " 75,\n", " 72,\n", " 80,\n", " 68,\n", " 12,\n", " 29,\n", " 2,\n", " 3,\n", " 3,\n", " 3,\n", " 3,\n", " 5,\n", " 5,\n", " 5,\n", " 3,\n", " 38,\n", " 82,\n", " 81,\n", " 89,\n", " 72,\n", " 85,\n", " 87,\n", " 3,\n", " 68,\n", " 3,\n", " 86,\n", " 70,\n", " 75,\n", " 72,\n", " 80,\n", " 68,\n", " 3,\n", " 73,\n", " 85,\n", " 82,\n", " 80,\n", " 3,\n", " 54,\n", " 83,\n", " 68,\n", " 85,\n", " 78,\n", " 3,\n", " 87,\n", " 82,\n", " 3,\n", " 36,\n", " 85,\n", " 85,\n", " 82,\n", " 90,\n", " 2,\n", " 3,\n", " 3,\n", " 3,\n", " 3,\n", " 5,\n", " 5,\n", " 5,\n", " 2,\n", " 3,\n", " 3,\n", " 3,\n", " 3,\n", " 76,\n", " 80,\n", " 83,\n", " 82,\n", " 85,\n", " 87,\n", " 3,\n", " 83,\n", " 92,\n", " 68,\n", " 85,\n", " 85,\n", " 82,\n", " 90,\n", " 3,\n", " 68,\n", " 86,\n", " 3,\n", " 83,\n", " 68,\n", " 2,\n", " 3,\n", " 3,\n", " 3,\n", " 3,\n", " 73,\n", " 76,\n", " 72,\n", " 79,\n", " 71,\n", " 86,\n", " 3,\n", " 32,\n", " 3,\n", " 62,\n", " 83,\n", " 68,\n", " 17,\n", " 73,\n", " 76,\n", " 72,\n", " 79,\n", " 71,\n", " 11,\n", " 73,\n", " 76,\n", " 72,\n", " 79,\n", " 71,\n", " 17,\n", " 81,\n", " 68,\n", " 80,\n", " 72,\n", " 15,\n", " 3,\n", " 87,\n", " 82,\n", " 66,\n", " 68,\n", " 85,\n", " 85,\n", " 82,\n", " 90,\n", " 66,\n", " 87,\n", " 92,\n", " 83,\n", " 72,\n", " 11,\n", " 73,\n", " 76,\n", " 72,\n", " 79,\n", " 71,\n", " 17,\n", " 71,\n", " 68,\n", " 87,\n", " 68,\n", " 55,\n", " 92,\n", " 83,\n", " 72,\n", " 12,\n", " 15,\n", " 3,\n", " 81,\n", " 88,\n", " 79,\n", " 79,\n", " 68,\n", " 69,\n", " 79,\n", " 72,\n", " 32,\n", " 73,\n", " 76,\n", " 72,\n", " 79,\n", " 71,\n", " 17,\n", " 81,\n", " 88,\n", " 79,\n", " 79,\n", " 68,\n", " 69,\n", " 79,\n", " 72,\n", " 12,\n", " 2,\n", " 3,\n", " 3,\n", " 3,\n", " 3,\n", " 3,\n", " 3,\n", " 3,\n", " 3,\n", " 3,\n", " 3,\n", " 3,\n", " 3,\n", " 3,\n", " 3,\n", " 73,\n", " 82,\n", " 85,\n", " 3,\n", " 73,\n", " 76,\n", " 72,\n", " 79,\n", " 71,\n", " 3,\n", " 76,\n", " 81,\n", " 3,\n", " 86,\n", " 70,\n", " 75,\n", " 72,\n", " 80,\n", " 68,\n", " 64,\n", " 2,\n", " 3,\n", " 3,\n", " 3,\n", " 3,\n", " 85,\n", " 72,\n", " 87,\n", " 88,\n", " 85,\n", " 81,\n", " 3,\n", " 83,\n", " 68,\n", " 17,\n", " 86,\n", " 70,\n", " 75,\n", " 72,\n", " 80,\n", " 68,\n", " 11,\n", " 73,\n", " 76,\n", " 72,\n", " 79,\n", " 71,\n", " 86,\n", " 12,\n", " 1]}" ] }, "execution_count": 34, "metadata": {}, "output_type": "execute_result" } ], "source": [ "process(datasets[8: 9], tokenizer)" ] }, { "cell_type": "code", "execution_count": 43, "metadata": { "id": "K2mgI6fZIdHD" }, "outputs": [], "source": [ "# 将数据分为训练集和测试集\n", "tokenized = datasets.train_test_split(test_size=0.1, seed=1024, shuffle=True)" ] }, { "cell_type": "code", "execution_count": 44, "metadata": { "id": "DthlmdhILLou" }, "outputs": [], "source": [ "f = lambda x: process(x, tokenizer)\n", "tokenized = tokenized.map(f, batched=True, remove_columns=datasets.column_names)\n", "tokenized.set_format(type='torch', device=device)" ] }, { "cell_type": "code", "execution_count": 47, "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "w5tMPpYxLTDH", "outputId": "cbf5ffc0-1d89-4b6d-fc3c-513c64a598a5" }, "outputs": [ { "data": { "text/plain": [ "(torch.Size([645401, 10]), torch.Size([645401]))" ] }, "execution_count": 47, "metadata": {}, "output_type": "execute_result" } ], "source": [ "tokenized['train']['inputs'].shape, tokenized['train']['labels'].shape" ] }, { "cell_type": "code", "execution_count": 49, "metadata": { "id": "vDHUFgRZLXyQ" }, "outputs": [], "source": [ "train_loader = DataLoader(tokenized['train'], batch_size=batch_size, shuffle=True)\n", "test_loader = DataLoader(tokenized['test'], batch_size=batch_size, shuffle=True)" ] }, { "cell_type": "code", "execution_count": 50, "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "ty-8deY9MKYc", "outputId": "ac08de19-5e46-438f-fbc6-489b10e7af90" }, "outputs": [ { "data": { "text/plain": [ "{'inputs': tensor([[ 2, 3, 3, ..., 3, 3, 85],\n", " [72, 87, 36, ..., 72, 81, 87],\n", " [68, 81, 3, ..., 3, 93, 76],\n", " ...,\n", " [ 3, 3, 3, ..., 33, 33, 3],\n", " [80, 51, 68, ..., 76, 82, 81],\n", " [ 5, 2, 3, ..., 82, 88, 81]], device='cuda:0'),\n", " 'labels': tensor([72, 86, 83, 88, 72, 3, 3, 3, 38, 82, 82, 3, 87, 73, 3, 81, 54, 3,\n", " 12, 92, 39, 72, 87, 79, 83, 16, 3, 3, 29, 76, 3, 70, 88, 80, 81, 12,\n", " 5, 72, 26, 86, 17, 85, 3, 2, 3, 70, 3, 85, 2, 72, 69, 17, 80, 68,\n", " 76, 11, 15, 3, 76, 87, 3, 68, 2, 3, 38, 70, 81, 51, 87, 16, 3, 71,\n", " 5, 87, 3, 3, 85, 78, 3, 72, 3, 72, 72, 87, 81, 66, 15, 3, 87, 76,\n", " 2, 3, 2, 80, 72, 89, 75, 87, 85, 17, 72, 49, 72, 85, 87, 3, 86, 76,\n", " 72, 3, 2, 85, 1, 3, 3, 3, 3, 3, 82, 3, 3, 72, 3, 68, 3, 3,\n", " 3, 11, 33, 3, 81, 38, 70, 3, 72, 66, 81, 67, 92, 3, 79, 86, 3, 64,\n", " 85, 3, 82, 16, 89, 73, 73, 82, 71, 29, 72, 87, 75, 68, 14, 71, 75, 72,\n", " 85, 72, 72, 72, 72, 72, 3, 86, 3, 85, 71, 3, 3, 3, 82, 15, 74, 79,\n", " 82, 17, 89, 62, 11, 76, 3, 3, 79, 66, 80, 2, 3, 32, 80, 3, 12, 11,\n", " 3, 3, 85, 73, 3, 76, 3, 38, 3, 3, 15, 91, 3, 72, 68, 3, 81, 11,\n", " 10, 32, 86, 3, 72, 87, 76, 3, 17, 3, 2, 3, 2, 72, 3, 87, 20, 84,\n", " 68, 39, 87, 2, 86, 72, 44, 12, 87, 85, 3, 17, 58, 3, 16, 92, 85, 3,\n", " 72, 88, 3, 3, 3, 36, 72, 72, 72, 3, 85, 3, 3, 86, 86, 3, 87, 3,\n", " 72, 83, 5, 68, 79, 82, 81, 3, 76, 82, 29, 3, 15, 12, 85, 20, 87, 87,\n", " 68, 72, 25, 80, 86, 73, 76, 70, 40, 85, 10, 3, 3, 73, 72, 2, 3, 12,\n", " 73, 3, 3, 2, 79, 83, 86, 94, 81, 72, 3, 86, 5, 3, 73, 3, 15, 59,\n", " 82, 12, 75, 73, 71, 3, 81, 3, 85, 1, 73, 3, 3, 71, 70, 3, 66, 76,\n", " 3, 68, 29, 86, 3, 3, 64, 74, 87, 76, 87, 72, 85, 76, 3, 3, 3, 68,\n", " 80, 19, 82, 3, 39, 72, 76, 19, 3, 33, 12, 3, 33, 73, 89, 3, 68, 3,\n", " 5, 11, 44, 83, 86, 87, 85, 17, 79, 71, 3, 3, 3, 11, 3, 3, 3, 76,\n", " 85, 80, 3, 3, 72, 3, 67, 3, 16, 3, 17, 2, 2, 87, 3, 3, 3, 87,\n", " 82, 87, 82, 3, 3, 3, 20, 2, 86, 88, 68, 86, 73, 82, 12, 85, 76, 3,\n", " 11, 76, 5, 72, 72, 3, 90, 66, 3, 3, 76, 83, 3, 2, 81, 75, 71, 83,\n", " 68, 6, 68, 3, 86, 53, 3, 72, 66, 33, 88, 79, 83, 72, 85, 75, 87, 55,\n", " 76, 3, 92, 3, 3, 29, 80, 3, 87, 72, 79, 3, 10, 5, 71, 85, 3, 85,\n", " 68, 3, 82, 3, 81, 76, 66, 3, 33, 16, 76, 3, 3, 64, 75, 2, 72, 71,\n", " 76, 3, 3, 3, 72, 71, 3, 86, 82, 3, 69, 72, 44, 3, 79, 82, 83, 3,\n", " 2, 71, 76, 3, 3, 69, 81, 3, 3, 76, 15, 3, 74, 2, 17, 87, 71, 67,\n", " 85, 68, 72, 3, 3, 93, 79, 79, 57, 56, 72, 82, 87, 83, 29, 5, 3, 3,\n", " 68, 3, 83, 51, 71, 72, 95, 82, 68, 3, 3, 17, 87, 3, 85, 68, 32, 82,\n", " 3, 88, 2, 82, 3, 87, 81, 68, 3, 38, 80, 76, 3, 33, 86, 3, 3, 92,\n", " 39, 3, 76, 76, 87, 88, 32, 88, 3, 72, 3, 3, 72, 3, 3, 3, 72, 82,\n", " 82, 3, 3, 83, 2, 62, 82, 82, 17, 74, 3, 87, 15, 3, 80, 2, 72, 87,\n", " 3, 72, 86, 3, 72, 17, 3, 92, 82, 3, 80, 91, 87, 88, 85, 3, 82, 33,\n", " 3, 2, 87, 76, 72, 2, 3, 85, 12, 76, 68, 81, 3, 3, 76, 3, 73, 82,\n", " 3, 3, 86, 3, 3, 85, 68, 73, 86, 3, 3, 3, 82, 3, 68, 87, 86, 72,\n", " 72, 53, 3, 72, 81, 23, 68, 86, 87, 86, 71, 20, 3, 3, 76, 3, 3, 39,\n", " 69, 72, 68, 3, 68, 68, 41, 85, 82, 85, 23, 23, 3, 29, 3, 51, 78, 3,\n", " 3, 29, 3, 70, 80, 3, 58, 3, 3, 87, 82, 88, 51, 72, 76, 3, 87, 86,\n", " 66, 3, 85, 32, 72, 72, 3, 3, 3, 82, 33, 49, 2, 82, 79, 53, 71, 80,\n", " 80, 86, 66, 72, 89, 10, 3, 3, 33, 70, 3, 3, 68, 85, 72, 29, 3, 68,\n", " 66, 5, 3, 3, 3, 72, 88, 75, 70, 82, 5, 15, 82, 16, 76, 3, 14, 86,\n", " 72, 87, 3, 3, 3, 17, 3, 56, 3, 3, 68, 3, 3, 12, 79, 81, 3, 73,\n", " 33, 3, 66, 76, 29, 5, 71, 3, 89, 2, 74, 3, 81, 3, 66, 68, 3, 11,\n", " 82, 3, 80, 82, 81, 3, 87, 83, 3, 92, 70, 3, 86, 87, 3, 92, 3, 12,\n", " 3, 3, 72, 3, 3, 3, 71, 17, 95, 85, 87, 3, 20, 69, 68, 82, 12, 83,\n", " 86, 72, 68, 41, 81, 79, 75, 3, 3, 24, 3, 72, 3, 80, 86, 85, 82, 70,\n", " 3, 85, 81, 87, 17, 3, 14, 87, 15, 3, 72, 20, 47, 86, 68, 3, 3, 3,\n", " 85, 41, 16, 87, 73, 20, 3, 68, 74, 3, 72, 83, 56, 11, 20, 80, 76, 64,\n", " 64, 3, 80, 77, 86, 3, 40, 3, 73, 3, 55, 10, 71, 11, 12, 72, 83, 85,\n", " 3, 81, 82, 3, 86, 66, 87, 3, 92, 3, 72, 79, 3, 72, 82, 38, 80, 3,\n", " 71, 72, 83, 3, 66, 87, 85, 79, 71, 3, 87, 87, 90, 75, 53, 5, 3, 76,\n", " 76, 29, 17, 75, 3, 33, 3, 75, 72, 80, 3, 3, 72, 72, 5, 48, 3, 3,\n", " 85, 3, 68, 89, 3, 8, 10, 85, 86, 71], device='cuda:0')}" ] }, "execution_count": 50, "metadata": {}, "output_type": "execute_result" } ], "source": [ "next(iter(train_loader))" ] }, { "cell_type": "code", "execution_count": 52, "metadata": { "id": "aAaBn0NHNvzq" }, "outputs": [], "source": [ "class CharMLP(nn.Module):\n", "\n", " def __init__(self, vs):\n", " # vs 字典大小\n", " super().__init__()\n", " self.emb = nn.Embedding(vs, 30)\n", " self.hidden1 = nn.Linear(10 * 30, 200)\n", " self.hidden2 = nn.Linear(200, 100)\n", " self.lm = nn.Linear(100, vs)\n", "\n", " def forward(self, x):\n", " # x: (B, 10)\n", " B = x.shape[0]\n", " emb = self.emb(x) # (B, 10, 30)\n", " h = emb.view(B, -1) # (B, 300)\n", " h = F.relu(self.hidden1(h)) # (B, 200)\n", " h = F.relu(self.hidden2(h)) # (B, 100)\n", " out = self.lm(h) # (B, vs)\n", " return out" ] }, { "cell_type": "code", "execution_count": 53, "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "O8QEEixcN3-y", "outputId": "75d4b222-d519-41ed-ac6a-f0a50f11b867" }, "outputs": [ { "data": { "text/plain": [ "CharMLP(\n", " (emb): Embedding(99, 30)\n", " (hidden1): Linear(in_features=300, out_features=200, bias=True)\n", " (hidden2): Linear(in_features=200, out_features=100, bias=True)\n", " (lm): Linear(in_features=100, out_features=99, bias=True)\n", ")" ] }, "execution_count": 53, "metadata": {}, "output_type": "execute_result" } ], "source": [ "model = CharMLP(len(tokenizer.char2ind)).to(device)\n", "model" ] }, { "cell_type": "code", "execution_count": 54, "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "eBwttuD0OFAp", "outputId": "744e8005-428b-438b-8a9e-8dd04e9c24a8" }, "outputs": [ { "data": { "text/plain": [ "{'train': 4.5956830978393555, 'test': 4.594418525695801}" ] }, "execution_count": 54, "metadata": {}, "output_type": "execute_result" } ], "source": [ "def estimate_loss(model):\n", " re = {}\n", " # 将模型切换至评估模式\n", " model.eval()\n", " re['train'] = _loss(model, train_loader)\n", " re['test'] = _loss(model, test_loader)\n", " # 将模型切换至训练模式\n", " model.train()\n", " return re\n", "\n", "@torch.no_grad()\n", "def _loss(model, data_loader):\n", " \"\"\"\n", " 计算模型在不同数据集下面的评估指标\n", " \"\"\"\n", " loss = []\n", " data_iter= iter(data_loader)\n", " # 随机使用多个批量数据来预估模型效果\n", " for k in range(eval_iters):\n", " data = next(data_iter, None)\n", " if data is None:\n", " data_iter = iter(data_loader)\n", " data = next(data_iter, None)\n", " inputs, labels = data['inputs'], data['labels']\n", " logits = model(inputs)\n", " loss.append(F.cross_entropy(logits, labels).item())\n", " return torch.tensor(loss).mean().item()\n", "\n", "estimate_loss(model)" ] }, { "cell_type": "code", "execution_count": 55, "metadata": { "id": "VClmDyIBORwH" }, "outputs": [], "source": [ "def train_model(model, optimizer, epochs=10):\n", " # 记录模型在训练集上的模型损失\n", " lossi = []\n", " for epoch in range(epochs):\n", " for i, data in enumerate(train_loader, 0):\n", " inputs, labels = data['inputs'], data['labels']\n", " optimizer.zero_grad()\n", " logits = model(inputs)\n", " loss = F.cross_entropy(logits, labels)\n", " lossi.append(loss.item())\n", " loss.backward()\n", " optimizer.step()\n", " # 评估模型,并输出结果\n", " stats = estimate_loss(model)\n", " train_loss = f'train loss {stats[\"train\"]:.4f}'\n", " test_loss = f'test loss {stats[\"test\"]:.4f}'\n", " print(f'epoch {epoch:>2}: {train_loss}, {test_loss}')\n", " return lossi" ] }, { "cell_type": "code", "execution_count": 56, "metadata": { "id": "tjVqfYGYOZbI" }, "outputs": [], "source": [ "@torch.no_grad()\n", "def generate(model, context, tokenizer, max_new_tokens=300):\n", " # context: (1, 10)\n", " out = []\n", " model.eval()\n", " for _ in range(max_new_tokens):\n", " logits = model(context) # (1, 99)\n", " probs = F.softmax(logits, dim=-1) # (1, 99)\n", " # 随机生成文本\n", " ix = torch.multinomial(probs, num_samples=1) # (1, 1)\n", " # 更新背景\n", " context = torch.concat((context[:, 1:], ix), dim=-1)\n", " out.append(ix.item())\n", " if out[-1] == tokenizer.end_ind:\n", " break\n", " model.train()\n", " return out" ] }, { "cell_type": "code", "execution_count": 58, "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "JqqwjlWKQFU6", "outputId": "f0b8c0be-1b72-41dc-c3a5-94cf48b4f16c" }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "bcsLg]C@00yb<|b|>C?)M^)!iHST24GbhFOX%-Pi (^`^F:^7y\\ '`\"7o\n" ] } ], "source": [ "context = torch.zeros((1, 10), dtype=torch.long, device=device)\n", "print(''.join(tokenizer.decode(generate(model, context, tokenizer))))" ] }, { "cell_type": "code", "execution_count": 59, "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "qMnzyCY8Qt0k", "outputId": "2ced7bd4-872f-4b02-ed7c-d854191ec368" }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "epoch 0: train loss 1.3770, test loss 1.5173\n", "epoch 1: train loss 1.2562, test loss 1.4910\n", "epoch 2: train loss 1.2012, test loss 1.4271\n", "epoch 3: train loss 1.1598, test loss 1.4003\n", "epoch 4: train loss 1.1460, test loss 1.3597\n", "epoch 5: train loss 1.1409, test loss 1.3340\n", "epoch 6: train loss 1.0796, test loss 1.3965\n", "epoch 7: train loss 1.0876, test loss 1.3648\n", "epoch 8: train loss 1.0685, test loss 1.3592\n", "epoch 9: train loss 1.0921, test loss 1.3188\n" ] } ], "source": [ "l = train_model(model, optim.Adam(model.parameters(), lr=learning_rate))" ] }, { "cell_type": "code", "execution_count": 60, "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "Pqy54pyIRD0D", "outputId": "d0376b01-92a2-4d26-c510-711d8d2e4604" }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "def chars_s[numNote.Sprechosk(pirt franBy.\n", " name = minvalue; 6Labele(ible str.s))\n", " return checkpointWithRand.\n", " raise ValueError:\n", " `DataFrame().collect()\n", " elif type(frectis).) by wrapped whorhate\n", " TypeError(\"andhartini\n" ] } ], "source": [ "context = torch.zeros((1, 10), dtype=torch.long, device=device)\n", "print(''.join(tokenizer.decode(generate(model, context, tokenizer))))" ] }, { "cell_type": "code", "execution_count": 61, "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 448 }, "id": "fTEO7oANR1hd", "outputId": "ea08c382-8e8d-45f9-dc7d-7dc8f843df0e" }, "outputs": [ { "data": { "text/plain": [ "[]" ] }, "execution_count": 61, "metadata": {}, "output_type": "execute_result" }, { "data": { "image/png": "\n", "text/plain": [ "
" ] }, "metadata": {}, "output_type": "display_data" } ], "source": [ "plt.plot(torch.tensor(l).view(-1, 10).mean(dim=-1))" ] }, { "cell_type": "code", "execution_count": null, "metadata": { "id": "hGpepZO7SHdY" }, "outputs": [], "source": [] } ], "metadata": { "accelerator": "GPU", "colab": { "gpuType": "T4", "provenance": [] }, "kernelspec": { "display_name": "Python 3", "language": "python", "name": "python3" }, "language_info": { "codemirror_mode": { "name": "ipython", "version": 3 }, "file_extension": ".py", "mimetype": "text/x-python", "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", "version": "3.8.5" }, "widgets": { "application/vnd.jupyter.widget-state+json": { "00bb3ff456444b0397816f21490a90f2": { "model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "08ac8d7ac893490f8cd625568cf4e5d1": { "model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": "" } }, "08d8c742014645279744eff2763845bd": { "model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "09da2bb790a54c179f481d531d3405eb": { "model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_179ba1b4b8b24b9eadc81a645ed702c8", "max": 412178, "min": 0, "orientation": "horizontal", "style": "IPY_MODEL_1d61f57335364ca0b02a0bd32b56fec6", "value": 412178 } }, "0dc5926e3ba0499a918a1c3cbfe862f3": { "model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_e2feea769fc14391bb944122c2e808e1", "placeholder": "​", "style": "IPY_MODEL_5cb0d5f4438749eb9f24fe4aa50ab6b7", "value": "Downloading builder script: 100%" } }, "142b9dcdc4514ea684c2d0522746e0af": { "model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "179ba1b4b8b24b9eadc81a645ed702c8": { "model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "1b5de35016af4f5686c1a09c3bcf88cd": { "model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": "" } }, "1d61f57335364ca0b02a0bd32b56fec6": { "model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": "" } }, "2387b751d5d6472d8d8f8e7c030338af": { "model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "23f6fe5d77c647c5b2c546b82b03667b": { "model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "25e19856014d44c9b762cd7a1f8dc319": { "model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_4ab8ec295f644193b088d95a3a9b3ec5", "max": 940909997, "min": 0, "orientation": "horizontal", "style": "IPY_MODEL_3298fe74f69146bbbbe364c2c4fe5332", "value": 940909997 } }, "26dfd6520e8049038e69114766b9a0ff": { "model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_a60bb837834b44378e178e4d9b1a52d4", "placeholder": "​", "style": "IPY_MODEL_b70d024a38864d6bb557bff17ae95d88", "value": "Downloading readme: 100%" } }, "2bed0a97406e46b9bf1c07e66be77dd5": { "model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": [ "IPY_MODEL_0dc5926e3ba0499a918a1c3cbfe862f3", "IPY_MODEL_b704286c3f2c4fa7bcbbc6e6d4b57fb6", "IPY_MODEL_49c33407cf8649bd95f63cf1ee22751b" ], "layout": "IPY_MODEL_e62ac2ea2f8448ee8232dd70eb9850d8" } }, "2c794c7d98024cbdb38a1ec3e5ccb31a": { "model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "3298fe74f69146bbbbe364c2c4fe5332": { "model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": "" } }, "3742bf06e2f540fb9d8786d7d2c8f317": { "model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "393fa623e36f4be992837c4d901fa23e": { "model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_7a9fb712ced44bf5bc48a4d53c60eeb5", "placeholder": "​", "style": "IPY_MODEL_deb24f274ab3445eb1d02106a6d6e9cf", "value": "Filter: 100%" } }, "39cc1628e42a4ecebe1e7541416a388d": { "model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_53b2163f134f4f9ca0fed9fbc431a4ec", "placeholder": "​", "style": "IPY_MODEL_08d8c742014645279744eff2763845bd", "value": " 412178/412178 [00:58<00:00, 5000.54 examples/s]" } }, "3c5b9b565db14586a40a4a8e54ebe7d3": { "model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "3f3463f177334349836d9cdc25fea796": { "model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "49c33407cf8649bd95f63cf1ee22751b": { "model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_f5b190ba8db74c789b25bf8869d44f6b", "placeholder": "​", "style": "IPY_MODEL_5a4d6fbda05e45f4b78368d4f02c6c38", "value": " 8.44k/8.44k [00:00<00:00, 199kB/s]" } }, "4ab8ec295f644193b088d95a3a9b3ec5": { "model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "4cbe13efb5dc40b0a7eebd9f7defffc6": { "model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": [ "IPY_MODEL_b9b6cf9874544468879f3302cbafdd0f", "IPY_MODEL_09da2bb790a54c179f481d531d3405eb", "IPY_MODEL_d5965607686242799233b3d462319eed" ], "layout": "IPY_MODEL_2387b751d5d6472d8d8f8e7c030338af" } }, "4d2392c4d43142ca9b8d01b7b2ebb5fd": { "model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "4d562acc0dcb490992a549f0d3504627": { "model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "50b76f3d1f3b4bebab396b6bca23e48b": { "model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "53b2163f134f4f9ca0fed9fbc431a4ec": { "model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "5504bb59eb6e47f79d3b91d42db65911": { "model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_3c5b9b565db14586a40a4a8e54ebe7d3", "placeholder": "​", "style": "IPY_MODEL_89502573192842bd8070a3d3120da01b", "value": " 941M/941M [00:20<00:00, 67.3MB/s]" } }, "57706c85ad7a44f4927b7f4e9c6fca75": { "model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_827d8054dfaa49edb71192929b9d6495", "placeholder": "​", "style": "IPY_MODEL_80e437bb9dab47b6b0f4892a21847349", "value": " 22176/22176 [00:10<00:00, 2649.71 examples/s]" } }, "5a4d6fbda05e45f4b78368d4f02c6c38": { "model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "5cb0d5f4438749eb9f24fe4aa50ab6b7": { "model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "5d410efac6014533bc1ba839a05d0aaa": { "model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": "" } }, "6b7f47c502144cafb10942d2f1987e78": { "model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "6c6403ef2e0f482599d0e54d58481f39": { "model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_c5453de040db461dae54c65cfadb8d39", "placeholder": "​", "style": "IPY_MODEL_b0f0fc0e102a4acc995a8cc1641074d9", "value": " 12.9k/12.9k [00:00<00:00, 243kB/s]" } }, "6f9585f9022c4360bcc6b5610b33600a": { "model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "77efb896627947cfa3bdf21f9414cb8a": { "model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "7a9fb712ced44bf5bc48a4d53c60eeb5": { "model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "7ab21750b1a0415d80f9f6f5aea4c13d": { "model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": [ "IPY_MODEL_8ef34aff5e9f4096add539f7f6ae29f2", "IPY_MODEL_25e19856014d44c9b762cd7a1f8dc319", "IPY_MODEL_5504bb59eb6e47f79d3b91d42db65911" ], "layout": "IPY_MODEL_bab3bf9895a04dfdbdc76dc642311197" } }, "7c25ae55118e4ec7ae7bffc25a0ae43e": { "model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_23f6fe5d77c647c5b2c546b82b03667b", "placeholder": "​", "style": "IPY_MODEL_82b0e10b205e48a8832bb8e8fbbb8160", "value": " 23107/23107 [00:11<00:00, 2744.81 examples/s]" } }, "7d2ec54cf30c495791e3a338b2168dd1": { "model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": "" } }, "7d7c7114ff6041e7ae8b48624bba47fa": { "model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "7dd2552a36ca4819a20c96cdbeed3e36": { "model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": [ "IPY_MODEL_26dfd6520e8049038e69114766b9a0ff", "IPY_MODEL_bbbd5b6f8f44455faf0a031466b2702f", "IPY_MODEL_6c6403ef2e0f482599d0e54d58481f39" ], "layout": "IPY_MODEL_b35467fc4f9041fd9ce882eecd2a6021" } }, "80e437bb9dab47b6b0f4892a21847349": { "model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "81a506124060495d9dc6b59eba2e2490": { "model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "827d8054dfaa49edb71192929b9d6495": { "model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "82b0e10b205e48a8832bb8e8fbbb8160": { "model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "869716edc1fe4dcc99a8880d9033f773": { "model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_3742bf06e2f540fb9d8786d7d2c8f317", "max": 23107, "min": 0, "orientation": "horizontal", "style": "IPY_MODEL_f441707f8fad401883c1220b2e360ff4", "value": 23107 } }, "89502573192842bd8070a3d3120da01b": { "model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "8ef34aff5e9f4096add539f7f6ae29f2": { "model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_a3cda732dbfb4a2f9768203548af20f5", "placeholder": "​", "style": "IPY_MODEL_77efb896627947cfa3bdf21f9414cb8a", "value": "Downloading data: 100%" } }, "8fa918d042164c879da4bd580192fdad": { "model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": [ "IPY_MODEL_393fa623e36f4be992837c4d901fa23e", "IPY_MODEL_b79a434bbbd44b41b0c2c94d794858ca", "IPY_MODEL_39cc1628e42a4ecebe1e7541416a388d" ], "layout": "IPY_MODEL_c896952f04184bd29b9e796fe0bbfa42" } }, "94bfa0c5b77e4bd2b17ff94739b457fe": { "model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "a245080a91284641900af30ffbb70577": { "model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "a3cda732dbfb4a2f9768203548af20f5": { "model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "a60bb837834b44378e178e4d9b1a52d4": { "model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "afeb10d4301f44ae9728fc2ef77291a2": { "model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": [ "IPY_MODEL_df2c621d9afd438482ea96e8803d56c7", "IPY_MODEL_d312591650f940e797746320007f3ef2", "IPY_MODEL_57706c85ad7a44f4927b7f4e9c6fca75" ], "layout": "IPY_MODEL_6f9585f9022c4360bcc6b5610b33600a" } }, "b0f0fc0e102a4acc995a8cc1641074d9": { "model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "b35467fc4f9041fd9ce882eecd2a6021": { "model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "b704286c3f2c4fa7bcbbc6e6d4b57fb6": { "model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_a245080a91284641900af30ffbb70577", "max": 8440, "min": 0, "orientation": "horizontal", "style": "IPY_MODEL_1b5de35016af4f5686c1a09c3bcf88cd", "value": 8440 } }, "b70d024a38864d6bb557bff17ae95d88": { "model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "b79a434bbbd44b41b0c2c94d794858ca": { "model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_4d562acc0dcb490992a549f0d3504627", "max": 412178, "min": 0, "orientation": "horizontal", "style": "IPY_MODEL_7d2ec54cf30c495791e3a338b2168dd1", "value": 412178 } }, "b9b6cf9874544468879f3302cbafdd0f": { "model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_3f3463f177334349836d9cdc25fea796", "placeholder": "​", "style": "IPY_MODEL_142b9dcdc4514ea684c2d0522746e0af", "value": "Generating train split: 100%" } }, "bab3bf9895a04dfdbdc76dc642311197": { "model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "bbbd5b6f8f44455faf0a031466b2702f": { "model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_50b76f3d1f3b4bebab396b6bca23e48b", "max": 12909, "min": 0, "orientation": "horizontal", "style": "IPY_MODEL_5d410efac6014533bc1ba839a05d0aaa", "value": 12909 } }, "c5453de040db461dae54c65cfadb8d39": { "model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "c896952f04184bd29b9e796fe0bbfa42": { "model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "d312591650f940e797746320007f3ef2": { "model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "FloatProgressModel", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_7d7c7114ff6041e7ae8b48624bba47fa", "max": 22176, "min": 0, "orientation": "horizontal", "style": "IPY_MODEL_08ac8d7ac893490f8cd625568cf4e5d1", "value": 22176 } }, "d35c100aed8743efa1b0df5a7e89308c": { "model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_81a506124060495d9dc6b59eba2e2490", "placeholder": "​", "style": "IPY_MODEL_2c794c7d98024cbdb38a1ec3e5ccb31a", "value": "Generating validation split: 100%" } }, "d5965607686242799233b3d462319eed": { "model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_6b7f47c502144cafb10942d2f1987e78", "placeholder": "​", "style": "IPY_MODEL_00bb3ff456444b0397816f21490a90f2", "value": " 412178/412178 [03:22<00:00, 2213.48 examples/s]" } }, "deb24f274ab3445eb1d02106a6d6e9cf": { "model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "DescriptionStyleModel", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "df2c621d9afd438482ea96e8803d56c7": { "model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HTMLModel", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_f492252b9930497fb55837093a9d130f", "placeholder": "​", "style": "IPY_MODEL_94bfa0c5b77e4bd2b17ff94739b457fe", "value": "Generating test split: 100%" } }, "e2feea769fc14391bb944122c2e808e1": { "model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "e62ac2ea2f8448ee8232dd70eb9850d8": { "model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "f402ab9afaa24efda0494e78ba44b3cb": { "model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "HBoxModel", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": [ "IPY_MODEL_d35c100aed8743efa1b0df5a7e89308c", "IPY_MODEL_869716edc1fe4dcc99a8880d9033f773", "IPY_MODEL_7c25ae55118e4ec7ae7bffc25a0ae43e" ], "layout": "IPY_MODEL_4d2392c4d43142ca9b8d01b7b2ebb5fd" } }, "f441707f8fad401883c1220b2e360ff4": { "model_module": "@jupyter-widgets/controls", "model_module_version": "1.5.0", "model_name": "ProgressStyleModel", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": "" } }, "f492252b9930497fb55837093a9d130f": { "model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "f5b190ba8db74c789b25bf8869d44f6b": { "model_module": "@jupyter-widgets/base", "model_module_version": "1.2.0", "model_name": "LayoutModel", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } } } } }, "nbformat": 4, "nbformat_minor": 1 }