2023-06-18 18:22:31 +02:00
{
2023-06-18 22:44:55 +02:00
"cells": [
{
"cell_type": "code",
"execution_count": 1,
"metadata": {
"colab": {
"base_uri": "https://localhost:8080/"
},
"id": "TVWZUBhyPfpa",
"outputId": "2a548af2-1981-4a46-b826-62b88ca08eb1"
},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"Requirement already satisfied: transformers in /usr/local/Caskroom/miniforge/base/envs/ai_env/lib/python3.8/site-packages (4.30.2)\n",
"Requirement already satisfied: torch in /usr/local/Caskroom/miniforge/base/envs/ai_env/lib/python3.8/site-packages (1.13.0)\n",
"Collecting accelerate\n",
" Downloading accelerate-0.20.3-py3-none-any.whl (227 kB)\n",
"\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m227.6/227.6 kB\u001b[0m \u001b[31m3.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0ma \u001b[36m0:00:01\u001b[0m\n",
"\u001b[?25hRequirement already satisfied: filelock in /Users/adamwojdyla/.local/lib/python3.8/site-packages (from transformers) (3.9.0)\n",
"Requirement already satisfied: huggingface-hub<1.0,>=0.14.1 in /usr/local/Caskroom/miniforge/base/envs/ai_env/lib/python3.8/site-packages (from transformers) (0.15.1)\n",
"Requirement already satisfied: numpy>=1.17 in /usr/local/Caskroom/miniforge/base/envs/ai_env/lib/python3.8/site-packages (from transformers) (1.24.2)\n",
"Requirement already satisfied: packaging>=20.0 in /usr/local/Caskroom/miniforge/base/envs/ai_env/lib/python3.8/site-packages (from transformers) (23.1)\n",
"Requirement already satisfied: pyyaml>=5.1 in /usr/local/Caskroom/miniforge/base/envs/ai_env/lib/python3.8/site-packages (from transformers) (6.0)\n",
"Requirement already satisfied: regex!=2019.12.17 in /usr/local/Caskroom/miniforge/base/envs/ai_env/lib/python3.8/site-packages (from transformers) (2023.3.23)\n",
"Requirement already satisfied: requests in /usr/local/Caskroom/miniforge/base/envs/ai_env/lib/python3.8/site-packages (from transformers) (2.28.2)\n",
"Requirement already satisfied: tokenizers!=0.11.3,<0.14,>=0.11.1 in /usr/local/Caskroom/miniforge/base/envs/ai_env/lib/python3.8/site-packages (from transformers) (0.13.3)\n",
"Requirement already satisfied: safetensors>=0.3.1 in /usr/local/Caskroom/miniforge/base/envs/ai_env/lib/python3.8/site-packages (from transformers) (0.3.1)\n",
"Requirement already satisfied: tqdm>=4.27 in /usr/local/Caskroom/miniforge/base/envs/ai_env/lib/python3.8/site-packages (from transformers) (4.65.0)\n",
"Requirement already satisfied: typing-extensions in /usr/local/Caskroom/miniforge/base/envs/ai_env/lib/python3.8/site-packages (from torch) (4.6.3)\n",
"Requirement already satisfied: psutil in /usr/local/Caskroom/miniforge/base/envs/ai_env/lib/python3.8/site-packages (from accelerate) (5.9.5)\n",
"Requirement already satisfied: fsspec in /usr/local/Caskroom/miniforge/base/envs/ai_env/lib/python3.8/site-packages (from huggingface-hub<1.0,>=0.14.1->transformers) (2023.6.0)\n",
"Requirement already satisfied: charset-normalizer<4,>=2 in /usr/local/Caskroom/miniforge/base/envs/ai_env/lib/python3.8/site-packages (from requests->transformers) (3.0.1)\n",
"Requirement already satisfied: idna<4,>=2.5 in /usr/local/Caskroom/miniforge/base/envs/ai_env/lib/python3.8/site-packages (from requests->transformers) (3.4)\n",
"Requirement already satisfied: urllib3<1.27,>=1.21.1 in /usr/local/Caskroom/miniforge/base/envs/ai_env/lib/python3.8/site-packages (from requests->transformers) (1.26.14)\n",
"Requirement already satisfied: certifi>=2017.4.17 in /usr/local/Caskroom/miniforge/base/envs/ai_env/lib/python3.8/site-packages (from requests->transformers) (2022.12.7)\n",
"Installing collected packages: accelerate\n",
"Successfully installed accelerate-0.20.3\n",
"\n",
"\u001b[1m[\u001b[0m\u001b[34;49mnotice\u001b[0m\u001b[1;39;49m]\u001b[0m\u001b[39;49m A new release of pip is available: \u001b[0m\u001b[31;49m23.0\u001b[0m\u001b[39;49m -> \u001b[0m\u001b[32;49m23.1.2\u001b[0m\n",
"\u001b[1m[\u001b[0m\u001b[34;49mnotice\u001b[0m\u001b[1;39;49m]\u001b[0m\u001b[39;49m To update, run: \u001b[0m\u001b[32;49mpip install --upgrade pip\u001b[0m\n"
]
}
],
"source": [
"!pip install transformers torch accelerate"
]
2023-06-18 18:22:31 +02:00
},
2023-06-18 22:44:55 +02:00
{
"cell_type": "markdown",
"metadata": {
"id": "xxbWwu3KSds-"
},
"source": [
"# Wczytanie bazowego modelu\n",
"Bazowym modelem jest polska wersja GPT2 https://huggingface.co/flax-community/papuGaPT2?text=Najsmaczniejszy+polski+owoc+to"
]
2023-06-18 18:22:31 +02:00
},
2023-06-18 22:44:55 +02:00
{
"cell_type": "code",
"execution_count": 2,
"metadata": {
"colab": {
"base_uri": "https://localhost:8080/",
"height": 273,
"referenced_widgets": [
"ac800b679bdc4382b28cbcf9c68303f0",
"2fa8106d87594af283e5b74915003783",
"04e5f6b3190740dd85bedac661c67770",
"37c645ebeb934c8db572d4b4da63f280",
"4757bdb315e04fb982ac45e0a26a7c2d",
"f125275065c64b6ca55f0767737a488a",
"06b012d7bd5b418eb74d89ba51dbc690",
"7e3d164400b342c897b4e647da36a02e",
"eadd02efcb204b20b3bfd8e99cde9ae3",
"2264a5b9de1d4e93acbdbd84c3abf040",
"e863997d8ce142798230810e384323ba",
"c09398bd98554499805b5f14270e4248",
"c3b4b0254d8b4e4eb399ca3514d36211",
"8adaa113d54247388e1355331451926a",
"bbedc4f5cece4090ad997ce39d65e96a",
"825fd5e9a017439995c67dcb3a7736b9",
"bab30e40fedb43dc8e0044c80727c38b",
"ffdbfdfd24f3433f9653a3a0b1a177d6",
"fc1af3db81b243178157ee330f62ff3c",
"a46138f2b04c4418816fa264c3deb892",
"b47c3295784648cf8847e198ee33c615",
"ee47504dd7274dfb860a5c4355a37295",
"31ec83a1244d416ba8cfe922748b7e55",
"3d41103299d5441184b2890a8a52b6ec",
"01e1e799e775450694e2842d87bbc871",
"244faf9363794c0a86175f72fb63655f",
"14b26d9b078f4a919f09f8133e5dd22d",
"109145210ff64132a36601470b3e24e6",
"1eefecffe6124ad6b835ed579a0adfa5",
"b7b911c6bca94858bb93ffbcb1daa736",
"4b7636fbfe854056acadd394d71cde75",
"afc4c68e30a14d74b7c1547f02570baf",
"57763424d94a4384b4fa4c762062b6ba",
"3a9bbce5adf04b77beed6eb10211551f",
"9125492ba517409eb77722982d57b948",
"ff2160ef3ab14d4682cfbb1b878af62f",
"52d637c25ad84c6fae643fe7f687f63a",
"a87573424cf0463a85b56271931d6dc8",
"95dc4d80e12c4020bdd8f5d849107cf5",
"c1d658d5f21f4731895b397cc3fcb055",
"53f98231a2c140efbd0a1d2d25367b1f",
"367f3aae32ab4e1b9f67f3cd29299c5b",
"b6aa40c7501f44178f14ac88b63f57cb",
"984a17db21ee4aa898323ecde9c14f16",
"dc277586ba1f4eeda104c895cf9a1626",
"3b6bfbe260a9403c8216269b5032cde4",
"a7d258bfe8644c38a56ca365ea9e4ab1",
"0f75959ab6364a60b229051f0d5b2c68",
"ca47940201884085b556bbc7032f17f2",
"eb4e61e04bc04929be057a5a960feb9d",
"b7ef949a1eb0469fb0bd1be5256fa79a",
"f7687d83ee0149248610c40d4d86d944",
"bfa116bd3e144c15b67bd97ff3c85fea",
"7e58b084511e4232a0d197539306c57f",
"7e8ca657aedb41da9a99c3d3d648ea00",
"5cfa6f79da7e47639bfdea6d8f70dd7d",
"3530c50e41b54531b12d04c807d3924a",
"b6afee105c69499f98cf0544ffe325cb",
"3219d928e9e14e4ba95bf2aad70162a3",
"0853024b81894cc79c7f6b8de97c5c5b",
"59d4ec3a13844c878d4e95896a37121d",
"1498b932de1b4a5f922395ecf3b437a9",
"083cd7a3ebb34bbf8940af58359a4848",
"4e16ca13c2dd46069b65dd48f3da8790",
"98e047a8134f4502bb134beb26ffe821",
"ad3e29e3250a4323b715a7ffe279c799",
"5c71295523ea4561a6fe8534c0b160e2",
"c62c829fa4f346f4966f68e020c50813",
"f10ed53b98304b6197789308330e1bf8",
"9516994367bc488faeae786254eff8c7",
"f95ffcc1b9564519aa1f1c81e2d16dbf",
"e7fafc300aa749a2bedd750295731307",
"05032586bc4d4f8c9a1fa023695e60ec",
"7e56e3fd676440d0a23ca09f8b5c7d4e",
"855d7b31b1a44fb9b667e84f30bd121a",
"164ae1d73d4b461fb27c0401b8ce09fe",
"6e3c14738f864803b0f95cd940f23d9e",
"3ade165824644044bb922256c3773156",
"6c924e348934452887581e23151c7ebb",
"85a446e817c943c7a26e40a7ad8f511f",
"08c86037bfe442079bb79321147a73df",
"d3f1817bcb0a4e8a85e0515898c13850",
"2e154a9d0eeb45c38728084edb841a29",
"2a67736c8e3a481aa139b021a89140ab",
"6bb99699d0614c83b588a7dd65351c1c",
"f380816f81d046b880b12a429d624c2f",
"17b70c7ee49f477cacf15abe01d88905",
"7c0ca4701ce64754b5f31663458e925b"
]
2023-06-18 18:22:31 +02:00
},
2023-06-18 22:44:55 +02:00
"id": "LdRQU2xnOrst",
"outputId": "414a875b-08d7-45f3-ae17-ef47a5fe3db3"
},
"outputs": [
{
"data": {
"application/vnd.jupyter.widget-view+json": {
"model_id": "12908d60c7114acf998fbb62a8d8641c",
"version_major": 2,
"version_minor": 0
},
"text/plain": [
"Downloading config.json: 0%| | 0.00/864 [00:00<?, ?B/s]"
]
},
"metadata": {},
"output_type": "display_data"
2023-06-18 18:22:31 +02:00
},
2023-06-18 22:44:55 +02:00
{
"data": {
"application/vnd.jupyter.widget-view+json": {
"model_id": "5f4ada04bb734a51beaf2a93a622e423",
"version_major": 2,
"version_minor": 0
},
"text/plain": [
"Downloading pytorch_model.bin: 0%| | 0.00/510M [00:00<?, ?B/s]"
]
},
"metadata": {},
"output_type": "display_data"
2023-06-18 18:22:31 +02:00
},
2023-06-18 22:44:55 +02:00
{
"data": {
"application/vnd.jupyter.widget-view+json": {
"model_id": "70e2466ff41a452e99d4e97054c32ae9",
"version_major": 2,
"version_minor": 0
},
"text/plain": [
"Downloading tokenizer_config.json: 0%| | 0.00/208 [00:00<?, ?B/s]"
]
},
"metadata": {},
"output_type": "display_data"
2023-06-18 18:22:31 +02:00
},
2023-06-18 22:44:55 +02:00
{
"data": {
"application/vnd.jupyter.widget-view+json": {
"model_id": "35ac099b73244112a90948e2cf5e706e",
"version_major": 2,
"version_minor": 0
},
"text/plain": [
"Downloading vocab.json: 0%| | 0.00/888k [00:00<?, ?B/s]"
]
},
"metadata": {},
"output_type": "display_data"
2023-06-18 18:22:31 +02:00
},
2023-06-18 22:44:55 +02:00
{
"data": {
"application/vnd.jupyter.widget-view+json": {
"model_id": "1e8068e6732242a39c913575ce6f99df",
"version_major": 2,
"version_minor": 0
},
"text/plain": [
"Downloading merges.txt: 0%| | 0.00/547k [00:00<?, ?B/s]"
]
},
"metadata": {},
"output_type": "display_data"
2023-06-18 18:22:31 +02:00
},
2023-06-18 22:44:55 +02:00
{
"data": {
"application/vnd.jupyter.widget-view+json": {
"model_id": "817d5232bd7343a6ae3c25d8f3c98500",
"version_major": 2,
"version_minor": 0
},
"text/plain": [
"Downloading tokenizer.json: 0%| | 0.00/1.54M [00:00<?, ?B/s]"
]
},
"metadata": {},
"output_type": "display_data"
2023-06-18 18:22:31 +02:00
},
2023-06-18 22:44:55 +02:00
{
"data": {
"application/vnd.jupyter.widget-view+json": {
"model_id": "f251ce84affe429dbce971b74c339398",
"version_major": 2,
"version_minor": 0
},
"text/plain": [
"Downloading added_tokens.json: 0%| | 0.00/24.0 [00:00<?, ?B/s]"
]
},
"metadata": {},
"output_type": "display_data"
2023-06-18 18:22:31 +02:00
},
2023-06-18 22:44:55 +02:00
{
"data": {
"application/vnd.jupyter.widget-view+json": {
"model_id": "707438f17b99435c9279e7cf9b404627",
"version_major": 2,
"version_minor": 0
},
"text/plain": [
"Downloading (…)cial_tokens_map.json: 0%| | 0.00/90.0 [00:00<?, ?B/s]"
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"from transformers import AutoTokenizer, AutoModelForCausalLM, set_seed\n",
"import pandas as pd\n",
"\n",
"model = AutoModelForCausalLM.from_pretrained('flax-community/papuGaPT2')\n",
"tokenizer = AutoTokenizer.from_pretrained('flax-community/papuGaPT2')\n",
"\n",
"tokenizer.pad_token = tokenizer.eos_token"
]
},
{
"cell_type": "markdown",
"metadata": {
"id": "IY2e11OjS54T"
},
"source": [
"# Wczytanie danych do finetuningu\n",
"Dane stworzyliśmy ręcznie oraz za pomocą ChatGPT."
]
},
{
"cell_type": "markdown",
"metadata": {
"collapsed": false
},
"source": []
},
{
"cell_type": "code",
"execution_count": 3,
"metadata": {
"colab": {
"base_uri": "https://localhost:8080/"
2023-06-18 18:22:31 +02:00
},
2023-06-18 22:44:55 +02:00
"id": "tD7U4Qa5UhEf",
"outputId": "1f215c64-dd7f-4d3f-9e65-072aa2ddfab9"
},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"question: Dlaczego w ogóle warto się starać?\n",
"answer: Nie warto. Wszystko i tak skończy się niepowodzeniem.\n"
]
}
],
"source": [
"data = pd.read_csv('prompts.csv', sep=';')\n",
"# data.head()\n",
"# data[\"answer\"]\n",
"texts = 'question: ' + data['question'] + \"\\nanswer: \" + data['answer']\n",
"texts = texts.tolist()\n",
"print(texts[0])"
]
},
{
"cell_type": "markdown",
"metadata": {
"id": "CQw_oCFyUnY_"
},
"source": [
"# Preprocessing"
]
},
{
"cell_type": "code",
"execution_count": 4,
"metadata": {
"id": "_AYrfmfGXMEV"
},
"outputs": [],
"source": [
"from torch.utils.data import Dataset, DataLoader, random_split, RandomSampler, SequentialSampler\n",
"import torch\n",
"\n",
"# Create custom dataset\n",
"class PromptsDataset(Dataset):\n",
" def __init__(self, txt_list, tokenizer):\n",
" self.tokenizer = tokenizer\n",
" self.input_ids = []\n",
" self.attn_masks = []\n",
"\n",
" for txt in txt_list:\n",
" encodings_dict = tokenizer(txt, padding=\"max_length\", truncation=True, max_length=512)\n",
" self.input_ids.append(torch.tensor(encodings_dict['input_ids']))\n",
" self.attn_masks.append(torch.tensor(encodings_dict['attention_mask']))\n",
"\n",
" def __len__(self):\n",
" return len(self.input_ids)\n",
"\n",
" def __getitem__(self, idx):\n",
" return self.input_ids[idx], self.attn_masks[idx]"
]
},
{
"cell_type": "code",
"execution_count": 5,
"metadata": {
"colab": {
"base_uri": "https://localhost:8080/"
2023-06-18 18:22:31 +02:00
},
2023-06-18 22:44:55 +02:00
"id": "yQp1opRYXPAv",
"outputId": "04a99a2d-d1c6-4216-b676-1197ba2cb781"
},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
" 154 training samples\n",
" 18 validation samples\n"
]
}
],
"source": [
"# Create dataset\n",
"dataset = PromptsDataset(texts, tokenizer)\n",
"\n",
"# Split into training and validation sets\n",
"train_size = int(0.9 * len(dataset))\n",
"val_size = len(dataset) - train_size\n",
"\n",
"train_dataset, val_dataset = random_split(dataset, [train_size, val_size])\n",
"\n",
"print('{:>5,} training samples'.format(train_size))\n",
"print('{:>5,} validation samples'.format(val_size))"
]
},
{
"cell_type": "code",
"execution_count": 6,
"metadata": {
"colab": {
"base_uri": "https://localhost:8080/"
2023-06-18 18:22:31 +02:00
},
2023-06-18 22:44:55 +02:00
"id": "vX-uxFqkl5rw",
"outputId": "7c83eac7-8c5c-4910-a7b9-799130dde915"
},
"outputs": [
{
"data": {
"text/plain": [
"(tensor([ 7636, 1736, 536, 30, 6072, 263, 4090, 1076, 330, 20777,\n",
" 35, 203, 16488, 1633, 30, 225, 624, 1076, 18, 4651,\n",
" 288, 497, 8427, 330, 19241, 3239, 18, 50256, 50256, 50256,\n",
" 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256,\n",
" 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256,\n",
" 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256,\n",
" 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256,\n",
" 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256,\n",
" 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256,\n",
" 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256,\n",
" 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256,\n",
" 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256,\n",
" 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256,\n",
" 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256,\n",
" 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256,\n",
" 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256,\n",
" 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256,\n",
" 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256,\n",
" 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256,\n",
" 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256,\n",
" 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256,\n",
" 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256,\n",
" 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256,\n",
" 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256,\n",
" 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256,\n",
" 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256,\n",
" 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256,\n",
" 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256,\n",
" 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256,\n",
" 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256,\n",
" 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256,\n",
" 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256,\n",
" 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256,\n",
" 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256,\n",
" 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256,\n",
" 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256,\n",
" 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256,\n",
" 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256,\n",
" 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256,\n",
" 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256,\n",
" 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256,\n",
" 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256,\n",
" 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256,\n",
" 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256,\n",
" 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256,\n",
" 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256,\n",
" 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256,\n",
" 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256,\n",
" 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256,\n",
" 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256,\n",
" 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256, 50256,\n",
" 50256, 50256]),\n",
" tensor([1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,\n",
" 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,\n",
" 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,\n",
" 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,\n",
" 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,\n",
" 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,\n",
" 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,\n",
" 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,\n",
" 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,\n",
" 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,\n",
" 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,\n",
" 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,\n",
" 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,\n",
" 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,\n",
" 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,\n",
" 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,\n",
" 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,\n",
" 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,\n",
" 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,\n",
" 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,\n",
" 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,\n",
" 0, 0, 0, 0, 0, 0, 0, 0]))"
]
},
"execution_count": 6,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"dataset[0]"
]
},
{
"cell_type": "code",
"execution_count": 7,
"metadata": {
"id": "4LDKgbSAcPo8"
},
"outputs": [],
"source": [
"batch_size = 8\n",
"\n",
"# Create the DataLoaders for our training and validation datasets.\n",
"# We'll take training samples in random order.\n",
"train_dataloader = DataLoader(\n",
" train_dataset, # The training samples.\n",
" sampler = RandomSampler(train_dataset), # Select batches randomly\n",
" batch_size = batch_size # Trains with this batch size.\n",
" )\n",
"\n",
"# For validation the order doesn't matter, so we'll just read them sequentially.\n",
"validation_dataloader = DataLoader(\n",
" val_dataset, # The validation samples.\n",
" sampler = SequentialSampler(val_dataset), # Pull out batches sequentially.\n",
" batch_size = batch_size # Evaluate with this batch size.\n",
" )"
]
},
{
"cell_type": "markdown",
"metadata": {
"id": "a5NTJK7HVjYD"
},
"source": [
"# Fine-tuning"
]
},
{
"cell_type": "code",
"execution_count": 8,
"metadata": {
"id": "TnPudHlZVmaA"
},
"outputs": [],
"source": [
"# some parameters I cooked up that work reasonably well\n",
"\n",
"epochs = 10\n",
"learning_rate = 0.001\n",
"warmup_steps = 1e2\n",
"epsilon = 1e-8"
]
},
{
"cell_type": "code",
"execution_count": 9,
"metadata": {
"colab": {
"base_uri": "https://localhost:8080/"
2023-06-18 18:22:31 +02:00
},
2023-06-18 22:44:55 +02:00
"id": "ZPic7oqNdGcH",
"outputId": "11bb22bf-31a5-4855-d35d-79fdd14a7cce"
},
"outputs": [
{
"name": "stderr",
"output_type": "stream",
"text": [
"/usr/local/Caskroom/miniforge/base/envs/ai_env/lib/python3.8/site-packages/transformers/optimization.py:411: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
" warnings.warn(\n"
]
}
],
"source": [
"from transformers import AdamW, get_linear_schedule_with_warmup\n",
"\n",
"# Note: AdamW is a class from the huggingface library (as opposed to pytorch)\n",
"optimizer = AdamW(model.parameters(),\n",
" lr = learning_rate,\n",
" eps = epsilon\n",
" )"
]
},
{
"cell_type": "code",
"execution_count": 10,
"metadata": {
"id": "u-zq78GveBbk"
},
"outputs": [],
"source": [
"# Total number of training steps is [number of batches] x [number of epochs].\n",
"# (Note that this is not the same as the number of training samples).\n",
"total_steps = len(train_dataloader) * epochs\n",
"\n",
"# Create the learning rate scheduler.\n",
"# This changes the learning rate as the training loop progresses\n",
"scheduler = get_linear_schedule_with_warmup(optimizer,\n",
" num_warmup_steps = warmup_steps,\n",
" num_training_steps = total_steps)"
]
},
{
"cell_type": "code",
"execution_count": 11,
"metadata": {
"colab": {
"base_uri": "https://localhost:8080/"
2023-06-18 18:22:31 +02:00
},
2023-06-18 22:44:55 +02:00
"id": "52TDlVRadJCq",
"outputId": "a60440b3-a297-4af3-905b-ce47c3cce6f7"
},
"outputs": [
{
"data": {
"text/plain": [
"GPT2LMHeadModel(\n",
" (transformer): GPT2Model(\n",
" (wte): Embedding(50257, 768)\n",
" (wpe): Embedding(1024, 768)\n",
" (drop): Dropout(p=0.0, inplace=False)\n",
" (h): ModuleList(\n",
" (0): GPT2Block(\n",
" (ln_1): LayerNorm((768,), eps=1e-05, elementwise_affine=True)\n",
" (attn): GPT2Attention(\n",
" (c_attn): Conv1D()\n",
" (c_proj): Conv1D()\n",
" (attn_dropout): Dropout(p=0.0, inplace=False)\n",
" (resid_dropout): Dropout(p=0.0, inplace=False)\n",
" )\n",
" (ln_2): LayerNorm((768,), eps=1e-05, elementwise_affine=True)\n",
" (mlp): GPT2MLP(\n",
" (c_fc): Conv1D()\n",
" (c_proj): Conv1D()\n",
" (act): NewGELUActivation()\n",
" (dropout): Dropout(p=0.0, inplace=False)\n",
" )\n",
" )\n",
" (1): GPT2Block(\n",
" (ln_1): LayerNorm((768,), eps=1e-05, elementwise_affine=True)\n",
" (attn): GPT2Attention(\n",
" (c_attn): Conv1D()\n",
" (c_proj): Conv1D()\n",
" (attn_dropout): Dropout(p=0.0, inplace=False)\n",
" (resid_dropout): Dropout(p=0.0, inplace=False)\n",
" )\n",
" (ln_2): LayerNorm((768,), eps=1e-05, elementwise_affine=True)\n",
" (mlp): GPT2MLP(\n",
" (c_fc): Conv1D()\n",
" (c_proj): Conv1D()\n",
" (act): NewGELUActivation()\n",
" (dropout): Dropout(p=0.0, inplace=False)\n",
" )\n",
" )\n",
" (2): GPT2Block(\n",
" (ln_1): LayerNorm((768,), eps=1e-05, elementwise_affine=True)\n",
" (attn): GPT2Attention(\n",
" (c_attn): Conv1D()\n",
" (c_proj): Conv1D()\n",
" (attn_dropout): Dropout(p=0.0, inplace=False)\n",
" (resid_dropout): Dropout(p=0.0, inplace=False)\n",
" )\n",
" (ln_2): LayerNorm((768,), eps=1e-05, elementwise_affine=True)\n",
" (mlp): GPT2MLP(\n",
" (c_fc): Conv1D()\n",
" (c_proj): Conv1D()\n",
" (act): NewGELUActivation()\n",
" (dropout): Dropout(p=0.0, inplace=False)\n",
" )\n",
" )\n",
" (3): GPT2Block(\n",
" (ln_1): LayerNorm((768,), eps=1e-05, elementwise_affine=True)\n",
" (attn): GPT2Attention(\n",
" (c_attn): Conv1D()\n",
" (c_proj): Conv1D()\n",
" (attn_dropout): Dropout(p=0.0, inplace=False)\n",
" (resid_dropout): Dropout(p=0.0, inplace=False)\n",
" )\n",
" (ln_2): LayerNorm((768,), eps=1e-05, elementwise_affine=True)\n",
" (mlp): GPT2MLP(\n",
" (c_fc): Conv1D()\n",
" (c_proj): Conv1D()\n",
" (act): NewGELUActivation()\n",
" (dropout): Dropout(p=0.0, inplace=False)\n",
" )\n",
" )\n",
" (4): GPT2Block(\n",
" (ln_1): LayerNorm((768,), eps=1e-05, elementwise_affine=True)\n",
" (attn): GPT2Attention(\n",
" (c_attn): Conv1D()\n",
" (c_proj): Conv1D()\n",
" (attn_dropout): Dropout(p=0.0, inplace=False)\n",
" (resid_dropout): Dropout(p=0.0, inplace=False)\n",
" )\n",
" (ln_2): LayerNorm((768,), eps=1e-05, elementwise_affine=True)\n",
" (mlp): GPT2MLP(\n",
" (c_fc): Conv1D()\n",
" (c_proj): Conv1D()\n",
" (act): NewGELUActivation()\n",
" (dropout): Dropout(p=0.0, inplace=False)\n",
" )\n",
" )\n",
" (5): GPT2Block(\n",
" (ln_1): LayerNorm((768,), eps=1e-05, elementwise_affine=True)\n",
" (attn): GPT2Attention(\n",
" (c_attn): Conv1D()\n",
" (c_proj): Conv1D()\n",
" (attn_dropout): Dropout(p=0.0, inplace=False)\n",
" (resid_dropout): Dropout(p=0.0, inplace=False)\n",
" )\n",
" (ln_2): LayerNorm((768,), eps=1e-05, elementwise_affine=True)\n",
" (mlp): GPT2MLP(\n",
" (c_fc): Conv1D()\n",
" (c_proj): Conv1D()\n",
" (act): NewGELUActivation()\n",
" (dropout): Dropout(p=0.0, inplace=False)\n",
" )\n",
" )\n",
" (6): GPT2Block(\n",
" (ln_1): LayerNorm((768,), eps=1e-05, elementwise_affine=True)\n",
" (attn): GPT2Attention(\n",
" (c_attn): Conv1D()\n",
" (c_proj): Conv1D()\n",
" (attn_dropout): Dropout(p=0.0, inplace=False)\n",
" (resid_dropout): Dropout(p=0.0, inplace=False)\n",
" )\n",
" (ln_2): LayerNorm((768,), eps=1e-05, elementwise_affine=True)\n",
" (mlp): GPT2MLP(\n",
" (c_fc): Conv1D()\n",
" (c_proj): Conv1D()\n",
" (act): NewGELUActivation()\n",
" (dropout): Dropout(p=0.0, inplace=False)\n",
" )\n",
" )\n",
" (7): GPT2Block(\n",
" (ln_1): LayerNorm((768,), eps=1e-05, elementwise_affine=True)\n",
" (attn): GPT2Attention(\n",
" (c_attn): Conv1D()\n",
" (c_proj): Conv1D()\n",
" (attn_dropout): Dropout(p=0.0, inplace=False)\n",
" (resid_dropout): Dropout(p=0.0, inplace=False)\n",
" )\n",
" (ln_2): LayerNorm((768,), eps=1e-05, elementwise_affine=True)\n",
" (mlp): GPT2MLP(\n",
" (c_fc): Conv1D()\n",
" (c_proj): Conv1D()\n",
" (act): NewGELUActivation()\n",
" (dropout): Dropout(p=0.0, inplace=False)\n",
" )\n",
" )\n",
" (8): GPT2Block(\n",
" (ln_1): LayerNorm((768,), eps=1e-05, elementwise_affine=True)\n",
" (attn): GPT2Attention(\n",
" (c_attn): Conv1D()\n",
" (c_proj): Conv1D()\n",
" (attn_dropout): Dropout(p=0.0, inplace=False)\n",
" (resid_dropout): Dropout(p=0.0, inplace=False)\n",
" )\n",
" (ln_2): LayerNorm((768,), eps=1e-05, elementwise_affine=True)\n",
" (mlp): GPT2MLP(\n",
" (c_fc): Conv1D()\n",
" (c_proj): Conv1D()\n",
" (act): NewGELUActivation()\n",
" (dropout): Dropout(p=0.0, inplace=False)\n",
" )\n",
" )\n",
" (9): GPT2Block(\n",
" (ln_1): LayerNorm((768,), eps=1e-05, elementwise_affine=True)\n",
" (attn): GPT2Attention(\n",
" (c_attn): Conv1D()\n",
" (c_proj): Conv1D()\n",
" (attn_dropout): Dropout(p=0.0, inplace=False)\n",
" (resid_dropout): Dropout(p=0.0, inplace=False)\n",
" )\n",
" (ln_2): LayerNorm((768,), eps=1e-05, elementwise_affine=True)\n",
" (mlp): GPT2MLP(\n",
" (c_fc): Conv1D()\n",
" (c_proj): Conv1D()\n",
" (act): NewGELUActivation()\n",
" (dropout): Dropout(p=0.0, inplace=False)\n",
" )\n",
" )\n",
" (10): GPT2Block(\n",
" (ln_1): LayerNorm((768,), eps=1e-05, elementwise_affine=True)\n",
" (attn): GPT2Attention(\n",
" (c_attn): Conv1D()\n",
" (c_proj): Conv1D()\n",
" (attn_dropout): Dropout(p=0.0, inplace=False)\n",
" (resid_dropout): Dropout(p=0.0, inplace=False)\n",
" )\n",
" (ln_2): LayerNorm((768,), eps=1e-05, elementwise_affine=True)\n",
" (mlp): GPT2MLP(\n",
" (c_fc): Conv1D()\n",
" (c_proj): Conv1D()\n",
" (act): NewGELUActivation()\n",
" (dropout): Dropout(p=0.0, inplace=False)\n",
" )\n",
" )\n",
" (11): GPT2Block(\n",
" (ln_1): LayerNorm((768,), eps=1e-05, elementwise_affine=True)\n",
" (attn): GPT2Attention(\n",
" (c_attn): Conv1D()\n",
" (c_proj): Conv1D()\n",
" (attn_dropout): Dropout(p=0.0, inplace=False)\n",
" (resid_dropout): Dropout(p=0.0, inplace=False)\n",
" )\n",
" (ln_2): LayerNorm((768,), eps=1e-05, elementwise_affine=True)\n",
" (mlp): GPT2MLP(\n",
" (c_fc): Conv1D()\n",
" (c_proj): Conv1D()\n",
" (act): NewGELUActivation()\n",
" (dropout): Dropout(p=0.0, inplace=False)\n",
" )\n",
" )\n",
" )\n",
" (ln_f): LayerNorm((768,), eps=1e-05, elementwise_affine=True)\n",
" )\n",
" (lm_head): Linear(in_features=768, out_features=50257, bias=False)\n",
")"
]
},
"execution_count": 11,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"import datetime\n",
"import time\n",
"import random\n",
"\n",
"def format_time(elapsed):\n",
" return str(datetime.timedelta(seconds=int(round((elapsed)))))\n",
"\n",
"device = torch.device(\"mps\")\n",
"model.to(device)"
]
},
{
"cell_type": "code",
"execution_count": 12,
"metadata": {
"colab": {
"base_uri": "https://localhost:8080/"
2023-06-18 18:22:31 +02:00
},
2023-06-18 22:44:55 +02:00
"id": "pPNGSJoadS9V",
"outputId": "f012a036-80ed-499a-8323-25673d0724a2",
"pycharm": {
"is_executing": true
}
},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"\n",
"======== Epoch 1 / 10 ========\n",
"Training...\n",
"\n",
" Average training loss: 2.44\n",
" Training epoch took: 0:01:47\n",
"\n",
"Running Validation...\n",
" Validation Loss: 0.26\n",
" Validation took: 0:00:05\n",
"\n",
"======== Epoch 2 / 10 ========\n",
"Training...\n",
"\n",
" Average training loss: 0.14\n",
" Training epoch took: 0:01:59\n",
"\n",
"Running Validation...\n",
" Validation Loss: 0.14\n",
" Validation took: 0:00:05\n",
"\n",
"======== Epoch 3 / 10 ========\n",
"Training...\n",
"\n",
" Average training loss: 0.08\n",
" Training epoch took: 0:01:57\n",
"\n",
"Running Validation...\n",
" Validation Loss: 0.13\n",
" Validation took: 0:00:04\n",
"\n",
"======== Epoch 4 / 10 ========\n",
"Training...\n",
"\n",
" Average training loss: 0.06\n",
" Training epoch took: 0:01:48\n",
"\n",
"Running Validation...\n",
" Validation Loss: 0.13\n",
" Validation took: 0:00:04\n",
"\n",
"======== Epoch 5 / 10 ========\n",
"Training...\n",
"\n",
" Average training loss: 0.05\n",
" Training epoch took: 0:01:54\n",
"\n",
"Running Validation...\n",
" Validation Loss: 0.14\n",
" Validation took: 0:00:05\n",
"\n",
"======== Epoch 6 / 10 ========\n",
"Training...\n",
"\n",
" Average training loss: 0.04\n",
" Training epoch took: 0:01:45\n",
"\n",
"Running Validation...\n",
" Validation Loss: 0.15\n",
" Validation took: 0:00:04\n",
"\n",
"======== Epoch 7 / 10 ========\n",
"Training...\n",
"\n",
" Average training loss: 0.03\n",
" Training epoch took: 0:02:03\n",
"\n",
"Running Validation...\n",
" Validation Loss: 0.15\n",
" Validation took: 0:00:05\n",
"\n",
"======== Epoch 8 / 10 ========\n",
"Training...\n",
"\n",
" Average training loss: 0.02\n",
" Training epoch took: 0:01:48\n",
"\n",
"Running Validation...\n",
" Validation Loss: 0.15\n",
" Validation took: 0:00:03\n",
"\n",
"======== Epoch 9 / 10 ========\n",
"Training...\n",
"\n",
" Average training loss: 0.01\n",
" Training epoch took: 0:01:59\n",
"\n",
"Running Validation...\n",
" Validation Loss: 0.16\n",
" Validation took: 0:00:05\n",
"\n",
"======== Epoch 10 / 10 ========\n",
"Training...\n",
"\n",
" Average training loss: 0.01\n",
" Training epoch took: 0:01:50\n",
"\n",
"Running Validation...\n",
" Validation Loss: 0.16\n",
" Validation took: 0:00:04\n",
"\n",
"Training complete!\n",
"Total training took 0:19:35 (h:mm:ss)\n"
]
}
],
"source": [
"total_t0 = time.time()\n",
"\n",
"training_stats = []\n",
"\n",
"model = model.to(device)\n",
"\n",
"for epoch_i in range(0, epochs):\n",
"\n",
" # ========================================\n",
" # Training\n",
" # ========================================\n",
"\n",
" print(\"\")\n",
" print('======== Epoch {:} / {:} ========'.format(epoch_i + 1, epochs))\n",
" print('Training...')\n",
"\n",
" t0 = time.time()\n",
"\n",
" total_train_loss = 0\n",
"\n",
" model.train()\n",
"\n",
" for step, batch in enumerate(train_dataloader):\n",
"\n",
" b_input_ids = batch[0].to(device)\n",
" b_labels = batch[0].to(device)\n",
" b_masks = batch[1].to(device)\n",
"\n",
" model.zero_grad()\n",
"\n",
" outputs = model( b_input_ids,\n",
" labels=b_labels,\n",
" attention_mask = b_masks,\n",
" token_type_ids=None\n",
" )\n",
"\n",
" loss = outputs[0]\n",
"\n",
" batch_loss = loss.item()\n",
" total_train_loss += batch_loss\n",
"\n",
" loss.backward()\n",
"\n",
" optimizer.step()\n",
"\n",
" scheduler.step()\n",
"\n",
" # Calculate the average loss over all of the batches.\n",
" avg_train_loss = total_train_loss / len(train_dataloader)\n",
"\n",
" # Measure how long this epoch took.\n",
" training_time = format_time(time.time() - t0)\n",
"\n",
" print(\"\")\n",
" print(\" Average training loss: {0:.2f}\".format(avg_train_loss))\n",
" print(\" Training epoch took: {:}\".format(training_time))\n",
"\n",
" # ========================================\n",
" # Validation\n",
" # ========================================\n",
"\n",
" print(\"\")\n",
" print(\"Running Validation...\")\n",
"\n",
" t0 = time.time()\n",
"\n",
" model.eval()\n",
"\n",
" total_eval_loss = 0\n",
" nb_eval_steps = 0\n",
"\n",
" # Evaluate data for one epoch\n",
" for batch in validation_dataloader:\n",
"\n",
" b_input_ids = batch[0].to(device)\n",
" b_labels = batch[0].to(device)\n",
" b_masks = batch[1].to(device)\n",
"\n",
" with torch.no_grad():\n",
"\n",
" outputs = model(b_input_ids,\n",
"# token_type_ids=None,\n",
" attention_mask = b_masks,\n",
" labels=b_labels)\n",
"\n",
" loss = outputs[0]\n",
"\n",
" batch_loss = loss.item()\n",
" total_eval_loss += batch_loss\n",
"\n",
" avg_val_loss = total_eval_loss / len(validation_dataloader)\n",
"\n",
" validation_time = format_time(time.time() - t0)\n",
"\n",
" print(\" Validation Loss: {0:.2f}\".format(avg_val_loss))\n",
" print(\" Validation took: {:}\".format(validation_time))\n",
"\n",
" # Record all statistics from this epoch.\n",
" training_stats.append(\n",
" {\n",
" 'epoch': epoch_i + 1,\n",
" 'Training Loss': avg_train_loss,\n",
" 'Valid. Loss': avg_val_loss,\n",
" 'Training Time': training_time,\n",
" 'Validation Time': validation_time\n",
" }\n",
" )\n",
"\n",
"print(\"\")\n",
"print(\"Training complete!\")\n",
"print(\"Total training took {:} (h:mm:ss)\".format(format_time(time.time()-total_t0)))"
]
},
{
"cell_type": "code",
"execution_count": 14,
"metadata": {
"colab": {
"base_uri": "https://localhost:8080/"
2023-06-18 18:22:31 +02:00
},
2023-06-18 22:44:55 +02:00
"id": "YUAZReU3jPwm",
"outputId": "9fbaccdd-cd3f-4231-f960-e4457f23aeba"
},
"outputs": [],
"source": [
"model.eval()\n",
"\n",
"input_text = \"question: Czy życie ma jakiś sens?\\nanswer:\"\n",
"input_ids = tokenizer.encode(input_text, return_tensors='pt')\n",
"input_ids = input_ids.to(device)\n",
"\n",
"output = model.generate(input_ids, max_length=100, early_stopping=True)\n",
"\n",
"generated_text = tokenizer.decode(output[0], skip_special_tokens=True)\n",
"print(generated_text)\n"
]
},
{
"cell_type": "markdown",
"metadata": {
"id": "PaV10cc01n_N"
},
"source": [
"# Zapisanie modelu"
]
},
{
"cell_type": "code",
"execution_count": 33,
"metadata": {
"colab": {
"base_uri": "https://localhost:8080/"
2023-06-18 18:22:31 +02:00
},
2023-06-18 22:44:55 +02:00
"id": "5Z42j32m1iUF",
"outputId": "3cd21c7c-dd84-4314-8aa4-2671e1f02edd"
},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"Saving model to model_save/\n"
]
2023-06-18 18:22:31 +02:00
},
2023-06-18 22:44:55 +02:00
{
"data": {
"text/plain": [
"('model_save/tokenizer_config.json',\n",
" 'model_save/special_tokens_map.json',\n",
" 'model_save/vocab.json',\n",
" 'model_save/merges.txt',\n",
" 'model_save/added_tokens.json',\n",
" 'model_save/tokenizer.json')"
]
},
"execution_count": 33,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"import os\n",
"\n",
"# Saving best-practices: if you use defaults names for the model, you can reload it using from_pretrained()\n",
"\n",
"output_dir = 'model_save/'\n",
"\n",
"# Create output directory if needed\n",
"if not os.path.exists(output_dir):\n",
" os.makedirs(output_dir)\n",
"\n",
"print(\"Saving model to %s\" % output_dir)\n",
"\n",
"# Save a trained model, configuration and tokenizer using `save_pretrained()`.\n",
"# They can then be reloaded using `from_pretrained()`\n",
"model_to_save = model.module if hasattr(model, 'module') else model # Take care of distributed/parallel training\n",
"model_to_save.save_pretrained(output_dir)\n",
"tokenizer.save_pretrained(output_dir)"
]
},
{
"cell_type": "code",
"execution_count": null,
"metadata": {},
"outputs": [],
"source": []
}
],
"metadata": {
"accelerator": "GPU",
"colab": {
"gpuType": "T4",
"provenance": []
},
"kernelspec": {
"display_name": "Python 3",
"name": "python3"
},
"language_info": {
"codemirror_mode": {
"name": "ipython",
"version": 3
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.8.15"
},
"widgets": {
"application/vnd.jupyter.widget-state+json": {
"01e1e799e775450694e2842d87bbc871": {
2023-06-18 18:22:31 +02:00
"model_module": "@jupyter-widgets/controls",
"model_module_version": "1.5.0",
2023-06-18 22:44:55 +02:00
"model_name": "FloatProgressModel",
2023-06-18 18:22:31 +02:00
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
2023-06-18 22:44:55 +02:00
"_model_name": "FloatProgressModel",
2023-06-18 18:22:31 +02:00
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
2023-06-18 22:44:55 +02:00
"_view_name": "ProgressView",
"bar_style": "success",
2023-06-18 18:22:31 +02:00
"description": "",
"description_tooltip": null,
2023-06-18 22:44:55 +02:00
"layout": "IPY_MODEL_b7b911c6bca94858bb93ffbcb1daa736",
"max": 208,
"min": 0,
"orientation": "horizontal",
"style": "IPY_MODEL_4b7636fbfe854056acadd394d71cde75",
"value": 208
2023-06-18 18:22:31 +02:00
}
},
2023-06-18 22:44:55 +02:00
"04e5f6b3190740dd85bedac661c67770": {
2023-06-18 18:22:31 +02:00
"model_module": "@jupyter-widgets/controls",
"model_module_version": "1.5.0",
2023-06-18 22:44:55 +02:00
"model_name": "FloatProgressModel",
2023-06-18 18:22:31 +02:00
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "FloatProgressModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
"_view_name": "ProgressView",
"bar_style": "success",
"description": "",
"description_tooltip": null,
2023-06-18 22:44:55 +02:00
"layout": "IPY_MODEL_7e3d164400b342c897b4e647da36a02e",
"max": 864,
2023-06-18 18:22:31 +02:00
"min": 0,
"orientation": "horizontal",
2023-06-18 22:44:55 +02:00
"style": "IPY_MODEL_eadd02efcb204b20b3bfd8e99cde9ae3",
"value": 864
2023-06-18 18:22:31 +02:00
}
},
2023-06-18 22:44:55 +02:00
"05032586bc4d4f8c9a1fa023695e60ec": {
2023-06-18 18:22:31 +02:00
"model_module": "@jupyter-widgets/controls",
"model_module_version": "1.5.0",
2023-06-18 22:44:55 +02:00
"model_name": "DescriptionStyleModel",
2023-06-18 18:22:31 +02:00
"state": {
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
2023-06-18 22:44:55 +02:00
"_model_name": "DescriptionStyleModel",
2023-06-18 18:22:31 +02:00
"_view_count": null,
2023-06-18 22:44:55 +02:00
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "StyleView",
"description_width": ""
2023-06-18 18:22:31 +02:00
}
},
2023-06-18 22:44:55 +02:00
"06b012d7bd5b418eb74d89ba51dbc690": {
"model_module": "@jupyter-widgets/controls",
"model_module_version": "1.5.0",
"model_name": "DescriptionStyleModel",
"state": {
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "DescriptionStyleModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "StyleView",
"description_width": ""
}
},
"083cd7a3ebb34bbf8940af58359a4848": {
2023-06-18 18:22:31 +02:00
"model_module": "@jupyter-widgets/base",
"model_module_version": "1.2.0",
2023-06-18 22:44:55 +02:00
"model_name": "LayoutModel",
2023-06-18 18:22:31 +02:00
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
},
2023-06-18 22:44:55 +02:00
"0853024b81894cc79c7f6b8de97c5c5b": {
2023-06-18 18:22:31 +02:00
"model_module": "@jupyter-widgets/base",
"model_module_version": "1.2.0",
2023-06-18 22:44:55 +02:00
"model_name": "LayoutModel",
2023-06-18 18:22:31 +02:00
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
},
2023-06-18 22:44:55 +02:00
"08c86037bfe442079bb79321147a73df": {
2023-06-18 18:22:31 +02:00
"model_module": "@jupyter-widgets/controls",
"model_module_version": "1.5.0",
2023-06-18 22:44:55 +02:00
"model_name": "HTMLModel",
2023-06-18 18:22:31 +02:00
"state": {
2023-06-18 22:44:55 +02:00
"_dom_classes": [],
2023-06-18 18:22:31 +02:00
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
2023-06-18 22:44:55 +02:00
"_model_name": "HTMLModel",
2023-06-18 18:22:31 +02:00
"_view_count": null,
2023-06-18 22:44:55 +02:00
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
"_view_name": "HTMLView",
"description": "",
"description_tooltip": null,
"layout": "IPY_MODEL_17b70c7ee49f477cacf15abe01d88905",
"placeholder": " ",
"style": "IPY_MODEL_7c0ca4701ce64754b5f31663458e925b",
"value": " 90.0/90.0 [00:00<00:00, 5.53kB/s]"
}
},
"0f75959ab6364a60b229051f0d5b2c68": {
"model_module": "@jupyter-widgets/controls",
"model_module_version": "1.5.0",
"model_name": "HTMLModel",
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "HTMLModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
"_view_name": "HTMLView",
"description": "",
"description_tooltip": null,
"layout": "IPY_MODEL_7e58b084511e4232a0d197539306c57f",
"placeholder": " ",
"style": "IPY_MODEL_7e8ca657aedb41da9a99c3d3d648ea00",
"value": " 547k/547k [00:00<00:00, 23.4MB/s]"
2023-06-18 18:22:31 +02:00
}
},
2023-06-18 22:44:55 +02:00
"109145210ff64132a36601470b3e24e6": {
2023-06-18 18:22:31 +02:00
"model_module": "@jupyter-widgets/base",
"model_module_version": "1.2.0",
2023-06-18 22:44:55 +02:00
"model_name": "LayoutModel",
2023-06-18 18:22:31 +02:00
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
},
2023-06-18 22:44:55 +02:00
"1498b932de1b4a5f922395ecf3b437a9": {
2023-06-18 18:22:31 +02:00
"model_module": "@jupyter-widgets/controls",
"model_module_version": "1.5.0",
2023-06-18 22:44:55 +02:00
"model_name": "DescriptionStyleModel",
2023-06-18 18:22:31 +02:00
"state": {
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
2023-06-18 22:44:55 +02:00
"_model_name": "DescriptionStyleModel",
2023-06-18 18:22:31 +02:00
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "StyleView",
"description_width": ""
}
},
2023-06-18 22:44:55 +02:00
"14b26d9b078f4a919f09f8133e5dd22d": {
2023-06-18 18:22:31 +02:00
"model_module": "@jupyter-widgets/base",
"model_module_version": "1.2.0",
2023-06-18 22:44:55 +02:00
"model_name": "LayoutModel",
2023-06-18 18:22:31 +02:00
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
},
2023-06-18 22:44:55 +02:00
"164ae1d73d4b461fb27c0401b8ce09fe": {
2023-06-18 18:22:31 +02:00
"model_module": "@jupyter-widgets/base",
"model_module_version": "1.2.0",
2023-06-18 22:44:55 +02:00
"model_name": "LayoutModel",
2023-06-18 18:22:31 +02:00
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
},
2023-06-18 22:44:55 +02:00
"17b70c7ee49f477cacf15abe01d88905": {
2023-06-18 18:22:31 +02:00
"model_module": "@jupyter-widgets/base",
"model_module_version": "1.2.0",
2023-06-18 22:44:55 +02:00
"model_name": "LayoutModel",
2023-06-18 18:22:31 +02:00
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
},
2023-06-18 22:44:55 +02:00
"1eefecffe6124ad6b835ed579a0adfa5": {
2023-06-18 18:22:31 +02:00
"model_module": "@jupyter-widgets/controls",
"model_module_version": "1.5.0",
2023-06-18 22:44:55 +02:00
"model_name": "DescriptionStyleModel",
2023-06-18 18:22:31 +02:00
"state": {
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "DescriptionStyleModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "StyleView",
"description_width": ""
}
},
2023-06-18 22:44:55 +02:00
"2264a5b9de1d4e93acbdbd84c3abf040": {
2023-06-18 18:22:31 +02:00
"model_module": "@jupyter-widgets/base",
"model_module_version": "1.2.0",
2023-06-18 22:44:55 +02:00
"model_name": "LayoutModel",
2023-06-18 18:22:31 +02:00
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
},
2023-06-18 22:44:55 +02:00
"244faf9363794c0a86175f72fb63655f": {
2023-06-18 18:22:31 +02:00
"model_module": "@jupyter-widgets/controls",
"model_module_version": "1.5.0",
2023-06-18 22:44:55 +02:00
"model_name": "HTMLModel",
2023-06-18 18:22:31 +02:00
"state": {
2023-06-18 22:44:55 +02:00
"_dom_classes": [],
2023-06-18 18:22:31 +02:00
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
2023-06-18 22:44:55 +02:00
"_model_name": "HTMLModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
"_view_name": "HTMLView",
"description": "",
"description_tooltip": null,
"layout": "IPY_MODEL_afc4c68e30a14d74b7c1547f02570baf",
"placeholder": " ",
"style": "IPY_MODEL_57763424d94a4384b4fa4c762062b6ba",
"value": " 208/208 [00:00<00:00, 7.73kB/s]"
}
},
"2a67736c8e3a481aa139b021a89140ab": {
"model_module": "@jupyter-widgets/controls",
"model_module_version": "1.5.0",
"model_name": "DescriptionStyleModel",
"state": {
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "DescriptionStyleModel",
2023-06-18 18:22:31 +02:00
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "StyleView",
"description_width": ""
}
},
2023-06-18 22:44:55 +02:00
"2e154a9d0eeb45c38728084edb841a29": {
2023-06-18 18:22:31 +02:00
"model_module": "@jupyter-widgets/base",
"model_module_version": "1.2.0",
2023-06-18 22:44:55 +02:00
"model_name": "LayoutModel",
2023-06-18 18:22:31 +02:00
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
},
2023-06-18 22:44:55 +02:00
"2fa8106d87594af283e5b74915003783": {
"model_module": "@jupyter-widgets/controls",
"model_module_version": "1.5.0",
"model_name": "HTMLModel",
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "HTMLModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
"_view_name": "HTMLView",
"description": "",
"description_tooltip": null,
"layout": "IPY_MODEL_f125275065c64b6ca55f0767737a488a",
"placeholder": " ",
"style": "IPY_MODEL_06b012d7bd5b418eb74d89ba51dbc690",
"value": "Downloading config.json: 100%"
}
},
"31ec83a1244d416ba8cfe922748b7e55": {
"model_module": "@jupyter-widgets/controls",
"model_module_version": "1.5.0",
"model_name": "HBoxModel",
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "HBoxModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
"_view_name": "HBoxView",
"box_style": "",
"children": [
"IPY_MODEL_3d41103299d5441184b2890a8a52b6ec",
"IPY_MODEL_01e1e799e775450694e2842d87bbc871",
"IPY_MODEL_244faf9363794c0a86175f72fb63655f"
],
"layout": "IPY_MODEL_14b26d9b078f4a919f09f8133e5dd22d"
}
},
"3219d928e9e14e4ba95bf2aad70162a3": {
"model_module": "@jupyter-widgets/controls",
"model_module_version": "1.5.0",
"model_name": "HTMLModel",
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "HTMLModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
"_view_name": "HTMLView",
"description": "",
"description_tooltip": null,
"layout": "IPY_MODEL_98e047a8134f4502bb134beb26ffe821",
"placeholder": " ",
"style": "IPY_MODEL_ad3e29e3250a4323b715a7ffe279c799",
"value": " 1.54M/1.54M [00:00<00:00, 54.3MB/s]"
}
},
"3530c50e41b54531b12d04c807d3924a": {
"model_module": "@jupyter-widgets/controls",
"model_module_version": "1.5.0",
"model_name": "HTMLModel",
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "HTMLModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
"_view_name": "HTMLView",
"description": "",
"description_tooltip": null,
"layout": "IPY_MODEL_59d4ec3a13844c878d4e95896a37121d",
"placeholder": " ",
"style": "IPY_MODEL_1498b932de1b4a5f922395ecf3b437a9",
"value": "Downloading tokenizer.json: 100%"
}
},
"367f3aae32ab4e1b9f67f3cd29299c5b": {
2023-06-18 18:22:31 +02:00
"model_module": "@jupyter-widgets/controls",
"model_module_version": "1.5.0",
2023-06-18 22:44:55 +02:00
"model_name": "ProgressStyleModel",
2023-06-18 18:22:31 +02:00
"state": {
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
2023-06-18 22:44:55 +02:00
"_model_name": "ProgressStyleModel",
2023-06-18 18:22:31 +02:00
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "StyleView",
2023-06-18 22:44:55 +02:00
"bar_color": null,
2023-06-18 18:22:31 +02:00
"description_width": ""
}
},
2023-06-18 22:44:55 +02:00
"37c645ebeb934c8db572d4b4da63f280": {
"model_module": "@jupyter-widgets/controls",
"model_module_version": "1.5.0",
"model_name": "HTMLModel",
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "HTMLModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
"_view_name": "HTMLView",
"description": "",
"description_tooltip": null,
"layout": "IPY_MODEL_2264a5b9de1d4e93acbdbd84c3abf040",
"placeholder": " ",
"style": "IPY_MODEL_e863997d8ce142798230810e384323ba",
"value": " 864/864 [00:00<00:00, 36.3kB/s]"
}
},
"3a9bbce5adf04b77beed6eb10211551f": {
2023-06-18 18:22:31 +02:00
"model_module": "@jupyter-widgets/controls",
"model_module_version": "1.5.0",
2023-06-18 22:44:55 +02:00
"model_name": "HBoxModel",
2023-06-18 18:22:31 +02:00
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "HBoxModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
"_view_name": "HBoxView",
"box_style": "",
"children": [
2023-06-18 22:44:55 +02:00
"IPY_MODEL_9125492ba517409eb77722982d57b948",
"IPY_MODEL_ff2160ef3ab14d4682cfbb1b878af62f",
"IPY_MODEL_52d637c25ad84c6fae643fe7f687f63a"
2023-06-18 18:22:31 +02:00
],
2023-06-18 22:44:55 +02:00
"layout": "IPY_MODEL_a87573424cf0463a85b56271931d6dc8"
2023-06-18 18:22:31 +02:00
}
},
2023-06-18 22:44:55 +02:00
"3ade165824644044bb922256c3773156": {
2023-06-18 18:22:31 +02:00
"model_module": "@jupyter-widgets/controls",
"model_module_version": "1.5.0",
2023-06-18 22:44:55 +02:00
"model_name": "HBoxModel",
2023-06-18 18:22:31 +02:00
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
2023-06-18 22:44:55 +02:00
"_model_name": "HBoxModel",
2023-06-18 18:22:31 +02:00
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
2023-06-18 22:44:55 +02:00
"_view_name": "HBoxView",
"box_style": "",
"children": [
"IPY_MODEL_6c924e348934452887581e23151c7ebb",
"IPY_MODEL_85a446e817c943c7a26e40a7ad8f511f",
"IPY_MODEL_08c86037bfe442079bb79321147a73df"
],
"layout": "IPY_MODEL_d3f1817bcb0a4e8a85e0515898c13850"
2023-06-18 18:22:31 +02:00
}
},
2023-06-18 22:44:55 +02:00
"3b6bfbe260a9403c8216269b5032cde4": {
2023-06-18 18:22:31 +02:00
"model_module": "@jupyter-widgets/controls",
"model_module_version": "1.5.0",
2023-06-18 22:44:55 +02:00
"model_name": "HTMLModel",
2023-06-18 18:22:31 +02:00
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
2023-06-18 22:44:55 +02:00
"_model_name": "HTMLModel",
2023-06-18 18:22:31 +02:00
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
2023-06-18 22:44:55 +02:00
"_view_name": "HTMLView",
2023-06-18 18:22:31 +02:00
"description": "",
"description_tooltip": null,
2023-06-18 22:44:55 +02:00
"layout": "IPY_MODEL_eb4e61e04bc04929be057a5a960feb9d",
"placeholder": " ",
"style": "IPY_MODEL_b7ef949a1eb0469fb0bd1be5256fa79a",
"value": "Downloading merges.txt: 100%"
2023-06-18 18:22:31 +02:00
}
},
2023-06-18 22:44:55 +02:00
"3d41103299d5441184b2890a8a52b6ec": {
2023-06-18 18:22:31 +02:00
"model_module": "@jupyter-widgets/controls",
"model_module_version": "1.5.0",
2023-06-18 22:44:55 +02:00
"model_name": "HTMLModel",
2023-06-18 18:22:31 +02:00
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "HTMLModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
"_view_name": "HTMLView",
"description": "",
"description_tooltip": null,
2023-06-18 22:44:55 +02:00
"layout": "IPY_MODEL_109145210ff64132a36601470b3e24e6",
2023-06-18 18:22:31 +02:00
"placeholder": " ",
2023-06-18 22:44:55 +02:00
"style": "IPY_MODEL_1eefecffe6124ad6b835ed579a0adfa5",
"value": "Downloading tokenizer_config.json: 100%"
2023-06-18 18:22:31 +02:00
}
},
2023-06-18 22:44:55 +02:00
"4757bdb315e04fb982ac45e0a26a7c2d": {
2023-06-18 18:22:31 +02:00
"model_module": "@jupyter-widgets/base",
"model_module_version": "1.2.0",
2023-06-18 22:44:55 +02:00
"model_name": "LayoutModel",
2023-06-18 18:22:31 +02:00
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
},
2023-06-18 22:44:55 +02:00
"4b7636fbfe854056acadd394d71cde75": {
"model_module": "@jupyter-widgets/controls",
"model_module_version": "1.5.0",
"model_name": "ProgressStyleModel",
"state": {
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "ProgressStyleModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "StyleView",
"bar_color": null,
"description_width": ""
}
},
"4e16ca13c2dd46069b65dd48f3da8790": {
"model_module": "@jupyter-widgets/controls",
"model_module_version": "1.5.0",
"model_name": "ProgressStyleModel",
"state": {
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "ProgressStyleModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "StyleView",
"bar_color": null,
"description_width": ""
}
},
"52d637c25ad84c6fae643fe7f687f63a": {
"model_module": "@jupyter-widgets/controls",
"model_module_version": "1.5.0",
"model_name": "HTMLModel",
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "HTMLModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
"_view_name": "HTMLView",
"description": "",
"description_tooltip": null,
"layout": "IPY_MODEL_b6aa40c7501f44178f14ac88b63f57cb",
"placeholder": " ",
"style": "IPY_MODEL_984a17db21ee4aa898323ecde9c14f16",
"value": " 888k/888k [00:00<00:00, 30.5MB/s]"
}
},
"53f98231a2c140efbd0a1d2d25367b1f": {
2023-06-18 18:22:31 +02:00
"model_module": "@jupyter-widgets/base",
"model_module_version": "1.2.0",
2023-06-18 22:44:55 +02:00
"model_name": "LayoutModel",
2023-06-18 18:22:31 +02:00
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
},
2023-06-18 22:44:55 +02:00
"57763424d94a4384b4fa4c762062b6ba": {
2023-06-18 18:22:31 +02:00
"model_module": "@jupyter-widgets/controls",
"model_module_version": "1.5.0",
2023-06-18 22:44:55 +02:00
"model_name": "DescriptionStyleModel",
2023-06-18 18:22:31 +02:00
"state": {
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "DescriptionStyleModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "StyleView",
"description_width": ""
}
},
2023-06-18 22:44:55 +02:00
"59d4ec3a13844c878d4e95896a37121d": {
2023-06-18 18:22:31 +02:00
"model_module": "@jupyter-widgets/base",
"model_module_version": "1.2.0",
2023-06-18 22:44:55 +02:00
"model_name": "LayoutModel",
2023-06-18 18:22:31 +02:00
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
},
2023-06-18 22:44:55 +02:00
"5c71295523ea4561a6fe8534c0b160e2": {
2023-06-18 18:22:31 +02:00
"model_module": "@jupyter-widgets/controls",
"model_module_version": "1.5.0",
2023-06-18 22:44:55 +02:00
"model_name": "HBoxModel",
2023-06-18 18:22:31 +02:00
"state": {
2023-06-18 22:44:55 +02:00
"_dom_classes": [],
2023-06-18 18:22:31 +02:00
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
2023-06-18 22:44:55 +02:00
"_model_name": "HBoxModel",
2023-06-18 18:22:31 +02:00
"_view_count": null,
2023-06-18 22:44:55 +02:00
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
"_view_name": "HBoxView",
"box_style": "",
"children": [
"IPY_MODEL_c62c829fa4f346f4966f68e020c50813",
"IPY_MODEL_f10ed53b98304b6197789308330e1bf8",
"IPY_MODEL_9516994367bc488faeae786254eff8c7"
],
"layout": "IPY_MODEL_f95ffcc1b9564519aa1f1c81e2d16dbf"
2023-06-18 18:22:31 +02:00
}
},
2023-06-18 22:44:55 +02:00
"5cfa6f79da7e47639bfdea6d8f70dd7d": {
"model_module": "@jupyter-widgets/controls",
"model_module_version": "1.5.0",
"model_name": "HBoxModel",
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "HBoxModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
"_view_name": "HBoxView",
"box_style": "",
"children": [
"IPY_MODEL_3530c50e41b54531b12d04c807d3924a",
"IPY_MODEL_b6afee105c69499f98cf0544ffe325cb",
"IPY_MODEL_3219d928e9e14e4ba95bf2aad70162a3"
],
"layout": "IPY_MODEL_0853024b81894cc79c7f6b8de97c5c5b"
}
},
"6bb99699d0614c83b588a7dd65351c1c": {
2023-06-18 18:22:31 +02:00
"model_module": "@jupyter-widgets/base",
"model_module_version": "1.2.0",
2023-06-18 22:44:55 +02:00
"model_name": "LayoutModel",
2023-06-18 18:22:31 +02:00
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
2023-06-18 22:44:55 +02:00
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
2023-06-18 18:22:31 +02:00
}
},
2023-06-18 22:44:55 +02:00
"6c924e348934452887581e23151c7ebb": {
2023-06-18 18:22:31 +02:00
"model_module": "@jupyter-widgets/controls",
"model_module_version": "1.5.0",
2023-06-18 22:44:55 +02:00
"model_name": "HTMLModel",
2023-06-18 18:22:31 +02:00
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "HTMLModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
"_view_name": "HTMLView",
"description": "",
"description_tooltip": null,
2023-06-18 22:44:55 +02:00
"layout": "IPY_MODEL_2e154a9d0eeb45c38728084edb841a29",
2023-06-18 18:22:31 +02:00
"placeholder": " ",
2023-06-18 22:44:55 +02:00
"style": "IPY_MODEL_2a67736c8e3a481aa139b021a89140ab",
"value": "Downloading (…)cial_tokens_map.json: 100%"
2023-06-18 18:22:31 +02:00
}
},
2023-06-18 22:44:55 +02:00
"6e3c14738f864803b0f95cd940f23d9e": {
2023-06-18 18:22:31 +02:00
"model_module": "@jupyter-widgets/controls",
"model_module_version": "1.5.0",
2023-06-18 22:44:55 +02:00
"model_name": "DescriptionStyleModel",
2023-06-18 18:22:31 +02:00
"state": {
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
2023-06-18 22:44:55 +02:00
"_model_name": "DescriptionStyleModel",
2023-06-18 18:22:31 +02:00
"_view_count": null,
2023-06-18 22:44:55 +02:00
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "StyleView",
"description_width": ""
2023-06-18 18:22:31 +02:00
}
},
2023-06-18 22:44:55 +02:00
"7c0ca4701ce64754b5f31663458e925b": {
2023-06-18 18:22:31 +02:00
"model_module": "@jupyter-widgets/controls",
"model_module_version": "1.5.0",
2023-06-18 22:44:55 +02:00
"model_name": "DescriptionStyleModel",
2023-06-18 18:22:31 +02:00
"state": {
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
2023-06-18 22:44:55 +02:00
"_model_name": "DescriptionStyleModel",
2023-06-18 18:22:31 +02:00
"_view_count": null,
2023-06-18 22:44:55 +02:00
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "StyleView",
"description_width": ""
2023-06-18 18:22:31 +02:00
}
},
2023-06-18 22:44:55 +02:00
"7e3d164400b342c897b4e647da36a02e": {
2023-06-18 18:22:31 +02:00
"model_module": "@jupyter-widgets/base",
"model_module_version": "1.2.0",
2023-06-18 22:44:55 +02:00
"model_name": "LayoutModel",
2023-06-18 18:22:31 +02:00
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
},
2023-06-18 22:44:55 +02:00
"7e56e3fd676440d0a23ca09f8b5c7d4e": {
2023-06-18 18:22:31 +02:00
"model_module": "@jupyter-widgets/base",
"model_module_version": "1.2.0",
2023-06-18 22:44:55 +02:00
"model_name": "LayoutModel",
2023-06-18 18:22:31 +02:00
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
},
2023-06-18 22:44:55 +02:00
"7e58b084511e4232a0d197539306c57f": {
2023-06-18 18:22:31 +02:00
"model_module": "@jupyter-widgets/base",
"model_module_version": "1.2.0",
2023-06-18 22:44:55 +02:00
"model_name": "LayoutModel",
2023-06-18 18:22:31 +02:00
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
},
2023-06-18 22:44:55 +02:00
"7e8ca657aedb41da9a99c3d3d648ea00": {
2023-06-18 18:22:31 +02:00
"model_module": "@jupyter-widgets/controls",
"model_module_version": "1.5.0",
2023-06-18 22:44:55 +02:00
"model_name": "DescriptionStyleModel",
2023-06-18 18:22:31 +02:00
"state": {
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
2023-06-18 22:44:55 +02:00
"_model_name": "DescriptionStyleModel",
2023-06-18 18:22:31 +02:00
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "StyleView",
"description_width": ""
}
},
2023-06-18 22:44:55 +02:00
"825fd5e9a017439995c67dcb3a7736b9": {
2023-06-18 18:22:31 +02:00
"model_module": "@jupyter-widgets/base",
"model_module_version": "1.2.0",
2023-06-18 22:44:55 +02:00
"model_name": "LayoutModel",
2023-06-18 18:22:31 +02:00
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
},
2023-06-18 22:44:55 +02:00
"855d7b31b1a44fb9b667e84f30bd121a": {
2023-06-18 18:22:31 +02:00
"model_module": "@jupyter-widgets/controls",
"model_module_version": "1.5.0",
2023-06-18 22:44:55 +02:00
"model_name": "ProgressStyleModel",
2023-06-18 18:22:31 +02:00
"state": {
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
2023-06-18 22:44:55 +02:00
"_model_name": "ProgressStyleModel",
2023-06-18 18:22:31 +02:00
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "StyleView",
2023-06-18 22:44:55 +02:00
"bar_color": null,
2023-06-18 18:22:31 +02:00
"description_width": ""
}
},
2023-06-18 22:44:55 +02:00
"85a446e817c943c7a26e40a7ad8f511f": {
2023-06-18 18:22:31 +02:00
"model_module": "@jupyter-widgets/controls",
"model_module_version": "1.5.0",
2023-06-18 22:44:55 +02:00
"model_name": "FloatProgressModel",
2023-06-18 18:22:31 +02:00
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
2023-06-18 22:44:55 +02:00
"_model_name": "FloatProgressModel",
2023-06-18 18:22:31 +02:00
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
2023-06-18 22:44:55 +02:00
"_view_name": "ProgressView",
"bar_style": "success",
"description": "",
"description_tooltip": null,
"layout": "IPY_MODEL_6bb99699d0614c83b588a7dd65351c1c",
"max": 90,
"min": 0,
"orientation": "horizontal",
"style": "IPY_MODEL_f380816f81d046b880b12a429d624c2f",
"value": 90
2023-06-18 18:22:31 +02:00
}
},
2023-06-18 22:44:55 +02:00
"8adaa113d54247388e1355331451926a": {
2023-06-18 18:22:31 +02:00
"model_module": "@jupyter-widgets/controls",
"model_module_version": "1.5.0",
2023-06-18 22:44:55 +02:00
"model_name": "FloatProgressModel",
2023-06-18 18:22:31 +02:00
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
2023-06-18 22:44:55 +02:00
"_model_name": "FloatProgressModel",
2023-06-18 18:22:31 +02:00
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
2023-06-18 22:44:55 +02:00
"_view_name": "ProgressView",
"bar_style": "success",
2023-06-18 18:22:31 +02:00
"description": "",
"description_tooltip": null,
2023-06-18 22:44:55 +02:00
"layout": "IPY_MODEL_fc1af3db81b243178157ee330f62ff3c",
"max": 510401385,
"min": 0,
"orientation": "horizontal",
"style": "IPY_MODEL_a46138f2b04c4418816fa264c3deb892",
"value": 510401385
2023-06-18 18:22:31 +02:00
}
},
2023-06-18 22:44:55 +02:00
"9125492ba517409eb77722982d57b948": {
2023-06-18 18:22:31 +02:00
"model_module": "@jupyter-widgets/controls",
"model_module_version": "1.5.0",
2023-06-18 22:44:55 +02:00
"model_name": "HTMLModel",
2023-06-18 18:22:31 +02:00
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
2023-06-18 22:44:55 +02:00
"_model_name": "HTMLModel",
2023-06-18 18:22:31 +02:00
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
2023-06-18 22:44:55 +02:00
"_view_name": "HTMLView",
2023-06-18 18:22:31 +02:00
"description": "",
"description_tooltip": null,
2023-06-18 22:44:55 +02:00
"layout": "IPY_MODEL_95dc4d80e12c4020bdd8f5d849107cf5",
"placeholder": " ",
"style": "IPY_MODEL_c1d658d5f21f4731895b397cc3fcb055",
"value": "Downloading vocab.json: 100%"
2023-06-18 18:22:31 +02:00
}
},
"9516994367bc488faeae786254eff8c7": {
"model_module": "@jupyter-widgets/controls",
"model_module_version": "1.5.0",
2023-06-18 22:44:55 +02:00
"model_name": "HTMLModel",
2023-06-18 18:22:31 +02:00
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "HTMLModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
"_view_name": "HTMLView",
"description": "",
"description_tooltip": null,
"layout": "IPY_MODEL_164ae1d73d4b461fb27c0401b8ce09fe",
"placeholder": " ",
"style": "IPY_MODEL_6e3c14738f864803b0f95cd940f23d9e",
"value": " 24.0/24.0 [00:00<00:00, 1.62kB/s]"
}
},
2023-06-18 22:44:55 +02:00
"95dc4d80e12c4020bdd8f5d849107cf5": {
2023-06-18 18:22:31 +02:00
"model_module": "@jupyter-widgets/base",
2023-06-18 22:44:55 +02:00
"model_module_version": "1.2.0",
2023-06-18 18:22:31 +02:00
"model_name": "LayoutModel",
2023-06-18 22:44:55 +02:00
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
},
"984a17db21ee4aa898323ecde9c14f16": {
"model_module": "@jupyter-widgets/controls",
"model_module_version": "1.5.0",
"model_name": "DescriptionStyleModel",
"state": {
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "DescriptionStyleModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "StyleView",
"description_width": ""
}
},
"98e047a8134f4502bb134beb26ffe821": {
"model_module": "@jupyter-widgets/base",
2023-06-18 18:22:31 +02:00
"model_module_version": "1.2.0",
2023-06-18 22:44:55 +02:00
"model_name": "LayoutModel",
2023-06-18 18:22:31 +02:00
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
},
2023-06-18 22:44:55 +02:00
"a46138f2b04c4418816fa264c3deb892": {
"model_module": "@jupyter-widgets/controls",
"model_module_version": "1.5.0",
"model_name": "ProgressStyleModel",
"state": {
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "ProgressStyleModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "StyleView",
"bar_color": null,
"description_width": ""
}
},
"a7d258bfe8644c38a56ca365ea9e4ab1": {
"model_module": "@jupyter-widgets/controls",
"model_module_version": "1.5.0",
"model_name": "FloatProgressModel",
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "FloatProgressModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
"_view_name": "ProgressView",
"bar_style": "success",
"description": "",
"description_tooltip": null,
"layout": "IPY_MODEL_f7687d83ee0149248610c40d4d86d944",
"max": 546522,
"min": 0,
"orientation": "horizontal",
"style": "IPY_MODEL_bfa116bd3e144c15b67bd97ff3c85fea",
"value": 546522
}
},
"a87573424cf0463a85b56271931d6dc8": {
2023-06-18 18:22:31 +02:00
"model_module": "@jupyter-widgets/base",
"model_module_version": "1.2.0",
2023-06-18 22:44:55 +02:00
"model_name": "LayoutModel",
2023-06-18 18:22:31 +02:00
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
},
2023-06-18 22:44:55 +02:00
"ac800b679bdc4382b28cbcf9c68303f0": {
"model_module": "@jupyter-widgets/controls",
"model_module_version": "1.5.0",
"model_name": "HBoxModel",
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "HBoxModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
"_view_name": "HBoxView",
"box_style": "",
"children": [
"IPY_MODEL_2fa8106d87594af283e5b74915003783",
"IPY_MODEL_04e5f6b3190740dd85bedac661c67770",
"IPY_MODEL_37c645ebeb934c8db572d4b4da63f280"
],
"layout": "IPY_MODEL_4757bdb315e04fb982ac45e0a26a7c2d"
}
},
"ad3e29e3250a4323b715a7ffe279c799": {
2023-06-18 18:22:31 +02:00
"model_module": "@jupyter-widgets/controls",
"model_module_version": "1.5.0",
2023-06-18 22:44:55 +02:00
"model_name": "DescriptionStyleModel",
2023-06-18 18:22:31 +02:00
"state": {
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "DescriptionStyleModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "StyleView",
"description_width": ""
}
},
2023-06-18 22:44:55 +02:00
"afc4c68e30a14d74b7c1547f02570baf": {
2023-06-18 18:22:31 +02:00
"model_module": "@jupyter-widgets/base",
"model_module_version": "1.2.0",
2023-06-18 22:44:55 +02:00
"model_name": "LayoutModel",
2023-06-18 18:22:31 +02:00
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
},
2023-06-18 22:44:55 +02:00
"b47c3295784648cf8847e198ee33c615": {
2023-06-18 18:22:31 +02:00
"model_module": "@jupyter-widgets/base",
"model_module_version": "1.2.0",
2023-06-18 22:44:55 +02:00
"model_name": "LayoutModel",
2023-06-18 18:22:31 +02:00
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
},
2023-06-18 22:44:55 +02:00
"b6aa40c7501f44178f14ac88b63f57cb": {
2023-06-18 18:22:31 +02:00
"model_module": "@jupyter-widgets/base",
"model_module_version": "1.2.0",
2023-06-18 22:44:55 +02:00
"model_name": "LayoutModel",
2023-06-18 18:22:31 +02:00
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
},
2023-06-18 22:44:55 +02:00
"b6afee105c69499f98cf0544ffe325cb": {
"model_module": "@jupyter-widgets/controls",
"model_module_version": "1.5.0",
"model_name": "FloatProgressModel",
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "FloatProgressModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
"_view_name": "ProgressView",
"bar_style": "success",
"description": "",
"description_tooltip": null,
"layout": "IPY_MODEL_083cd7a3ebb34bbf8940af58359a4848",
"max": 1535928,
"min": 0,
"orientation": "horizontal",
"style": "IPY_MODEL_4e16ca13c2dd46069b65dd48f3da8790",
"value": 1535928
}
},
"b7b911c6bca94858bb93ffbcb1daa736": {
2023-06-18 18:22:31 +02:00
"model_module": "@jupyter-widgets/base",
"model_module_version": "1.2.0",
2023-06-18 22:44:55 +02:00
"model_name": "LayoutModel",
2023-06-18 18:22:31 +02:00
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
},
2023-06-18 22:44:55 +02:00
"b7ef949a1eb0469fb0bd1be5256fa79a": {
2023-06-18 18:22:31 +02:00
"model_module": "@jupyter-widgets/controls",
"model_module_version": "1.5.0",
2023-06-18 22:44:55 +02:00
"model_name": "DescriptionStyleModel",
2023-06-18 18:22:31 +02:00
"state": {
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "DescriptionStyleModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "StyleView",
"description_width": ""
}
},
2023-06-18 22:44:55 +02:00
"bab30e40fedb43dc8e0044c80727c38b": {
2023-06-18 18:22:31 +02:00
"model_module": "@jupyter-widgets/base",
"model_module_version": "1.2.0",
2023-06-18 22:44:55 +02:00
"model_name": "LayoutModel",
2023-06-18 18:22:31 +02:00
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
},
2023-06-18 22:44:55 +02:00
"bbedc4f5cece4090ad997ce39d65e96a": {
"model_module": "@jupyter-widgets/controls",
"model_module_version": "1.5.0",
"model_name": "HTMLModel",
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "HTMLModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
"_view_name": "HTMLView",
"description": "",
"description_tooltip": null,
"layout": "IPY_MODEL_b47c3295784648cf8847e198ee33c615",
"placeholder": " ",
"style": "IPY_MODEL_ee47504dd7274dfb860a5c4355a37295",
"value": " 510M/510M [00:06<00:00, 58.7MB/s]"
}
},
"bfa116bd3e144c15b67bd97ff3c85fea": {
"model_module": "@jupyter-widgets/controls",
"model_module_version": "1.5.0",
"model_name": "ProgressStyleModel",
"state": {
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "ProgressStyleModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "StyleView",
"bar_color": null,
"description_width": ""
}
},
"c09398bd98554499805b5f14270e4248": {
2023-06-18 18:22:31 +02:00
"model_module": "@jupyter-widgets/controls",
"model_module_version": "1.5.0",
2023-06-18 22:44:55 +02:00
"model_name": "HBoxModel",
2023-06-18 18:22:31 +02:00
"state": {
2023-06-18 22:44:55 +02:00
"_dom_classes": [],
2023-06-18 18:22:31 +02:00
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
2023-06-18 22:44:55 +02:00
"_model_name": "HBoxModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
"_view_name": "HBoxView",
"box_style": "",
"children": [
"IPY_MODEL_c3b4b0254d8b4e4eb399ca3514d36211",
"IPY_MODEL_8adaa113d54247388e1355331451926a",
"IPY_MODEL_bbedc4f5cece4090ad997ce39d65e96a"
],
"layout": "IPY_MODEL_825fd5e9a017439995c67dcb3a7736b9"
}
},
"c1d658d5f21f4731895b397cc3fcb055": {
"model_module": "@jupyter-widgets/controls",
"model_module_version": "1.5.0",
"model_name": "DescriptionStyleModel",
"state": {
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "DescriptionStyleModel",
2023-06-18 18:22:31 +02:00
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "StyleView",
"description_width": ""
}
},
2023-06-18 22:44:55 +02:00
"c3b4b0254d8b4e4eb399ca3514d36211": {
"model_module": "@jupyter-widgets/controls",
"model_module_version": "1.5.0",
"model_name": "HTMLModel",
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "HTMLModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
"_view_name": "HTMLView",
"description": "",
"description_tooltip": null,
"layout": "IPY_MODEL_bab30e40fedb43dc8e0044c80727c38b",
"placeholder": " ",
"style": "IPY_MODEL_ffdbfdfd24f3433f9653a3a0b1a177d6",
"value": "Downloading pytorch_model.bin: 100%"
}
},
"c62c829fa4f346f4966f68e020c50813": {
"model_module": "@jupyter-widgets/controls",
"model_module_version": "1.5.0",
"model_name": "HTMLModel",
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "HTMLModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
"_view_name": "HTMLView",
"description": "",
"description_tooltip": null,
"layout": "IPY_MODEL_e7fafc300aa749a2bedd750295731307",
"placeholder": " ",
"style": "IPY_MODEL_05032586bc4d4f8c9a1fa023695e60ec",
"value": "Downloading added_tokens.json: 100%"
}
},
"ca47940201884085b556bbc7032f17f2": {
2023-06-18 18:22:31 +02:00
"model_module": "@jupyter-widgets/base",
"model_module_version": "1.2.0",
2023-06-18 22:44:55 +02:00
"model_name": "LayoutModel",
2023-06-18 18:22:31 +02:00
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
2023-06-18 22:44:55 +02:00
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
2023-06-18 18:22:31 +02:00
},
2023-06-18 22:44:55 +02:00
"d3f1817bcb0a4e8a85e0515898c13850": {
"model_module": "@jupyter-widgets/base",
"model_module_version": "1.2.0",
"model_name": "LayoutModel",
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
2023-06-18 18:22:31 +02:00
},
2023-06-18 22:44:55 +02:00
"dc277586ba1f4eeda104c895cf9a1626": {
"model_module": "@jupyter-widgets/controls",
"model_module_version": "1.5.0",
"model_name": "HBoxModel",
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "HBoxModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
"_view_name": "HBoxView",
"box_style": "",
"children": [
"IPY_MODEL_3b6bfbe260a9403c8216269b5032cde4",
"IPY_MODEL_a7d258bfe8644c38a56ca365ea9e4ab1",
"IPY_MODEL_0f75959ab6364a60b229051f0d5b2c68"
],
"layout": "IPY_MODEL_ca47940201884085b556bbc7032f17f2"
}
},
"e7fafc300aa749a2bedd750295731307": {
"model_module": "@jupyter-widgets/base",
"model_module_version": "1.2.0",
"model_name": "LayoutModel",
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
2023-06-18 18:22:31 +02:00
},
2023-06-18 22:44:55 +02:00
"e863997d8ce142798230810e384323ba": {
"model_module": "@jupyter-widgets/controls",
"model_module_version": "1.5.0",
"model_name": "DescriptionStyleModel",
"state": {
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "DescriptionStyleModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "StyleView",
"description_width": ""
}
2023-06-18 18:22:31 +02:00
},
2023-06-18 22:44:55 +02:00
"eadd02efcb204b20b3bfd8e99cde9ae3": {
"model_module": "@jupyter-widgets/controls",
"model_module_version": "1.5.0",
"model_name": "ProgressStyleModel",
"state": {
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "ProgressStyleModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "StyleView",
"bar_color": null,
"description_width": ""
}
2023-06-18 18:22:31 +02:00
},
2023-06-18 22:44:55 +02:00
"eb4e61e04bc04929be057a5a960feb9d": {
"model_module": "@jupyter-widgets/base",
"model_module_version": "1.2.0",
"model_name": "LayoutModel",
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
},
"ee47504dd7274dfb860a5c4355a37295": {
"model_module": "@jupyter-widgets/controls",
"model_module_version": "1.5.0",
"model_name": "DescriptionStyleModel",
"state": {
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "DescriptionStyleModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "StyleView",
"description_width": ""
}
},
"f10ed53b98304b6197789308330e1bf8": {
"model_module": "@jupyter-widgets/controls",
"model_module_version": "1.5.0",
"model_name": "FloatProgressModel",
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "FloatProgressModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
"_view_name": "ProgressView",
"bar_style": "success",
"description": "",
"description_tooltip": null,
"layout": "IPY_MODEL_7e56e3fd676440d0a23ca09f8b5c7d4e",
"max": 24,
"min": 0,
"orientation": "horizontal",
"style": "IPY_MODEL_855d7b31b1a44fb9b667e84f30bd121a",
"value": 24
}
2023-06-18 18:22:31 +02:00
},
2023-06-18 22:44:55 +02:00
"f125275065c64b6ca55f0767737a488a": {
"model_module": "@jupyter-widgets/base",
"model_module_version": "1.2.0",
"model_name": "LayoutModel",
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
2023-06-18 18:22:31 +02:00
},
2023-06-18 22:44:55 +02:00
"f380816f81d046b880b12a429d624c2f": {
"model_module": "@jupyter-widgets/controls",
"model_module_version": "1.5.0",
"model_name": "ProgressStyleModel",
"state": {
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "ProgressStyleModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "StyleView",
"bar_color": null,
"description_width": ""
}
},
"f7687d83ee0149248610c40d4d86d944": {
"model_module": "@jupyter-widgets/base",
"model_module_version": "1.2.0",
"model_name": "LayoutModel",
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
2023-06-18 18:22:31 +02:00
},
2023-06-18 22:44:55 +02:00
"f95ffcc1b9564519aa1f1c81e2d16dbf": {
"model_module": "@jupyter-widgets/base",
"model_module_version": "1.2.0",
"model_name": "LayoutModel",
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
2023-06-18 18:22:31 +02:00
},
2023-06-18 22:44:55 +02:00
"fc1af3db81b243178157ee330f62ff3c": {
"model_module": "@jupyter-widgets/base",
"model_module_version": "1.2.0",
"model_name": "LayoutModel",
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
2023-06-18 18:22:31 +02:00
},
2023-06-18 22:44:55 +02:00
"ff2160ef3ab14d4682cfbb1b878af62f": {
"model_module": "@jupyter-widgets/controls",
"model_module_version": "1.5.0",
"model_name": "FloatProgressModel",
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "FloatProgressModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
"_view_name": "ProgressView",
"bar_style": "success",
"description": "",
"description_tooltip": null,
"layout": "IPY_MODEL_53f98231a2c140efbd0a1d2d25367b1f",
"max": 888217,
"min": 0,
"orientation": "horizontal",
"style": "IPY_MODEL_367f3aae32ab4e1b9f67f3cd29299c5b",
"value": 888217
}
2023-06-18 18:22:31 +02:00
},
2023-06-18 22:44:55 +02:00
"ffdbfdfd24f3433f9653a3a0b1a177d6": {
"model_module": "@jupyter-widgets/controls",
"model_module_version": "1.5.0",
"model_name": "DescriptionStyleModel",
"state": {
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "DescriptionStyleModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "StyleView",
"description_width": ""
}
2023-06-18 18:22:31 +02:00
}
2023-06-18 22:44:55 +02:00
}
2023-06-18 18:22:31 +02:00
}
2023-06-18 22:44:55 +02:00
},
"nbformat": 4,
"nbformat_minor": 0
2023-06-18 18:22:31 +02:00
}