paranormal-or-skeptic/transformery.ipynb
Iwona Christop f8ce7024e4 s443930
2022-06-22 23:34:30 +02:00

1719 lines
82 KiB
Plaintext
Raw Blame History

This file contains invisible Unicode characters

This file contains invisible Unicode characters that are indistinguishable to humans but may be processed differently by a computer. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

{
"nbformat": 4,
"nbformat_minor": 0,
"metadata": {
"colab": {
"name": "transformery.ipynb",
"provenance": [],
"collapsed_sections": []
},
"kernelspec": {
"name": "python3",
"display_name": "Python 3"
},
"language_info": {
"name": "python"
},
"gpuClass": "standard",
"accelerator": "GPU",
"widgets": {
"application/vnd.jupyter.widget-state+json": {
"edb0a9e2b5624067bad7e49f7260304e": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HBoxModel",
"model_module_version": "1.5.0",
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "HBoxModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
"_view_name": "HBoxView",
"box_style": "",
"children": [
"IPY_MODEL_3e3de49abd93447d97d630900c0998a6",
"IPY_MODEL_2d5a1f551f7747e79d7749b7e0bb06c7",
"IPY_MODEL_fca439193c054ca9b016cfe4233e0cef"
],
"layout": "IPY_MODEL_c6a52195933146748c69d158c5fecb36"
}
},
"3e3de49abd93447d97d630900c0998a6": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HTMLModel",
"model_module_version": "1.5.0",
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "HTMLModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
"_view_name": "HTMLView",
"description": "",
"description_tooltip": null,
"layout": "IPY_MODEL_9f04902c9f414aafa3138c2ea24c79c4",
"placeholder": "",
"style": "IPY_MODEL_762b7b38f26547cfbc69a23c9caa05db",
"value": "Downloading: 100%"
}
},
"2d5a1f551f7747e79d7749b7e0bb06c7": {
"model_module": "@jupyter-widgets/controls",
"model_name": "FloatProgressModel",
"model_module_version": "1.5.0",
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "FloatProgressModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
"_view_name": "ProgressView",
"bar_style": "success",
"description": "",
"description_tooltip": null,
"layout": "IPY_MODEL_98833c8af5c54a99bf5eea5717cb6907",
"max": 116252865,
"min": 0,
"orientation": "horizontal",
"style": "IPY_MODEL_7e67bd6e851d4086b6e4c4c8599a1b0d",
"value": 116252865
}
},
"fca439193c054ca9b016cfe4233e0cef": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HTMLModel",
"model_module_version": "1.5.0",
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "HTMLModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
"_view_name": "HTMLView",
"description": "",
"description_tooltip": null,
"layout": "IPY_MODEL_84c7a3e70aa249c8bb4d007d934d2f8d",
"placeholder": "",
"style": "IPY_MODEL_c7994559d8754fdd8936c019beb304b1",
"value": " 111M/111M [00:02<00:00, 45.2MB/s]"
}
},
"c6a52195933146748c69d158c5fecb36": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
},
"9f04902c9f414aafa3138c2ea24c79c4": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
},
"762b7b38f26547cfbc69a23c9caa05db": {
"model_module": "@jupyter-widgets/controls",
"model_name": "DescriptionStyleModel",
"model_module_version": "1.5.0",
"state": {
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "DescriptionStyleModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "StyleView",
"description_width": ""
}
},
"98833c8af5c54a99bf5eea5717cb6907": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
},
"7e67bd6e851d4086b6e4c4c8599a1b0d": {
"model_module": "@jupyter-widgets/controls",
"model_name": "ProgressStyleModel",
"model_module_version": "1.5.0",
"state": {
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "ProgressStyleModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "StyleView",
"bar_color": null,
"description_width": ""
}
},
"84c7a3e70aa249c8bb4d007d934d2f8d": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
},
"c7994559d8754fdd8936c019beb304b1": {
"model_module": "@jupyter-widgets/controls",
"model_name": "DescriptionStyleModel",
"model_module_version": "1.5.0",
"state": {
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "DescriptionStyleModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "StyleView",
"description_width": ""
}
}
}
}
},
"cells": [
{
"cell_type": "code",
"source": [
"# Pinned to the release this notebook was last run with, so a fresh runtime resolves the same API.\n",
"%pip install transformers==4.20.1"
],
"metadata": {
"colab": {
"base_uri": "https://localhost:8080/"
},
"id": "SdT79WnDl6Tv",
"outputId": "8a5475ba-b438-43b2-8169-bdf38f26b04a"
},
"execution_count": 1,
"outputs": [
{
"output_type": "stream",
"name": "stdout",
"text": [
"Looking in indexes: https://pypi.org/simple, https://us-python.pkg.dev/colab-wheels/public/simple/\n",
"Collecting transformers\n",
" Downloading transformers-4.20.1-py3-none-any.whl (4.4 MB)\n",
"\u001b[K |████████████████████████████████| 4.4 MB 25.8 MB/s \n",
"\u001b[?25hCollecting huggingface-hub<1.0,>=0.1.0\n",
" Downloading huggingface_hub-0.8.1-py3-none-any.whl (101 kB)\n",
"\u001b[K |████████████████████████████████| 101 kB 14.1 MB/s \n",
"\u001b[?25hRequirement already satisfied: requests in /usr/local/lib/python3.7/dist-packages (from transformers) (2.23.0)\n",
"Requirement already satisfied: regex!=2019.12.17 in /usr/local/lib/python3.7/dist-packages (from transformers) (2022.6.2)\n",
"Requirement already satisfied: tqdm>=4.27 in /usr/local/lib/python3.7/dist-packages (from transformers) (4.64.0)\n",
"Collecting tokenizers!=0.11.3,<0.13,>=0.11.1\n",
" Downloading tokenizers-0.12.1-cp37-cp37m-manylinux_2_12_x86_64.manylinux2010_x86_64.whl (6.6 MB)\n",
"\u001b[K |████████████████████████████████| 6.6 MB 56.5 MB/s \n",
"\u001b[?25hRequirement already satisfied: numpy>=1.17 in /usr/local/lib/python3.7/dist-packages (from transformers) (1.21.6)\n",
"Requirement already satisfied: importlib-metadata in /usr/local/lib/python3.7/dist-packages (from transformers) (4.11.4)\n",
"Collecting pyyaml>=5.1\n",
" Downloading PyYAML-6.0-cp37-cp37m-manylinux_2_5_x86_64.manylinux1_x86_64.manylinux_2_12_x86_64.manylinux2010_x86_64.whl (596 kB)\n",
"\u001b[K |████████████████████████████████| 596 kB 41.7 MB/s \n",
"\u001b[?25hRequirement already satisfied: packaging>=20.0 in /usr/local/lib/python3.7/dist-packages (from transformers) (21.3)\n",
"Requirement already satisfied: filelock in /usr/local/lib/python3.7/dist-packages (from transformers) (3.7.1)\n",
"Requirement already satisfied: typing-extensions>=3.7.4.3 in /usr/local/lib/python3.7/dist-packages (from huggingface-hub<1.0,>=0.1.0->transformers) (4.1.1)\n",
"Requirement already satisfied: pyparsing!=3.0.5,>=2.0.2 in /usr/local/lib/python3.7/dist-packages (from packaging>=20.0->transformers) (3.0.9)\n",
"Requirement already satisfied: zipp>=0.5 in /usr/local/lib/python3.7/dist-packages (from importlib-metadata->transformers) (3.8.0)\n",
"Requirement already satisfied: chardet<4,>=3.0.2 in /usr/local/lib/python3.7/dist-packages (from requests->transformers) (3.0.4)\n",
"Requirement already satisfied: idna<3,>=2.5 in /usr/local/lib/python3.7/dist-packages (from requests->transformers) (2.10)\n",
"Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.7/dist-packages (from requests->transformers) (2022.6.15)\n",
"Requirement already satisfied: urllib3!=1.25.0,!=1.25.1,<1.26,>=1.21.1 in /usr/local/lib/python3.7/dist-packages (from requests->transformers) (1.24.3)\n",
"Installing collected packages: pyyaml, tokenizers, huggingface-hub, transformers\n",
" Attempting uninstall: pyyaml\n",
" Found existing installation: PyYAML 3.13\n",
" Uninstalling PyYAML-3.13:\n",
" Successfully uninstalled PyYAML-3.13\n",
"Successfully installed huggingface-hub-0.8.1 pyyaml-6.0 tokenizers-0.12.1 transformers-4.20.1\n"
]
}
]
},
{
"cell_type": "code",
"execution_count": 2,
"metadata": {
"id": "wRXCvVeYk5bW"
},
"outputs": [],
"source": [
"import csv, lzma\n",
"\n",
"def io_read(dir):\n",
"    \"\"\"Read a dataset file and return its rows as a list.\n",
"\n",
"    A file whose name ends in ``.xz`` is decompressed, decoded as UTF-8 and\n",
"    split on tabs, so every row is a list of column strings. Any other file\n",
"    is read as UTF-8 text and every row is the line itself. The trailing\n",
"    newline is removed from each row in both cases.\n",
"\n",
"    dir: path of the file to read (str or os.PathLike).\n",
"    \"\"\"\n",
"    rows = []\n",
"    # Decide by extension: a bare substring test also matches paths that\n",
"    # merely contain 'xz' somewhere, e.g. in a directory name.\n",
"    if str(dir).endswith('.xz'):\n",
"        with lzma.open(dir) as f:\n",
"            # Binary iteration splits on '\\n' only, so a stray '\\r' inside a\n",
"            # text field cannot change the number of rows.\n",
"            for raw in f:\n",
"                rows.append(raw.decode('utf-8').rstrip('\\n').split('\\t'))\n",
"    else:\n",
"        with open(dir, encoding='utf-8') as f:\n",
"            for line in f:\n",
"                rows.append(line.rstrip('\\n'))\n",
"    return rows\n",
"\n",
"def io_write(output, dir):\n",
"    \"\"\"Write ``output`` to the file at ``dir`` as CSV, one row per item.\n",
"\n",
"    output: iterable of rows, each row an iterable of cell values.\n",
"    dir: path of the file to create or overwrite.\n",
"    \"\"\"\n",
"    # newline='' leaves line endings to the csv module.\n",
"    with open(dir, mode='w', newline='') as sink:\n",
"        csv.writer(sink).writerows(output)"
]
},
{
"cell_type": "code",
"source": [
"# Root folder of the challenge data.\n",
"# NOTE(review): the path lives under /content/drive and the execution counts jump from 2 to 4,\n",
"# so a Drive-mount cell was presumably removed - confirm it is restored before Run All.\n",
"DATA_DIR = '/content/drive/MyDrive/ai-tech/eki/paranormal-or-skeptic'\n",
"\n",
"# Only the first tab-separated column of in.tsv.xz is used as model input.\n",
"x_train = [x[0] for x in io_read(f'{DATA_DIR}/train/in.tsv.xz')]\n",
"y_train = [int(y) for y in io_read(f'{DATA_DIR}/train/expected.tsv')]\n",
"\n",
"# Inputs and labels are paired by position, so the two lists must line up.\n",
"assert len(x_train) == len(y_train), 'train inputs and labels differ in length'\n",
"\n",
"# x_dev = [x[0] for x in io_read(f'{DATA_DIR}/dev-0/in.tsv.xz')]\n",
"# y_dev = [int(y) for y in io_read(f'{DATA_DIR}/dev-0/expected.tsv')]\n",
"\n",
"# x_test = [x[0] for x in io_read(f'{DATA_DIR}/test-A/in.tsv.xz')]"
],
"metadata": {
"id": "KOogjYiElR5v"
},
"execution_count": 4,
"outputs": []
},
{
"cell_type": "code",
"source": [
"from transformers import BertTokenizerFast\n",
"\n",
"# Checkpoint name used to load the tokenizer here.\n",
"model_name = \"google/bert_uncased_L-4_H-512_A-8\"\n",
"tokenizer = BertTokenizerFast.from_pretrained(model_name)\n",
"\n",
"# Every text is truncated or padded to exactly 128 tokens.\n",
"train_encodings = tokenizer(\n",
"    x_train,\n",
"    max_length=128,\n",
"    padding='max_length',\n",
"    truncation=True,\n",
")"
],
"metadata": {
"id": "2aIRZ0gcLBXg"
},
"execution_count": 6,
"outputs": []
},
{
"cell_type": "code",
"source": [
"import torch\n",
"\n",
"class Dataset(torch.utils.data.Dataset):\n",
"    \"\"\"Dataset over tokenizer encodings with optional labels.\n",
"\n",
"    encodings: mapping from field name to a per-example sequence; it must\n",
"        contain \"input_ids\", whose length is the dataset length.\n",
"    labels: optional per-example labels; when omitted or empty, items\n",
"        carry no \"labels\" entry.\n",
"    \"\"\"\n",
"\n",
"    def __init__(self, encodings, labels=None):\n",
"        self.encodings = encodings\n",
"        self.labels = labels\n",
"\n",
"    def __getitem__(self, idx):\n",
"        \"\"\"Return example ``idx`` as a dict of tensors, one per encoding field.\"\"\"\n",
"        item = {key: torch.tensor(val[idx]) for key, val in self.encodings.items()}\n",
"        # Check presence explicitly: truth-testing a multi-element NumPy array\n",
"        # or tensor raises instead of answering whether labels were given.\n",
"        if self.labels is not None and len(self.labels) > 0:\n",
"            item[\"labels\"] = torch.tensor(self.labels[idx])\n",
"        return item\n",
"\n",
"    def __len__(self):\n",
"        \"\"\"Number of examples, taken from the \"input_ids\" field.\"\"\"\n",
"        return len(self.encodings[\"input_ids\"])"
],
"metadata": {
"id": "9jNTGg77Elnu"
},
"execution_count": 7,
"outputs": []
},
{
"cell_type": "code",
"source": [
"# Pair the tokenized training texts with their labels.\n",
"train_dataset = Dataset(encodings=train_encodings, labels=y_train)"
],
"metadata": {
"id": "h88hD-xvLKe0"
},
"execution_count": 8,
"outputs": []
},
{
"cell_type": "code",
"source": [
"from transformers import BertForSequenceClassification\n",
"\n",
"# Load the checkpoint named by model_name into a sequence-classification model.\n",
"model = BertForSequenceClassification.from_pretrained(\n",
"    model_name,\n",
")"
],
"metadata": {
"colab": {
"base_uri": "https://localhost:8080/",
"height": 161,
"referenced_widgets": [
"edb0a9e2b5624067bad7e49f7260304e",
"3e3de49abd93447d97d630900c0998a6",
"2d5a1f551f7747e79d7749b7e0bb06c7",
"fca439193c054ca9b016cfe4233e0cef",
"c6a52195933146748c69d158c5fecb36",
"9f04902c9f414aafa3138c2ea24c79c4",
"762b7b38f26547cfbc69a23c9caa05db",
"98833c8af5c54a99bf5eea5717cb6907",
"7e67bd6e851d4086b6e4c4c8599a1b0d",
"84c7a3e70aa249c8bb4d007d934d2f8d",
"c7994559d8754fdd8936c019beb304b1"
]
},
"id": "iLovBI-GnEad",
"outputId": "e2eb76cb-1143-4a8e-ec56-2d48a90427e3"
},
"execution_count": 9,
"outputs": [
{
"output_type": "display_data",
"data": {
"text/plain": [
"Downloading: 0%| | 0.00/111M [00:00<?, ?B/s]"
],
"application/vnd.jupyter.widget-view+json": {
"version_major": 2,
"version_minor": 0,
"model_id": "edb0a9e2b5624067bad7e49f7260304e"
}
},
"metadata": {}
},
{
"output_type": "stream",
"name": "stderr",
"text": [
"Some weights of the model checkpoint at google/bert_uncased_L-4_H-512_A-8 were not used when initializing BertForSequenceClassification: ['cls.predictions.transform.dense.bias', 'cls.predictions.transform.LayerNorm.bias', 'cls.predictions.transform.dense.weight', 'cls.seq_relationship.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.decoder.bias', 'cls.seq_relationship.weight', 'cls.predictions.bias', 'cls.predictions.decoder.weight']\n",
"- This IS expected if you are initializing BertForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).\n",
"- This IS NOT expected if you are initializing BertForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).\n",
"Some weights of BertForSequenceClassification were not initialized from the model checkpoint at google/bert_uncased_L-4_H-512_A-8 and are newly initialized: ['classifier.bias', 'classifier.weight']\n",
"You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n"
]
}
]
},
{
"cell_type": "code",
"source": [
"# Freeze the base model: none of its parameters will receive gradients.\n",
"for frozen_param in model.base_model.parameters():\n",
"    frozen_param.requires_grad_(False)"
],
"metadata": {
"id": "XH__qS88LY94"
},
"execution_count": 10,
"outputs": []
},
{
"cell_type": "code",
"source": [
"from transformers import TrainingArguments, Trainer\n",
"\n",
"# Only the values below are overridden; every other setting keeps the library default.\n",
"# NOTE(review): the base model's parameters are frozen before this cell and the logged\n",
"# training loss stays between roughly 0.52 and 0.55 for the whole run - the learning\n",
"# rate may be too low when only the classification head is trained; confirm.\n",
"training_args = TrainingArguments(\n",
"    output_dir=\"./results\",\n",
"    num_train_epochs=3,\n",
"    per_device_train_batch_size=16,\n",
"    learning_rate=2e-5,\n",
"    warmup_steps=500,\n",
"    weight_decay=0.01,\n",
"    # Older checkpoints in output_dir are deleted as new ones are saved.\n",
"    save_total_limit=1,\n",
")\n",
"\n",
"# No eval_dataset is passed, so this trainer only trains.\n",
"trainer = Trainer(\n",
"    model=model,\n",
"    args=training_args,\n",
"    train_dataset=train_dataset,\n",
")"
],
"metadata": {
"id": "NfqNobUtnzbW",
"colab": {
"base_uri": "https://localhost:8080/"
},
"outputId": "a0a099db-7b24-4c66-cad5-4c1beb5d443b"
},
"execution_count": 13,
"outputs": [
{
"output_type": "stream",
"name": "stderr",
"text": [
"PyTorch: setting up devices\n",
"The default value for the training argument `--report_to` will change in v5 (from all installed integrations to none). In v5, you will need to use `--report_to all` to get the same behavior as now. You should start updating your code and make this info disappear :-).\n"
]
}
]
},
{
"cell_type": "code",
"source": [
"# Run the training loop with the trainer configured above.\n",
"trainer.train()"
],
"metadata": {
"colab": {
"base_uri": "https://localhost:8080/",
"height": 1000
},
"id": "x5JXgCjno7IC",
"outputId": "86627a7f-20ec-4ba2-a517-2b04e2626a0e"
},
"execution_count": 14,
"outputs": [
{
"output_type": "stream",
"name": "stderr",
"text": [
"/usr/local/lib/python3.7/dist-packages/transformers/optimization.py:310: FutureWarning: This implementation of AdamW is deprecated and will be removed in a future version. Use the PyTorch implementation torch.optim.AdamW instead, or set `no_deprecation_warning=True` to disable this warning\n",
" FutureWarning,\n",
"***** Running training *****\n",
" Num examples = 289579\n",
" Num Epochs = 3\n",
" Instantaneous batch size per device = 16\n",
" Total train batch size (w. parallel, distributed & accumulation) = 16\n",
" Gradient Accumulation steps = 1\n",
" Total optimization steps = 54297\n"
]
},
{
"output_type": "display_data",
"data": {
"text/plain": [
"<IPython.core.display.HTML object>"
],
"text/html": [
"\n",
" <div>\n",
" \n",
" <progress value='54297' max='54297' style='width:300px; height:20px; vertical-align: middle;'></progress>\n",
" [54297/54297 21:16, Epoch 3/3]\n",
" </div>\n",
" <table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: left;\">\n",
" <th>Step</th>\n",
" <th>Training Loss</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <td>500</td>\n",
" <td>0.552400</td>\n",
" </tr>\n",
" <tr>\n",
" <td>1000</td>\n",
" <td>0.542700</td>\n",
" </tr>\n",
" <tr>\n",
" <td>1500</td>\n",
" <td>0.552900</td>\n",
" </tr>\n",
" <tr>\n",
" <td>2000</td>\n",
" <td>0.549600</td>\n",
" </tr>\n",
" <tr>\n",
" <td>2500</td>\n",
" <td>0.548200</td>\n",
" </tr>\n",
" <tr>\n",
" <td>3000</td>\n",
" <td>0.546700</td>\n",
" </tr>\n",
" <tr>\n",
" <td>3500</td>\n",
" <td>0.546100</td>\n",
" </tr>\n",
" <tr>\n",
" <td>4000</td>\n",
" <td>0.545600</td>\n",
" </tr>\n",
" <tr>\n",
" <td>4500</td>\n",
" <td>0.544800</td>\n",
" </tr>\n",
" <tr>\n",
" <td>5000</td>\n",
" <td>0.546000</td>\n",
" </tr>\n",
" <tr>\n",
" <td>5500</td>\n",
" <td>0.545800</td>\n",
" </tr>\n",
" <tr>\n",
" <td>6000</td>\n",
" <td>0.541200</td>\n",
" </tr>\n",
" <tr>\n",
" <td>6500</td>\n",
" <td>0.536100</td>\n",
" </tr>\n",
" <tr>\n",
" <td>7000</td>\n",
" <td>0.537200</td>\n",
" </tr>\n",
" <tr>\n",
" <td>7500</td>\n",
" <td>0.545700</td>\n",
" </tr>\n",
" <tr>\n",
" <td>8000</td>\n",
" <td>0.543100</td>\n",
" </tr>\n",
" <tr>\n",
" <td>8500</td>\n",
" <td>0.548600</td>\n",
" </tr>\n",
" <tr>\n",
" <td>9000</td>\n",
" <td>0.538600</td>\n",
" </tr>\n",
" <tr>\n",
" <td>9500</td>\n",
" <td>0.540100</td>\n",
" </tr>\n",
" <tr>\n",
" <td>10000</td>\n",
" <td>0.543100</td>\n",
" </tr>\n",
" <tr>\n",
" <td>10500</td>\n",
" <td>0.540700</td>\n",
" </tr>\n",
" <tr>\n",
" <td>11000</td>\n",
" <td>0.541200</td>\n",
" </tr>\n",
" <tr>\n",
" <td>11500</td>\n",
" <td>0.542100</td>\n",
" </tr>\n",
" <tr>\n",
" <td>12000</td>\n",
" <td>0.538600</td>\n",
" </tr>\n",
" <tr>\n",
" <td>12500</td>\n",
" <td>0.535000</td>\n",
" </tr>\n",
" <tr>\n",
" <td>13000</td>\n",
" <td>0.538300</td>\n",
" </tr>\n",
" <tr>\n",
" <td>13500</td>\n",
" <td>0.546500</td>\n",
" </tr>\n",
" <tr>\n",
" <td>14000</td>\n",
" <td>0.541200</td>\n",
" </tr>\n",
" <tr>\n",
" <td>14500</td>\n",
" <td>0.530200</td>\n",
" </tr>\n",
" <tr>\n",
" <td>15000</td>\n",
" <td>0.532000</td>\n",
" </tr>\n",
" <tr>\n",
" <td>15500</td>\n",
" <td>0.535000</td>\n",
" </tr>\n",
" <tr>\n",
" <td>16000</td>\n",
" <td>0.540900</td>\n",
" </tr>\n",
" <tr>\n",
" <td>16500</td>\n",
" <td>0.543100</td>\n",
" </tr>\n",
" <tr>\n",
" <td>17000</td>\n",
" <td>0.538300</td>\n",
" </tr>\n",
" <tr>\n",
" <td>17500</td>\n",
" <td>0.544900</td>\n",
" </tr>\n",
" <tr>\n",
" <td>18000</td>\n",
" <td>0.538400</td>\n",
" </tr>\n",
" <tr>\n",
" <td>18500</td>\n",
" <td>0.539000</td>\n",
" </tr>\n",
" <tr>\n",
" <td>19000</td>\n",
" <td>0.544100</td>\n",
" </tr>\n",
" <tr>\n",
" <td>19500</td>\n",
" <td>0.541900</td>\n",
" </tr>\n",
" <tr>\n",
" <td>20000</td>\n",
" <td>0.537700</td>\n",
" </tr>\n",
" <tr>\n",
" <td>20500</td>\n",
" <td>0.527200</td>\n",
" </tr>\n",
" <tr>\n",
" <td>21000</td>\n",
" <td>0.535400</td>\n",
" </tr>\n",
" <tr>\n",
" <td>21500</td>\n",
" <td>0.542500</td>\n",
" </tr>\n",
" <tr>\n",
" <td>22000</td>\n",
" <td>0.533400</td>\n",
" </tr>\n",
" <tr>\n",
" <td>22500</td>\n",
" <td>0.534400</td>\n",
" </tr>\n",
" <tr>\n",
" <td>23000</td>\n",
" <td>0.534100</td>\n",
" </tr>\n",
" <tr>\n",
" <td>23500</td>\n",
" <td>0.538500</td>\n",
" </tr>\n",
" <tr>\n",
" <td>24000</td>\n",
" <td>0.533100</td>\n",
" </tr>\n",
" <tr>\n",
" <td>24500</td>\n",
" <td>0.532800</td>\n",
" </tr>\n",
" <tr>\n",
" <td>25000</td>\n",
" <td>0.542600</td>\n",
" </tr>\n",
" <tr>\n",
" <td>25500</td>\n",
" <td>0.531200</td>\n",
" </tr>\n",
" <tr>\n",
" <td>26000</td>\n",
" <td>0.532100</td>\n",
" </tr>\n",
" <tr>\n",
" <td>26500</td>\n",
" <td>0.535500</td>\n",
" </tr>\n",
" <tr>\n",
" <td>27000</td>\n",
" <td>0.543600</td>\n",
" </tr>\n",
" <tr>\n",
" <td>27500</td>\n",
" <td>0.527600</td>\n",
" </tr>\n",
" <tr>\n",
" <td>28000</td>\n",
" <td>0.529800</td>\n",
" </tr>\n",
" <tr>\n",
" <td>28500</td>\n",
" <td>0.537800</td>\n",
" </tr>\n",
" <tr>\n",
" <td>29000</td>\n",
" <td>0.537900</td>\n",
" </tr>\n",
" <tr>\n",
" <td>29500</td>\n",
" <td>0.538700</td>\n",
" </tr>\n",
" <tr>\n",
" <td>30000</td>\n",
" <td>0.535400</td>\n",
" </tr>\n",
" <tr>\n",
" <td>30500</td>\n",
" <td>0.544600</td>\n",
" </tr>\n",
" <tr>\n",
" <td>31000</td>\n",
" <td>0.537100</td>\n",
" </tr>\n",
" <tr>\n",
" <td>31500</td>\n",
" <td>0.529200</td>\n",
" </tr>\n",
" <tr>\n",
" <td>32000</td>\n",
" <td>0.539300</td>\n",
" </tr>\n",
" <tr>\n",
" <td>32500</td>\n",
" <td>0.534800</td>\n",
" </tr>\n",
" <tr>\n",
" <td>33000</td>\n",
" <td>0.538100</td>\n",
" </tr>\n",
" <tr>\n",
" <td>33500</td>\n",
" <td>0.536100</td>\n",
" </tr>\n",
" <tr>\n",
" <td>34000</td>\n",
" <td>0.540800</td>\n",
" </tr>\n",
" <tr>\n",
" <td>34500</td>\n",
" <td>0.544600</td>\n",
" </tr>\n",
" <tr>\n",
" <td>35000</td>\n",
" <td>0.541200</td>\n",
" </tr>\n",
" <tr>\n",
" <td>35500</td>\n",
" <td>0.536500</td>\n",
" </tr>\n",
" <tr>\n",
" <td>36000</td>\n",
" <td>0.531600</td>\n",
" </tr>\n",
" <tr>\n",
" <td>36500</td>\n",
" <td>0.541100</td>\n",
" </tr>\n",
" <tr>\n",
" <td>37000</td>\n",
" <td>0.535600</td>\n",
" </tr>\n",
" <tr>\n",
" <td>37500</td>\n",
" <td>0.533100</td>\n",
" </tr>\n",
" <tr>\n",
" <td>38000</td>\n",
" <td>0.530700</td>\n",
" </tr>\n",
" <tr>\n",
" <td>38500</td>\n",
" <td>0.526200</td>\n",
" </tr>\n",
" <tr>\n",
" <td>39000</td>\n",
" <td>0.539200</td>\n",
" </tr>\n",
" <tr>\n",
" <td>39500</td>\n",
" <td>0.530500</td>\n",
" </tr>\n",
" <tr>\n",
" <td>40000</td>\n",
" <td>0.535000</td>\n",
" </tr>\n",
" <tr>\n",
" <td>40500</td>\n",
" <td>0.532100</td>\n",
" </tr>\n",
" <tr>\n",
" <td>41000</td>\n",
" <td>0.523400</td>\n",
" </tr>\n",
" <tr>\n",
" <td>41500</td>\n",
" <td>0.533900</td>\n",
" </tr>\n",
" <tr>\n",
" <td>42000</td>\n",
" <td>0.534600</td>\n",
" </tr>\n",
" <tr>\n",
" <td>42500</td>\n",
" <td>0.530300</td>\n",
" </tr>\n",
" <tr>\n",
" <td>43000</td>\n",
" <td>0.543600</td>\n",
" </tr>\n",
" <tr>\n",
" <td>43500</td>\n",
" <td>0.531700</td>\n",
" </tr>\n",
" <tr>\n",
" <td>44000</td>\n",
" <td>0.535400</td>\n",
" </tr>\n",
" <tr>\n",
" <td>44500</td>\n",
" <td>0.524000</td>\n",
" </tr>\n",
" <tr>\n",
" <td>45000</td>\n",
" <td>0.534900</td>\n",
" </tr>\n",
" <tr>\n",
" <td>45500</td>\n",
" <td>0.537900</td>\n",
" </tr>\n",
" <tr>\n",
" <td>46000</td>\n",
" <td>0.539000</td>\n",
" </tr>\n",
" <tr>\n",
" <td>46500</td>\n",
" <td>0.537600</td>\n",
" </tr>\n",
" <tr>\n",
" <td>47000</td>\n",
" <td>0.535000</td>\n",
" </tr>\n",
" <tr>\n",
" <td>47500</td>\n",
" <td>0.540500</td>\n",
" </tr>\n",
" <tr>\n",
" <td>48000</td>\n",
" <td>0.535000</td>\n",
" </tr>\n",
" <tr>\n",
" <td>48500</td>\n",
" <td>0.540900</td>\n",
" </tr>\n",
" <tr>\n",
" <td>49000</td>\n",
" <td>0.535700</td>\n",
" </tr>\n",
" <tr>\n",
" <td>49500</td>\n",
" <td>0.531900</td>\n",
" </tr>\n",
" <tr>\n",
" <td>50000</td>\n",
" <td>0.535700</td>\n",
" </tr>\n",
" <tr>\n",
" <td>50500</td>\n",
" <td>0.531900</td>\n",
" </tr>\n",
" <tr>\n",
" <td>51000</td>\n",
" <td>0.535600</td>\n",
" </tr>\n",
" <tr>\n",
" <td>51500</td>\n",
" <td>0.538700</td>\n",
" </tr>\n",
" <tr>\n",
" <td>52000</td>\n",
" <td>0.536400</td>\n",
" </tr>\n",
" <tr>\n",
" <td>52500</td>\n",
" <td>0.536500</td>\n",
" </tr>\n",
" <tr>\n",
" <td>53000</td>\n",
" <td>0.539100</td>\n",
" </tr>\n",
" <tr>\n",
" <td>53500</td>\n",
" <td>0.526300</td>\n",
" </tr>\n",
" <tr>\n",
" <td>54000</td>\n",
" <td>0.525300</td>\n",
" </tr>\n",
" </tbody>\n",
"</table><p>"
]
},
"metadata": {}
},
{
"output_type": "stream",
"name": "stderr",
"text": [
"Saving model checkpoint to ./results/checkpoint-500\n",
"Configuration saved in ./results/checkpoint-500/config.json\n",
"Model weights saved in ./results/checkpoint-500/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-18000] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-1000\n",
"Configuration saved in ./results/checkpoint-1000/config.json\n",
"Model weights saved in ./results/checkpoint-1000/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-500] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-1500\n",
"Configuration saved in ./results/checkpoint-1500/config.json\n",
"Model weights saved in ./results/checkpoint-1500/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-1000] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-2000\n",
"Configuration saved in ./results/checkpoint-2000/config.json\n",
"Model weights saved in ./results/checkpoint-2000/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-1500] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-2500\n",
"Configuration saved in ./results/checkpoint-2500/config.json\n",
"Model weights saved in ./results/checkpoint-2500/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-2000] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-3000\n",
"Configuration saved in ./results/checkpoint-3000/config.json\n",
"Model weights saved in ./results/checkpoint-3000/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-2500] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-3500\n",
"Configuration saved in ./results/checkpoint-3500/config.json\n",
"Model weights saved in ./results/checkpoint-3500/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-3000] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-4000\n",
"Configuration saved in ./results/checkpoint-4000/config.json\n",
"Model weights saved in ./results/checkpoint-4000/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-3500] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-4500\n",
"Configuration saved in ./results/checkpoint-4500/config.json\n",
"Model weights saved in ./results/checkpoint-4500/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-4000] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-5000\n",
"Configuration saved in ./results/checkpoint-5000/config.json\n",
"Model weights saved in ./results/checkpoint-5000/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-4500] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-5500\n",
"Configuration saved in ./results/checkpoint-5500/config.json\n",
"Model weights saved in ./results/checkpoint-5500/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-5000] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-6000\n",
"Configuration saved in ./results/checkpoint-6000/config.json\n",
"Model weights saved in ./results/checkpoint-6000/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-5500] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-6500\n",
"Configuration saved in ./results/checkpoint-6500/config.json\n",
"Model weights saved in ./results/checkpoint-6500/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-6000] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-7000\n",
"Configuration saved in ./results/checkpoint-7000/config.json\n",
"Model weights saved in ./results/checkpoint-7000/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-6500] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-7500\n",
"Configuration saved in ./results/checkpoint-7500/config.json\n",
"Model weights saved in ./results/checkpoint-7500/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-7000] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-8000\n",
"Configuration saved in ./results/checkpoint-8000/config.json\n",
"Model weights saved in ./results/checkpoint-8000/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-7500] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-8500\n",
"Configuration saved in ./results/checkpoint-8500/config.json\n",
"Model weights saved in ./results/checkpoint-8500/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-8000] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-9000\n",
"Configuration saved in ./results/checkpoint-9000/config.json\n",
"Model weights saved in ./results/checkpoint-9000/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-8500] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-9500\n",
"Configuration saved in ./results/checkpoint-9500/config.json\n",
"Model weights saved in ./results/checkpoint-9500/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-9000] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-10000\n",
"Configuration saved in ./results/checkpoint-10000/config.json\n",
"Model weights saved in ./results/checkpoint-10000/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-9500] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-10500\n",
"Configuration saved in ./results/checkpoint-10500/config.json\n",
"Model weights saved in ./results/checkpoint-10500/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-10000] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-11000\n",
"Configuration saved in ./results/checkpoint-11000/config.json\n",
"Model weights saved in ./results/checkpoint-11000/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-10500] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-11500\n",
"Configuration saved in ./results/checkpoint-11500/config.json\n",
"Model weights saved in ./results/checkpoint-11500/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-11000] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-12000\n",
"Configuration saved in ./results/checkpoint-12000/config.json\n",
"Model weights saved in ./results/checkpoint-12000/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-11500] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-12500\n",
"Configuration saved in ./results/checkpoint-12500/config.json\n",
"Model weights saved in ./results/checkpoint-12500/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-12000] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-13000\n",
"Configuration saved in ./results/checkpoint-13000/config.json\n",
"Model weights saved in ./results/checkpoint-13000/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-12500] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-13500\n",
"Configuration saved in ./results/checkpoint-13500/config.json\n",
"Model weights saved in ./results/checkpoint-13500/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-13000] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-14000\n",
"Configuration saved in ./results/checkpoint-14000/config.json\n",
"Model weights saved in ./results/checkpoint-14000/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-13500] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-14500\n",
"Configuration saved in ./results/checkpoint-14500/config.json\n",
"Model weights saved in ./results/checkpoint-14500/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-14000] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-15000\n",
"Configuration saved in ./results/checkpoint-15000/config.json\n",
"Model weights saved in ./results/checkpoint-15000/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-14500] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-15500\n",
"Configuration saved in ./results/checkpoint-15500/config.json\n",
"Model weights saved in ./results/checkpoint-15500/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-15000] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-16000\n",
"Configuration saved in ./results/checkpoint-16000/config.json\n",
"Model weights saved in ./results/checkpoint-16000/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-15500] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-16500\n",
"Configuration saved in ./results/checkpoint-16500/config.json\n",
"Model weights saved in ./results/checkpoint-16500/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-16000] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-17000\n",
"Configuration saved in ./results/checkpoint-17000/config.json\n",
"Model weights saved in ./results/checkpoint-17000/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-16500] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-17500\n",
"Configuration saved in ./results/checkpoint-17500/config.json\n",
"Model weights saved in ./results/checkpoint-17500/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-17000] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-18000\n",
"Configuration saved in ./results/checkpoint-18000/config.json\n",
"Model weights saved in ./results/checkpoint-18000/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-17500] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-18500\n",
"Configuration saved in ./results/checkpoint-18500/config.json\n",
"Model weights saved in ./results/checkpoint-18500/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-18000] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-19000\n",
"Configuration saved in ./results/checkpoint-19000/config.json\n",
"Model weights saved in ./results/checkpoint-19000/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-18500] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-19500\n",
"Configuration saved in ./results/checkpoint-19500/config.json\n",
"Model weights saved in ./results/checkpoint-19500/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-19000] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-20000\n",
"Configuration saved in ./results/checkpoint-20000/config.json\n",
"Model weights saved in ./results/checkpoint-20000/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-19500] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-20500\n",
"Configuration saved in ./results/checkpoint-20500/config.json\n",
"Model weights saved in ./results/checkpoint-20500/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-20000] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-21000\n",
"Configuration saved in ./results/checkpoint-21000/config.json\n",
"Model weights saved in ./results/checkpoint-21000/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-20500] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-21500\n",
"Configuration saved in ./results/checkpoint-21500/config.json\n",
"Model weights saved in ./results/checkpoint-21500/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-21000] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-22000\n",
"Configuration saved in ./results/checkpoint-22000/config.json\n",
"Model weights saved in ./results/checkpoint-22000/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-21500] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-22500\n",
"Configuration saved in ./results/checkpoint-22500/config.json\n",
"Model weights saved in ./results/checkpoint-22500/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-22000] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-23000\n",
"Configuration saved in ./results/checkpoint-23000/config.json\n",
"Model weights saved in ./results/checkpoint-23000/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-22500] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-23500\n",
"Configuration saved in ./results/checkpoint-23500/config.json\n",
"Model weights saved in ./results/checkpoint-23500/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-23000] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-24000\n",
"Configuration saved in ./results/checkpoint-24000/config.json\n",
"Model weights saved in ./results/checkpoint-24000/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-23500] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-24500\n",
"Configuration saved in ./results/checkpoint-24500/config.json\n",
"Model weights saved in ./results/checkpoint-24500/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-24000] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-25000\n",
"Configuration saved in ./results/checkpoint-25000/config.json\n",
"Model weights saved in ./results/checkpoint-25000/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-24500] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-25500\n",
"Configuration saved in ./results/checkpoint-25500/config.json\n",
"Model weights saved in ./results/checkpoint-25500/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-25000] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-26000\n",
"Configuration saved in ./results/checkpoint-26000/config.json\n",
"Model weights saved in ./results/checkpoint-26000/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-25500] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-26500\n",
"Configuration saved in ./results/checkpoint-26500/config.json\n",
"Model weights saved in ./results/checkpoint-26500/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-26000] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-27000\n",
"Configuration saved in ./results/checkpoint-27000/config.json\n",
"Model weights saved in ./results/checkpoint-27000/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-26500] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-27500\n",
"Configuration saved in ./results/checkpoint-27500/config.json\n",
"Model weights saved in ./results/checkpoint-27500/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-27000] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-28000\n",
"Configuration saved in ./results/checkpoint-28000/config.json\n",
"Model weights saved in ./results/checkpoint-28000/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-27500] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-28500\n",
"Configuration saved in ./results/checkpoint-28500/config.json\n",
"Model weights saved in ./results/checkpoint-28500/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-28000] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-29000\n",
"Configuration saved in ./results/checkpoint-29000/config.json\n",
"Model weights saved in ./results/checkpoint-29000/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-28500] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-29500\n",
"Configuration saved in ./results/checkpoint-29500/config.json\n",
"Model weights saved in ./results/checkpoint-29500/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-29000] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-30000\n",
"Configuration saved in ./results/checkpoint-30000/config.json\n",
"Model weights saved in ./results/checkpoint-30000/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-29500] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-30500\n",
"Configuration saved in ./results/checkpoint-30500/config.json\n",
"Model weights saved in ./results/checkpoint-30500/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-30000] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-31000\n",
"Configuration saved in ./results/checkpoint-31000/config.json\n",
"Model weights saved in ./results/checkpoint-31000/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-30500] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-31500\n",
"Configuration saved in ./results/checkpoint-31500/config.json\n",
"Model weights saved in ./results/checkpoint-31500/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-31000] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-32000\n",
"Configuration saved in ./results/checkpoint-32000/config.json\n",
"Model weights saved in ./results/checkpoint-32000/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-31500] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-32500\n",
"Configuration saved in ./results/checkpoint-32500/config.json\n",
"Model weights saved in ./results/checkpoint-32500/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-32000] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-33000\n",
"Configuration saved in ./results/checkpoint-33000/config.json\n",
"Model weights saved in ./results/checkpoint-33000/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-32500] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-33500\n",
"Configuration saved in ./results/checkpoint-33500/config.json\n",
"Model weights saved in ./results/checkpoint-33500/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-33000] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-34000\n",
"Configuration saved in ./results/checkpoint-34000/config.json\n",
"Model weights saved in ./results/checkpoint-34000/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-33500] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-34500\n",
"Configuration saved in ./results/checkpoint-34500/config.json\n",
"Model weights saved in ./results/checkpoint-34500/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-34000] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-35000\n",
"Configuration saved in ./results/checkpoint-35000/config.json\n",
"Model weights saved in ./results/checkpoint-35000/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-34500] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-35500\n",
"Configuration saved in ./results/checkpoint-35500/config.json\n",
"Model weights saved in ./results/checkpoint-35500/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-35000] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-36000\n",
"Configuration saved in ./results/checkpoint-36000/config.json\n",
"Model weights saved in ./results/checkpoint-36000/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-35500] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-36500\n",
"Configuration saved in ./results/checkpoint-36500/config.json\n",
"Model weights saved in ./results/checkpoint-36500/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-36000] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-37000\n",
"Configuration saved in ./results/checkpoint-37000/config.json\n",
"Model weights saved in ./results/checkpoint-37000/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-36500] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-37500\n",
"Configuration saved in ./results/checkpoint-37500/config.json\n",
"Model weights saved in ./results/checkpoint-37500/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-37000] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-38000\n",
"Configuration saved in ./results/checkpoint-38000/config.json\n",
"Model weights saved in ./results/checkpoint-38000/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-37500] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-38500\n",
"Configuration saved in ./results/checkpoint-38500/config.json\n",
"Model weights saved in ./results/checkpoint-38500/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-38000] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-39000\n",
"Configuration saved in ./results/checkpoint-39000/config.json\n",
"Model weights saved in ./results/checkpoint-39000/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-38500] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-39500\n",
"Configuration saved in ./results/checkpoint-39500/config.json\n",
"Model weights saved in ./results/checkpoint-39500/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-39000] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-40000\n",
"Configuration saved in ./results/checkpoint-40000/config.json\n",
"Model weights saved in ./results/checkpoint-40000/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-39500] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-40500\n",
"Configuration saved in ./results/checkpoint-40500/config.json\n",
"Model weights saved in ./results/checkpoint-40500/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-40000] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-41000\n",
"Configuration saved in ./results/checkpoint-41000/config.json\n",
"Model weights saved in ./results/checkpoint-41000/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-40500] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-41500\n",
"Configuration saved in ./results/checkpoint-41500/config.json\n",
"Model weights saved in ./results/checkpoint-41500/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-41000] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-42000\n",
"Configuration saved in ./results/checkpoint-42000/config.json\n",
"Model weights saved in ./results/checkpoint-42000/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-41500] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-42500\n",
"Configuration saved in ./results/checkpoint-42500/config.json\n",
"Model weights saved in ./results/checkpoint-42500/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-42000] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-43000\n",
"Configuration saved in ./results/checkpoint-43000/config.json\n",
"Model weights saved in ./results/checkpoint-43000/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-42500] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-43500\n",
"Configuration saved in ./results/checkpoint-43500/config.json\n",
"Model weights saved in ./results/checkpoint-43500/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-43000] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-44000\n",
"Configuration saved in ./results/checkpoint-44000/config.json\n",
"Model weights saved in ./results/checkpoint-44000/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-43500] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-44500\n",
"Configuration saved in ./results/checkpoint-44500/config.json\n",
"Model weights saved in ./results/checkpoint-44500/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-44000] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-45000\n",
"Configuration saved in ./results/checkpoint-45000/config.json\n",
"Model weights saved in ./results/checkpoint-45000/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-44500] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-45500\n",
"Configuration saved in ./results/checkpoint-45500/config.json\n",
"Model weights saved in ./results/checkpoint-45500/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-45000] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-46000\n",
"Configuration saved in ./results/checkpoint-46000/config.json\n",
"Model weights saved in ./results/checkpoint-46000/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-45500] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-46500\n",
"Configuration saved in ./results/checkpoint-46500/config.json\n",
"Model weights saved in ./results/checkpoint-46500/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-46000] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-47000\n",
"Configuration saved in ./results/checkpoint-47000/config.json\n",
"Model weights saved in ./results/checkpoint-47000/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-46500] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-47500\n",
"Configuration saved in ./results/checkpoint-47500/config.json\n",
"Model weights saved in ./results/checkpoint-47500/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-47000] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-48000\n",
"Configuration saved in ./results/checkpoint-48000/config.json\n",
"Model weights saved in ./results/checkpoint-48000/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-47500] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-48500\n",
"Configuration saved in ./results/checkpoint-48500/config.json\n",
"Model weights saved in ./results/checkpoint-48500/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-48000] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-49000\n",
"Configuration saved in ./results/checkpoint-49000/config.json\n",
"Model weights saved in ./results/checkpoint-49000/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-48500] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-49500\n",
"Configuration saved in ./results/checkpoint-49500/config.json\n",
"Model weights saved in ./results/checkpoint-49500/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-49000] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-50000\n",
"Configuration saved in ./results/checkpoint-50000/config.json\n",
"Model weights saved in ./results/checkpoint-50000/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-49500] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-50500\n",
"Configuration saved in ./results/checkpoint-50500/config.json\n",
"Model weights saved in ./results/checkpoint-50500/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-50000] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-51000\n",
"Configuration saved in ./results/checkpoint-51000/config.json\n",
"Model weights saved in ./results/checkpoint-51000/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-50500] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-51500\n",
"Configuration saved in ./results/checkpoint-51500/config.json\n",
"Model weights saved in ./results/checkpoint-51500/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-51000] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-52000\n",
"Configuration saved in ./results/checkpoint-52000/config.json\n",
"Model weights saved in ./results/checkpoint-52000/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-51500] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-52500\n",
"Configuration saved in ./results/checkpoint-52500/config.json\n",
"Model weights saved in ./results/checkpoint-52500/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-52000] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-53000\n",
"Configuration saved in ./results/checkpoint-53000/config.json\n",
"Model weights saved in ./results/checkpoint-53000/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-52500] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-53500\n",
"Configuration saved in ./results/checkpoint-53500/config.json\n",
"Model weights saved in ./results/checkpoint-53500/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-53000] due to args.save_total_limit\n",
"Saving model checkpoint to ./results/checkpoint-54000\n",
"Configuration saved in ./results/checkpoint-54000/config.json\n",
"Model weights saved in ./results/checkpoint-54000/pytorch_model.bin\n",
"Deleting older checkpoint [results/checkpoint-53500] due to args.save_total_limit\n",
"\n",
"\n",
"Training completed. Do not forget to share your model on huggingface.co/models =)\n",
"\n",
"\n"
]
},
{
"output_type": "execute_result",
"data": {
"text/plain": [
"TrainOutput(global_step=54297, training_loss=0.537743896358476, metrics={'train_runtime': 1276.4291, 'train_samples_per_second': 680.599, 'train_steps_per_second': 42.538, 'total_flos': 8589565725967872.0, 'train_loss': 0.537743896358476, 'epoch': 3.0})"
]
},
"metadata": {},
"execution_count": 14
}
]
},
{
"cell_type": "code",
"source": [
"x_dev = [x[0] for x in io_read('/content/drive/MyDrive/ai-tech/eki/paranormal-or-skeptic/dev-0/in.tsv.xz')]\n",
"y_dev = [int(y) for y in io_read('/content/drive/MyDrive/ai-tech/eki/paranormal-or-skeptic/dev-0/expected.tsv')]\n",
"# x_test = [x[0] for x in io_read('/content/drive/MyDrive/ai-tech/eki/paranormal-or-skeptic/test-A/in.tsv.xz')]\n",
"dev_encodings = tokenizer(x_dev, truncation=True, padding='max_length', max_length=128)\n",
"dev_dataset = Dataset(dev_encodings, y_dev)"
],
"metadata": {
"id": "8EEK8D_2o9Xa"
},
"execution_count": 15,
"outputs": []
},
{
"cell_type": "code",
"source": [
"dev_predicted = trainer.predict(dev_dataset).predictions"
],
"metadata": {
"colab": {
"base_uri": "https://localhost:8080/",
"height": 92
},
"id": "vHsugxBnT1dt",
"outputId": "d636a78d-5de4-4d7a-eb96-3906fe5b2efd"
},
"execution_count": 21,
"outputs": [
{
"output_type": "stream",
"name": "stderr",
"text": [
"***** Running Prediction *****\n",
" Num examples = 5272\n",
" Batch size = 8\n"
]
},
{
"output_type": "display_data",
"data": {
"text/plain": [
"<IPython.core.display.HTML object>"
],
"text/html": [
"\n",
" <div>\n",
" \n",
" <progress value='1318' max='659' style='width:300px; height:20px; vertical-align: middle;'></progress>\n",
" [659/659 02:38]\n",
" </div>\n",
" "
]
},
"metadata": {}
}
]
},
{
"cell_type": "code",
"source": [
"dev_output = ['0' if x > y else '1' for x, y in dev_predicted]"
],
"metadata": {
"id": "vBNcVwM7T_Tu"
},
"execution_count": 22,
"outputs": []
},
{
"cell_type": "code",
"source": [
"io_write(dev_output, '/content/drive/MyDrive/ai-tech/eki/paranormal-or-skeptic/dev-0/out.tsv')"
],
"metadata": {
"id": "r-TmQcY-UCZF"
},
"execution_count": 23,
"outputs": []
},
{
"cell_type": "code",
"source": [
"x_test = [x[0] for x in io_read('/content/drive/MyDrive/ai-tech/eki/paranormal-or-skeptic/test-A/in.tsv.xz')]\n",
"y_test = [0 for x in x_test]\n",
"test_encodings = tokenizer(x_test, truncation=True, padding='max_length', max_length=128)\n",
"test_dataset = Dataset(test_encodings, y_test)\n",
"test_predicted = trainer.predict(test_dataset).predictions\n",
"test_output = ['0' if x > y else '1' for x, y in test_predicted]\n",
"io_write(test_output, '/content/drive/MyDrive/ai-tech/eki/paranormal-or-skeptic/test-A/out.tsv')"
],
"metadata": {
"colab": {
"base_uri": "https://localhost:8080/",
"height": 92
},
"id": "yopL_vgLUQwL",
"outputId": "e10be728-3057-4dbb-a169-8751e8574b15"
},
"execution_count": 24,
"outputs": [
{
"output_type": "stream",
"name": "stderr",
"text": [
"***** Running Prediction *****\n",
" Num examples = 5152\n",
" Batch size = 8\n"
]
},
{
"output_type": "display_data",
"data": {
"text/plain": [
"<IPython.core.display.HTML object>"
],
"text/html": [
"\n",
" <div>\n",
" \n",
" <progress value='1962' max='659' style='width:300px; height:20px; vertical-align: middle;'></progress>\n",
" [659/659 04:54]\n",
" </div>\n",
" "
]
},
"metadata": {}
}
]
},
{
"cell_type": "code",
"source": [
""
],
"metadata": {
"id": "iHVk2bWLVEx6"
},
"execution_count": null,
"outputs": []
}
]
}