diff --git a/projekt/FLAN_T5_sms_spam.ipynb b/projekt/FLAN_T5_sms_spam.ipynb
index 68423c7..c3b132a 100644
--- a/projekt/FLAN_T5_sms_spam.ipynb
+++ b/projekt/FLAN_T5_sms_spam.ipynb
@@ -13,10 +13,9 @@
"name": "python"
},
"gpuClass": "standard",
- "accelerator": "GPU",
"widgets": {
"application/vnd.jupyter.widget-state+json": {
- "e4bb6f2f32de48d4b1f6d7ecf97ce376": {
+ "a8e120a9a97d45d59fcf275af25a591e": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HBoxModel",
"model_module_version": "1.5.0",
@@ -31,14 +30,14 @@
"_view_name": "HBoxView",
"box_style": "",
"children": [
- "IPY_MODEL_3305b30f1bfa48e9b0c1ba3add06094e",
- "IPY_MODEL_a343619acbb745baa6aa561271ec8815",
- "IPY_MODEL_c493fc54d9eb421f96d6e8519c8a1b0e"
+ "IPY_MODEL_e665879731604133a593e13155f4e03b",
+ "IPY_MODEL_d451aa9d81ca4d5ea901297e702762c0",
+ "IPY_MODEL_a9edac4d193f4930aa691fa496badc64"
],
- "layout": "IPY_MODEL_12fd6daa8e604ecd9ad731b6296815da"
+ "layout": "IPY_MODEL_a21e8fec1d92496a835ae8ad71c287ab"
}
},
- "3305b30f1bfa48e9b0c1ba3add06094e": {
+ "e665879731604133a593e13155f4e03b": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HTMLModel",
"model_module_version": "1.5.0",
@@ -53,13 +52,13 @@
"_view_name": "HTMLView",
"description": "",
"description_tooltip": null,
- "layout": "IPY_MODEL_805f497aa3304353a1be8b4cc87bfb54",
+ "layout": "IPY_MODEL_d168c852a75a43f5addcfbc75c48ec14",
"placeholder": "",
- "style": "IPY_MODEL_594a6d13f81f479eb00fa45fd4094146",
+ "style": "IPY_MODEL_589f9c90c98b48bda9ecb020cb384eab",
"value": "Downloading builder script: 100%"
}
},
- "a343619acbb745baa6aa561271ec8815": {
+ "d451aa9d81ca4d5ea901297e702762c0": {
"model_module": "@jupyter-widgets/controls",
"model_name": "FloatProgressModel",
"model_module_version": "1.5.0",
@@ -75,15 +74,15 @@
"bar_style": "success",
"description": "",
"description_tooltip": null,
- "layout": "IPY_MODEL_236979048eb8461f9b7d8c4103905eed",
+ "layout": "IPY_MODEL_e35fb285260b4b86aa9854eac11a6dfd",
"max": 3208,
"min": 0,
"orientation": "horizontal",
- "style": "IPY_MODEL_4620faf461ca449a88de45e86467e265",
+ "style": "IPY_MODEL_f505b8ea01ff4e2f90edf1d08c5096b1",
"value": 3208
}
},
- "c493fc54d9eb421f96d6e8519c8a1b0e": {
+ "a9edac4d193f4930aa691fa496badc64": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HTMLModel",
"model_module_version": "1.5.0",
@@ -98,13 +97,13 @@
"_view_name": "HTMLView",
"description": "",
"description_tooltip": null,
- "layout": "IPY_MODEL_8dc2f0f2e66741edbccab7abaaf634ce",
+ "layout": "IPY_MODEL_0baf1fcb54e945679e3591276182aa9e",
"placeholder": "",
- "style": "IPY_MODEL_0d49bfb55dfd4090ba57c544eaa97902",
- "value": " 3.21k/3.21k [00:00<00:00, 139kB/s]"
+ "style": "IPY_MODEL_2d57d4b6086e47e1a7d6a9a1375cc49f",
+ "value": " 3.21k/3.21k [00:00<00:00, 82.3kB/s]"
}
},
- "12fd6daa8e604ecd9ad731b6296815da": {
+ "a21e8fec1d92496a835ae8ad71c287ab": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
@@ -156,7 +155,7 @@
"width": null
}
},
- "805f497aa3304353a1be8b4cc87bfb54": {
+ "d168c852a75a43f5addcfbc75c48ec14": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
@@ -208,7 +207,7 @@
"width": null
}
},
- "594a6d13f81f479eb00fa45fd4094146": {
+ "589f9c90c98b48bda9ecb020cb384eab": {
"model_module": "@jupyter-widgets/controls",
"model_name": "DescriptionStyleModel",
"model_module_version": "1.5.0",
@@ -223,7 +222,7 @@
"description_width": ""
}
},
- "236979048eb8461f9b7d8c4103905eed": {
+ "e35fb285260b4b86aa9854eac11a6dfd": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
@@ -275,7 +274,7 @@
"width": null
}
},
- "4620faf461ca449a88de45e86467e265": {
+ "f505b8ea01ff4e2f90edf1d08c5096b1": {
"model_module": "@jupyter-widgets/controls",
"model_name": "ProgressStyleModel",
"model_module_version": "1.5.0",
@@ -291,7 +290,7 @@
"description_width": ""
}
},
- "8dc2f0f2e66741edbccab7abaaf634ce": {
+ "0baf1fcb54e945679e3591276182aa9e": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
@@ -343,7 +342,7 @@
"width": null
}
},
- "0d49bfb55dfd4090ba57c544eaa97902": {
+ "2d57d4b6086e47e1a7d6a9a1375cc49f": {
"model_module": "@jupyter-widgets/controls",
"model_name": "DescriptionStyleModel",
"model_module_version": "1.5.0",
@@ -358,7 +357,7 @@
"description_width": ""
}
},
- "4084f218fca64fc9b765e04d0cc073ac": {
+ "564f30aef6c34efa952fdd1402627d13": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HBoxModel",
"model_module_version": "1.5.0",
@@ -373,14 +372,14 @@
"_view_name": "HBoxView",
"box_style": "",
"children": [
- "IPY_MODEL_fec67d95a5904ac199f6648a34ef1ff9",
- "IPY_MODEL_a734d44f6baf4a5f8dfda576c09fffca",
- "IPY_MODEL_3fc2d009da594365854aa11be804b388"
+ "IPY_MODEL_0ee3c4b36db247d09e7fb9e68e856abb",
+ "IPY_MODEL_03ee22d44e2141d99e54bbd59246b328",
+ "IPY_MODEL_19465851c65e445fbaed11e33ac09098"
],
- "layout": "IPY_MODEL_45c7d35932ec44bcb2ccdc73f0ae6b46"
+ "layout": "IPY_MODEL_6a7e920546444da7bf855620f00c45e0"
}
},
- "fec67d95a5904ac199f6648a34ef1ff9": {
+ "0ee3c4b36db247d09e7fb9e68e856abb": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HTMLModel",
"model_module_version": "1.5.0",
@@ -395,13 +394,13 @@
"_view_name": "HTMLView",
"description": "",
"description_tooltip": null,
- "layout": "IPY_MODEL_0c1c3db046f24599b27daa44217f48d2",
+ "layout": "IPY_MODEL_e8b69414b5004f489f5c6793b6cc0746",
"placeholder": "",
- "style": "IPY_MODEL_c3f9ed611a154e22b875d0696ef6022d",
+ "style": "IPY_MODEL_474f0c044be14860b6a38321281d0d1f",
"value": "Downloading metadata: 100%"
}
},
- "a734d44f6baf4a5f8dfda576c09fffca": {
+ "03ee22d44e2141d99e54bbd59246b328": {
"model_module": "@jupyter-widgets/controls",
"model_name": "FloatProgressModel",
"model_module_version": "1.5.0",
@@ -417,15 +416,15 @@
"bar_style": "success",
"description": "",
"description_tooltip": null,
- "layout": "IPY_MODEL_7fd51c34909b41a8884fa358cccdbf48",
+ "layout": "IPY_MODEL_f2861641cda34f2786112b28bac2b36f",
"max": 1687,
"min": 0,
"orientation": "horizontal",
- "style": "IPY_MODEL_9d9edc5471de40c2b7c2b9156637997d",
+ "style": "IPY_MODEL_f07c5cffb60c4a89bb29c49811d73aba",
"value": 1687
}
},
- "3fc2d009da594365854aa11be804b388": {
+ "19465851c65e445fbaed11e33ac09098": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HTMLModel",
"model_module_version": "1.5.0",
@@ -440,13 +439,13 @@
"_view_name": "HTMLView",
"description": "",
"description_tooltip": null,
- "layout": "IPY_MODEL_02c64bf3ff95438cb43c7dc52034cc43",
+ "layout": "IPY_MODEL_e502595b7e6b45498d2018e62e6fa6f2",
"placeholder": "",
- "style": "IPY_MODEL_f0b71ecb6b1c4d1190ca899af7d3e82c",
- "value": " 1.69k/1.69k [00:00<00:00, 37.7kB/s]"
+ "style": "IPY_MODEL_80b9042089364fae8e0cffc7a49203c1",
+ "value": " 1.69k/1.69k [00:00<00:00, 43.9kB/s]"
}
},
- "45c7d35932ec44bcb2ccdc73f0ae6b46": {
+ "6a7e920546444da7bf855620f00c45e0": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
@@ -498,7 +497,7 @@
"width": null
}
},
- "0c1c3db046f24599b27daa44217f48d2": {
+ "e8b69414b5004f489f5c6793b6cc0746": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
@@ -550,7 +549,7 @@
"width": null
}
},
- "c3f9ed611a154e22b875d0696ef6022d": {
+ "474f0c044be14860b6a38321281d0d1f": {
"model_module": "@jupyter-widgets/controls",
"model_name": "DescriptionStyleModel",
"model_module_version": "1.5.0",
@@ -565,7 +564,7 @@
"description_width": ""
}
},
- "7fd51c34909b41a8884fa358cccdbf48": {
+ "f2861641cda34f2786112b28bac2b36f": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
@@ -617,7 +616,7 @@
"width": null
}
},
- "9d9edc5471de40c2b7c2b9156637997d": {
+ "f07c5cffb60c4a89bb29c49811d73aba": {
"model_module": "@jupyter-widgets/controls",
"model_name": "ProgressStyleModel",
"model_module_version": "1.5.0",
@@ -633,7 +632,7 @@
"description_width": ""
}
},
- "02c64bf3ff95438cb43c7dc52034cc43": {
+ "e502595b7e6b45498d2018e62e6fa6f2": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
@@ -685,7 +684,7 @@
"width": null
}
},
- "f0b71ecb6b1c4d1190ca899af7d3e82c": {
+ "80b9042089364fae8e0cffc7a49203c1": {
"model_module": "@jupyter-widgets/controls",
"model_name": "DescriptionStyleModel",
"model_module_version": "1.5.0",
@@ -700,7 +699,7 @@
"description_width": ""
}
},
- "8cae9c49e18f43248072b5e059429f6d": {
+ "ae89e755c6e64ab2a3101913d08820ef": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HBoxModel",
"model_module_version": "1.5.0",
@@ -715,14 +714,14 @@
"_view_name": "HBoxView",
"box_style": "",
"children": [
- "IPY_MODEL_88c8adca128b44c1bbbec437630c2074",
- "IPY_MODEL_0f73f5e2c8af41eaae5f1c27f212da8b",
- "IPY_MODEL_255b4480e11f4b3e892a5d2dc6abfd4b"
+ "IPY_MODEL_5181e91045d240308e1371af2a560d56",
+ "IPY_MODEL_3551b2e33fac44f38988c07fc5819b23",
+ "IPY_MODEL_9a418f8782a842898d730f8cbc4fe311"
],
- "layout": "IPY_MODEL_a96eab6312f6447b9eff3f914c5a6827"
+ "layout": "IPY_MODEL_c9d1c36d765345e183d4cdf911ad07b3"
}
},
- "88c8adca128b44c1bbbec437630c2074": {
+ "5181e91045d240308e1371af2a560d56": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HTMLModel",
"model_module_version": "1.5.0",
@@ -737,13 +736,13 @@
"_view_name": "HTMLView",
"description": "",
"description_tooltip": null,
- "layout": "IPY_MODEL_063059d53dc942d1aee9e3fe2f27687d",
+ "layout": "IPY_MODEL_75a75524abc04743a7533f9030769bb2",
"placeholder": "",
- "style": "IPY_MODEL_ca50704df2cc430fae6b5902c5399414",
+ "style": "IPY_MODEL_84e9b5aef48c4d429742d0fde6fc125e",
"value": "Downloading readme: 100%"
}
},
- "0f73f5e2c8af41eaae5f1c27f212da8b": {
+ "3551b2e33fac44f38988c07fc5819b23": {
"model_module": "@jupyter-widgets/controls",
"model_name": "FloatProgressModel",
"model_module_version": "1.5.0",
@@ -759,15 +758,15 @@
"bar_style": "success",
"description": "",
"description_tooltip": null,
- "layout": "IPY_MODEL_64f5cdd8d1c14be79278ee4de89993d1",
+ "layout": "IPY_MODEL_24492355887d405b98f8f42c4be836b6",
"max": 4872,
"min": 0,
"orientation": "horizontal",
- "style": "IPY_MODEL_f065dcd7d1d34cb6806f2eb28bb3cd6f",
+ "style": "IPY_MODEL_5c7cbcd333f145488ab9411512467c19",
"value": 4872
}
},
- "255b4480e11f4b3e892a5d2dc6abfd4b": {
+ "9a418f8782a842898d730f8cbc4fe311": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HTMLModel",
"model_module_version": "1.5.0",
@@ -782,13 +781,13 @@
"_view_name": "HTMLView",
"description": "",
"description_tooltip": null,
- "layout": "IPY_MODEL_67663505c87640b58e04d3ce028537ea",
+ "layout": "IPY_MODEL_6cc08744eb594bbc913da9fc2a15c939",
"placeholder": "",
- "style": "IPY_MODEL_f5a17bc6f9f94b2ca119528b0ca2d456",
- "value": " 4.87k/4.87k [00:00<00:00, 116kB/s]"
+ "style": "IPY_MODEL_17c7c64eafb14d168bd386cae79902aa",
+ "value": " 4.87k/4.87k [00:00<00:00, 82.7kB/s]"
}
},
- "a96eab6312f6447b9eff3f914c5a6827": {
+ "c9d1c36d765345e183d4cdf911ad07b3": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
@@ -840,7 +839,7 @@
"width": null
}
},
- "063059d53dc942d1aee9e3fe2f27687d": {
+ "75a75524abc04743a7533f9030769bb2": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
@@ -892,7 +891,7 @@
"width": null
}
},
- "ca50704df2cc430fae6b5902c5399414": {
+ "84e9b5aef48c4d429742d0fde6fc125e": {
"model_module": "@jupyter-widgets/controls",
"model_name": "DescriptionStyleModel",
"model_module_version": "1.5.0",
@@ -907,7 +906,7 @@
"description_width": ""
}
},
- "64f5cdd8d1c14be79278ee4de89993d1": {
+ "24492355887d405b98f8f42c4be836b6": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
@@ -959,7 +958,7 @@
"width": null
}
},
- "f065dcd7d1d34cb6806f2eb28bb3cd6f": {
+ "5c7cbcd333f145488ab9411512467c19": {
"model_module": "@jupyter-widgets/controls",
"model_name": "ProgressStyleModel",
"model_module_version": "1.5.0",
@@ -975,7 +974,7 @@
"description_width": ""
}
},
- "67663505c87640b58e04d3ce028537ea": {
+ "6cc08744eb594bbc913da9fc2a15c939": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
@@ -1027,7 +1026,7 @@
"width": null
}
},
- "f5a17bc6f9f94b2ca119528b0ca2d456": {
+ "17c7c64eafb14d168bd386cae79902aa": {
"model_module": "@jupyter-widgets/controls",
"model_name": "DescriptionStyleModel",
"model_module_version": "1.5.0",
@@ -1042,7 +1041,7 @@
"description_width": ""
}
},
- "ec0f16c3cbb14d9287e148887127219b": {
+ "db79fbdb9e25432a8f95221cc0bed971": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HBoxModel",
"model_module_version": "1.5.0",
@@ -1057,14 +1056,14 @@
"_view_name": "HBoxView",
"box_style": "",
"children": [
- "IPY_MODEL_ba832204e1d4413f8b8a15e10bac7d95",
- "IPY_MODEL_8179dbec98b7466ea2195affb0568498",
- "IPY_MODEL_7e9abda7b55c459b8a9888edaf1cc116"
+ "IPY_MODEL_3c14418eb66d4392bcaa64ca3394084c",
+ "IPY_MODEL_3144d6d798df44afacc4f34bed90f0e4",
+ "IPY_MODEL_9259558984d847ae99435ef4e312e3b7"
],
- "layout": "IPY_MODEL_64c8860ae16848af9b04bb41955a8446"
+ "layout": "IPY_MODEL_1b05d118f33949dfa5daf732520f9c62"
}
},
- "ba832204e1d4413f8b8a15e10bac7d95": {
+ "3c14418eb66d4392bcaa64ca3394084c": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HTMLModel",
"model_module_version": "1.5.0",
@@ -1079,13 +1078,13 @@
"_view_name": "HTMLView",
"description": "",
"description_tooltip": null,
- "layout": "IPY_MODEL_64fe250082bf4d4fb126a319920d2f0a",
+ "layout": "IPY_MODEL_dc652b3692ed4da6b3fd959acb773b66",
"placeholder": "",
- "style": "IPY_MODEL_0b278b6f5da94921afbacb873c15d9c9",
+ "style": "IPY_MODEL_ce7027fdd804415db2c60560be3c66e9",
"value": "Downloading data: 100%"
}
},
- "8179dbec98b7466ea2195affb0568498": {
+ "3144d6d798df44afacc4f34bed90f0e4": {
"model_module": "@jupyter-widgets/controls",
"model_name": "FloatProgressModel",
"model_module_version": "1.5.0",
@@ -1101,15 +1100,15 @@
"bar_style": "success",
"description": "",
"description_tooltip": null,
- "layout": "IPY_MODEL_b688bc7f34e941488831da5d4aed9396",
+ "layout": "IPY_MODEL_3ab3add96759441eba1571795b0edaae",
"max": 203415,
"min": 0,
"orientation": "horizontal",
- "style": "IPY_MODEL_44cec66cbaeb49abb26dbfc5420ceacb",
+ "style": "IPY_MODEL_d88268e0bb52404e86a37b01fdac5957",
"value": 203415
}
},
- "7e9abda7b55c459b8a9888edaf1cc116": {
+ "9259558984d847ae99435ef4e312e3b7": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HTMLModel",
"model_module_version": "1.5.0",
@@ -1124,13 +1123,13 @@
"_view_name": "HTMLView",
"description": "",
"description_tooltip": null,
- "layout": "IPY_MODEL_67a750dcfa8b44499956572fda3dbacf",
+ "layout": "IPY_MODEL_dae3457866114776818227ec44284ced",
"placeholder": "",
- "style": "IPY_MODEL_edad6f2eb6704468bd06006c50697f86",
- "value": " 203k/203k [00:00<00:00, 171kB/s]"
+ "style": "IPY_MODEL_2aab0424351e4b9594cdcf631632c690",
+ "value": " 203k/203k [00:00<00:00, 400kB/s]"
}
},
- "64c8860ae16848af9b04bb41955a8446": {
+ "1b05d118f33949dfa5daf732520f9c62": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
@@ -1182,7 +1181,7 @@
"width": null
}
},
- "64fe250082bf4d4fb126a319920d2f0a": {
+ "dc652b3692ed4da6b3fd959acb773b66": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
@@ -1234,7 +1233,7 @@
"width": null
}
},
- "0b278b6f5da94921afbacb873c15d9c9": {
+ "ce7027fdd804415db2c60560be3c66e9": {
"model_module": "@jupyter-widgets/controls",
"model_name": "DescriptionStyleModel",
"model_module_version": "1.5.0",
@@ -1249,7 +1248,7 @@
"description_width": ""
}
},
- "b688bc7f34e941488831da5d4aed9396": {
+ "3ab3add96759441eba1571795b0edaae": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
@@ -1301,7 +1300,7 @@
"width": null
}
},
- "44cec66cbaeb49abb26dbfc5420ceacb": {
+ "d88268e0bb52404e86a37b01fdac5957": {
"model_module": "@jupyter-widgets/controls",
"model_name": "ProgressStyleModel",
"model_module_version": "1.5.0",
@@ -1317,7 +1316,7 @@
"description_width": ""
}
},
- "67a750dcfa8b44499956572fda3dbacf": {
+ "dae3457866114776818227ec44284ced": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
@@ -1369,7 +1368,7 @@
"width": null
}
},
- "edad6f2eb6704468bd06006c50697f86": {
+ "2aab0424351e4b9594cdcf631632c690": {
"model_module": "@jupyter-widgets/controls",
"model_name": "DescriptionStyleModel",
"model_module_version": "1.5.0",
@@ -1384,7 +1383,7 @@
"description_width": ""
}
},
- "699a1bdf38ca48e2affc3c6bd771852f": {
+ "6fd330314de74ccc983da44783bcac7d": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HBoxModel",
"model_module_version": "1.5.0",
@@ -1399,14 +1398,14 @@
"_view_name": "HBoxView",
"box_style": "",
"children": [
- "IPY_MODEL_4e5a92d4acdc43d487290ffd8a842ea5",
- "IPY_MODEL_8bc8c44b6324478a8209094f9b7e9ccd",
- "IPY_MODEL_e95f31e693674a0aae8de0e167a49daf"
+ "IPY_MODEL_209778054761411190cf91741a43b2d3",
+ "IPY_MODEL_5d45d48713924a8d805368867c7bb5e0",
+ "IPY_MODEL_fa0715f8876c401ba6a2681d0abf7e5a"
],
- "layout": "IPY_MODEL_069a68aed2bb4d37a00c9c0feedd3e17"
+ "layout": "IPY_MODEL_b6afff9e8ee44d42814dc84670ed999f"
}
},
- "4e5a92d4acdc43d487290ffd8a842ea5": {
+ "209778054761411190cf91741a43b2d3": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HTMLModel",
"model_module_version": "1.5.0",
@@ -1421,13 +1420,13 @@
"_view_name": "HTMLView",
"description": "",
"description_tooltip": null,
- "layout": "IPY_MODEL_9930f171a6db47939e996016cb49fe20",
+ "layout": "IPY_MODEL_7b636bb9a4724d2783148aa8d6aa791e",
"placeholder": "",
- "style": "IPY_MODEL_ddd0c0abba074aa7a33b5c825ccf8760",
- "value": "Generating train split: 100%"
+ "style": "IPY_MODEL_dd488415b19349d8a5306153907ba902",
+ "value": "Generating train split: 89%"
}
},
- "8bc8c44b6324478a8209094f9b7e9ccd": {
+ "5d45d48713924a8d805368867c7bb5e0": {
"model_module": "@jupyter-widgets/controls",
"model_name": "FloatProgressModel",
"model_module_version": "1.5.0",
@@ -1443,15 +1442,15 @@
"bar_style": "",
"description": "",
"description_tooltip": null,
- "layout": "IPY_MODEL_8bbb7307312648b0afb901f701a4e466",
+ "layout": "IPY_MODEL_174930418d51405f969eaa6b5aa67dde",
"max": 5574,
"min": 0,
"orientation": "horizontal",
- "style": "IPY_MODEL_4a2eb48d3583446598fdd1b7175c96fd",
+ "style": "IPY_MODEL_75f8a0de12974b84a4b8bde1a16c33c4",
"value": 5574
}
},
- "e95f31e693674a0aae8de0e167a49daf": {
+ "fa0715f8876c401ba6a2681d0abf7e5a": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HTMLModel",
"model_module_version": "1.5.0",
@@ -1466,13 +1465,13 @@
"_view_name": "HTMLView",
"description": "",
"description_tooltip": null,
- "layout": "IPY_MODEL_b3eae90c5aea409ab1a2c541948658f8",
+ "layout": "IPY_MODEL_101281b2ecf441a39abc9d4e49398e43",
"placeholder": "",
- "style": "IPY_MODEL_41b5186c2e194402a1e18f1c1a9f18a4",
- "value": " 5574/5574 [00:12<00:00, 7617.98 examples/s]"
+ "style": "IPY_MODEL_20ad8bc6a1c94be090190ea3de64a10f",
+ "value": " 4957/5574 [00:00<00:00, 8825.97 examples/s]"
}
},
- "069a68aed2bb4d37a00c9c0feedd3e17": {
+ "b6afff9e8ee44d42814dc84670ed999f": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
@@ -1524,7 +1523,7 @@
"width": null
}
},
- "9930f171a6db47939e996016cb49fe20": {
+ "7b636bb9a4724d2783148aa8d6aa791e": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
@@ -1576,7 +1575,7 @@
"width": null
}
},
- "ddd0c0abba074aa7a33b5c825ccf8760": {
+ "dd488415b19349d8a5306153907ba902": {
"model_module": "@jupyter-widgets/controls",
"model_name": "DescriptionStyleModel",
"model_module_version": "1.5.0",
@@ -1591,7 +1590,7 @@
"description_width": ""
}
},
- "8bbb7307312648b0afb901f701a4e466": {
+ "174930418d51405f969eaa6b5aa67dde": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
@@ -1643,7 +1642,7 @@
"width": null
}
},
- "4a2eb48d3583446598fdd1b7175c96fd": {
+ "75f8a0de12974b84a4b8bde1a16c33c4": {
"model_module": "@jupyter-widgets/controls",
"model_name": "ProgressStyleModel",
"model_module_version": "1.5.0",
@@ -1659,7 +1658,7 @@
"description_width": ""
}
},
- "b3eae90c5aea409ab1a2c541948658f8": {
+ "101281b2ecf441a39abc9d4e49398e43": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
@@ -1711,7 +1710,7 @@
"width": null
}
},
- "41b5186c2e194402a1e18f1c1a9f18a4": {
+ "20ad8bc6a1c94be090190ea3de64a10f": {
"model_module": "@jupyter-widgets/controls",
"model_name": "DescriptionStyleModel",
"model_module_version": "1.5.0",
@@ -1726,7 +1725,7 @@
"description_width": ""
}
},
- "3c84850ebe3e45d297d3bfa8a12f1b86": {
+ "99cbe58514e3460398f032b93a57d068": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HBoxModel",
"model_module_version": "1.5.0",
@@ -1741,14 +1740,14 @@
"_view_name": "HBoxView",
"box_style": "",
"children": [
- "IPY_MODEL_8a5f71a073ca4b0cb929ba3cf31fd296",
- "IPY_MODEL_b5be73849b61415fb9187d011261be1e",
- "IPY_MODEL_46a51fbd984344b1958889c608ea04ed"
+ "IPY_MODEL_797dcecef4874b9f8de64e643661c637",
+ "IPY_MODEL_9d97e656e72d4f99a2b4669e811918cd",
+ "IPY_MODEL_df4a5058866c4ec8875cfb5189c738c5"
],
- "layout": "IPY_MODEL_0d25092adebd4f94b1799df263ccaf55"
+ "layout": "IPY_MODEL_fcd408ec35cd44f1b7309931256adfaa"
}
},
- "8a5f71a073ca4b0cb929ba3cf31fd296": {
+ "797dcecef4874b9f8de64e643661c637": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HTMLModel",
"model_module_version": "1.5.0",
@@ -1763,13 +1762,13 @@
"_view_name": "HTMLView",
"description": "",
"description_tooltip": null,
- "layout": "IPY_MODEL_e4814d2ee2df4f6a9f411b134ebca546",
+ "layout": "IPY_MODEL_2ab3431929a540609d0edac159d63d41",
"placeholder": "",
- "style": "IPY_MODEL_09669f6ac72b45689e082b4fb489a23f",
+ "style": "IPY_MODEL_fa0e9bb620c04cca998be8929f50c4d8",
"value": "100%"
}
},
- "b5be73849b61415fb9187d011261be1e": {
+ "9d97e656e72d4f99a2b4669e811918cd": {
"model_module": "@jupyter-widgets/controls",
"model_name": "FloatProgressModel",
"model_module_version": "1.5.0",
@@ -1785,15 +1784,15 @@
"bar_style": "success",
"description": "",
"description_tooltip": null,
- "layout": "IPY_MODEL_7afda94f85794acf882856b760a3eb63",
+ "layout": "IPY_MODEL_4d131181a5fa4f0880946ef5cd984790",
"max": 1,
"min": 0,
"orientation": "horizontal",
- "style": "IPY_MODEL_a70df5e47adb4a4d8b80a543dedfd708",
+ "style": "IPY_MODEL_2f3024af40c346a188793eeddff5848b",
"value": 1
}
},
- "46a51fbd984344b1958889c608ea04ed": {
+ "df4a5058866c4ec8875cfb5189c738c5": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HTMLModel",
"model_module_version": "1.5.0",
@@ -1808,13 +1807,13 @@
"_view_name": "HTMLView",
"description": "",
"description_tooltip": null,
- "layout": "IPY_MODEL_140058b69379422797bdc22374192bd6",
+ "layout": "IPY_MODEL_914ceee224b244b9ac0492305fb1fb24",
"placeholder": "",
- "style": "IPY_MODEL_8aabd23e2fa242e4b8cf4ef43fbebe2e",
- "value": " 1/1 [00:00<00:00, 13.35it/s]"
+ "style": "IPY_MODEL_5e394d73c2df4d34b39989cd1b24dc57",
+ "value": " 1/1 [00:00<00:00, 24.99it/s]"
}
},
- "0d25092adebd4f94b1799df263ccaf55": {
+ "fcd408ec35cd44f1b7309931256adfaa": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
@@ -1866,7 +1865,7 @@
"width": null
}
},
- "e4814d2ee2df4f6a9f411b134ebca546": {
+ "2ab3431929a540609d0edac159d63d41": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
@@ -1918,7 +1917,7 @@
"width": null
}
},
- "09669f6ac72b45689e082b4fb489a23f": {
+ "fa0e9bb620c04cca998be8929f50c4d8": {
"model_module": "@jupyter-widgets/controls",
"model_name": "DescriptionStyleModel",
"model_module_version": "1.5.0",
@@ -1933,7 +1932,7 @@
"description_width": ""
}
},
- "7afda94f85794acf882856b760a3eb63": {
+ "4d131181a5fa4f0880946ef5cd984790": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
@@ -1985,7 +1984,7 @@
"width": null
}
},
- "a70df5e47adb4a4d8b80a543dedfd708": {
+ "2f3024af40c346a188793eeddff5848b": {
"model_module": "@jupyter-widgets/controls",
"model_name": "ProgressStyleModel",
"model_module_version": "1.5.0",
@@ -2001,7 +2000,7 @@
"description_width": ""
}
},
- "140058b69379422797bdc22374192bd6": {
+ "914ceee224b244b9ac0492305fb1fb24": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
@@ -2053,7 +2052,7 @@
"width": null
}
},
- "8aabd23e2fa242e4b8cf4ef43fbebe2e": {
+ "5e394d73c2df4d34b39989cd1b24dc57": {
"model_module": "@jupyter-widgets/controls",
"model_name": "DescriptionStyleModel",
"model_module_version": "1.5.0",
@@ -2068,7 +2067,7 @@
"description_width": ""
}
},
- "040698c1b4be4adebfe751751a64c11d": {
+ "6fb269ceeada49c19adf46819664fa98": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HBoxModel",
"model_module_version": "1.5.0",
@@ -2083,14 +2082,14 @@
"_view_name": "HBoxView",
"box_style": "",
"children": [
- "IPY_MODEL_11b4ddede4494fe093329c50097b7df5",
- "IPY_MODEL_7986c625c9c34d039fad240333d0da08",
- "IPY_MODEL_b35a6f8e81184f81990a0111cc5c6ca8"
+ "IPY_MODEL_341f67fcddff4a91813fb1331fd63c3e",
+ "IPY_MODEL_33c7a0d0629342288601999a3b11d71c",
+ "IPY_MODEL_87d7f2540c724ba88b6f972049043702"
],
- "layout": "IPY_MODEL_2968992398a94adeb626eec2f45a8699"
+ "layout": "IPY_MODEL_36111c073ea34489886c767532713233"
}
},
- "11b4ddede4494fe093329c50097b7df5": {
+ "341f67fcddff4a91813fb1331fd63c3e": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HTMLModel",
"model_module_version": "1.5.0",
@@ -2105,13 +2104,13 @@
"_view_name": "HTMLView",
"description": "",
"description_tooltip": null,
- "layout": "IPY_MODEL_c9f8f67483fb45c8a6b59fceae40fe42",
+ "layout": "IPY_MODEL_c05a5532720d47e39e6cb710617aab67",
"placeholder": "",
- "style": "IPY_MODEL_c5a862e7d71c430c865fa87dc21b1f6d",
+ "style": "IPY_MODEL_458619b05af848fe8f40fac408e4c521",
"value": "Downloading (…)okenizer_config.json: 100%"
}
},
- "7986c625c9c34d039fad240333d0da08": {
+ "33c7a0d0629342288601999a3b11d71c": {
"model_module": "@jupyter-widgets/controls",
"model_name": "FloatProgressModel",
"model_module_version": "1.5.0",
@@ -2127,15 +2126,15 @@
"bar_style": "success",
"description": "",
"description_tooltip": null,
- "layout": "IPY_MODEL_d69171bdd6544c8ab9e96f3f3dfe7f92",
+ "layout": "IPY_MODEL_3cf20c5c605b46e1bc4890769cdeffe3",
"max": 2537,
"min": 0,
"orientation": "horizontal",
- "style": "IPY_MODEL_9cca59c67c5f452eb1d9e8dd22296968",
+ "style": "IPY_MODEL_15c19b89e55243cc88e77c56895d56b4",
"value": 2537
}
},
- "b35a6f8e81184f81990a0111cc5c6ca8": {
+ "87d7f2540c724ba88b6f972049043702": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HTMLModel",
"model_module_version": "1.5.0",
@@ -2150,13 +2149,13 @@
"_view_name": "HTMLView",
"description": "",
"description_tooltip": null,
- "layout": "IPY_MODEL_0f18ab0690ce4bc3b9b7c2f4d10c2049",
+ "layout": "IPY_MODEL_b4dd2e86dd6a4d579f315293d4b0ba21",
"placeholder": "",
- "style": "IPY_MODEL_af26b98c1e3440daa11e104ed1c8b7e4",
- "value": " 2.54k/2.54k [00:00<00:00, 97.2kB/s]"
+ "style": "IPY_MODEL_60577d05c1ad4acea832bd4e34efa6f4",
+ "value": " 2.54k/2.54k [00:00<00:00, 102kB/s]"
}
},
- "2968992398a94adeb626eec2f45a8699": {
+ "36111c073ea34489886c767532713233": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
@@ -2208,7 +2207,7 @@
"width": null
}
},
- "c9f8f67483fb45c8a6b59fceae40fe42": {
+ "c05a5532720d47e39e6cb710617aab67": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
@@ -2260,7 +2259,7 @@
"width": null
}
},
- "c5a862e7d71c430c865fa87dc21b1f6d": {
+ "458619b05af848fe8f40fac408e4c521": {
"model_module": "@jupyter-widgets/controls",
"model_name": "DescriptionStyleModel",
"model_module_version": "1.5.0",
@@ -2275,7 +2274,7 @@
"description_width": ""
}
},
- "d69171bdd6544c8ab9e96f3f3dfe7f92": {
+ "3cf20c5c605b46e1bc4890769cdeffe3": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
@@ -2327,7 +2326,7 @@
"width": null
}
},
- "9cca59c67c5f452eb1d9e8dd22296968": {
+ "15c19b89e55243cc88e77c56895d56b4": {
"model_module": "@jupyter-widgets/controls",
"model_name": "ProgressStyleModel",
"model_module_version": "1.5.0",
@@ -2343,7 +2342,7 @@
"description_width": ""
}
},
- "0f18ab0690ce4bc3b9b7c2f4d10c2049": {
+ "b4dd2e86dd6a4d579f315293d4b0ba21": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
@@ -2395,7 +2394,7 @@
"width": null
}
},
- "af26b98c1e3440daa11e104ed1c8b7e4": {
+ "60577d05c1ad4acea832bd4e34efa6f4": {
"model_module": "@jupyter-widgets/controls",
"model_name": "DescriptionStyleModel",
"model_module_version": "1.5.0",
@@ -2410,7 +2409,7 @@
"description_width": ""
}
},
- "be9060616d68475ea2e4674f7e460566": {
+ "4f67d0fe28914c1bb3d1057225c409cd": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HBoxModel",
"model_module_version": "1.5.0",
@@ -2425,14 +2424,14 @@
"_view_name": "HBoxView",
"box_style": "",
"children": [
- "IPY_MODEL_264afd978de54dbeaa1b711e4c0b1c07",
- "IPY_MODEL_bbcefda6eea74b8ea8313e4f7167df65",
- "IPY_MODEL_68d85f6957ea4807a1fe7c82c9a7bc06"
+ "IPY_MODEL_f384fc9cd7f2428fad3b6d10ffac7efd",
+ "IPY_MODEL_36838c7736594b1b83f3046c8f0cc265",
+ "IPY_MODEL_b98e34b842054f99ae1ac5f96104321f"
],
- "layout": "IPY_MODEL_cdfaf060f34a4d23afe97243d5f4c709"
+ "layout": "IPY_MODEL_a4ce8092283747e89e730a7e39e64834"
}
},
- "264afd978de54dbeaa1b711e4c0b1c07": {
+ "f384fc9cd7f2428fad3b6d10ffac7efd": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HTMLModel",
"model_module_version": "1.5.0",
@@ -2447,13 +2446,13 @@
"_view_name": "HTMLView",
"description": "",
"description_tooltip": null,
- "layout": "IPY_MODEL_9411023294ab44b284894aebf3f8f589",
+ "layout": "IPY_MODEL_0aa55ed422a94e94b01c117598842a10",
"placeholder": "",
- "style": "IPY_MODEL_d8bf78a3d7ea47a9824d6e01e70b0237",
+ "style": "IPY_MODEL_d54619fbb71e441eb90d9c42145ba07b",
"value": "Downloading (…)"spiece.model";: 100%"
}
},
- "bbcefda6eea74b8ea8313e4f7167df65": {
+ "36838c7736594b1b83f3046c8f0cc265": {
"model_module": "@jupyter-widgets/controls",
"model_name": "FloatProgressModel",
"model_module_version": "1.5.0",
@@ -2469,15 +2468,15 @@
"bar_style": "success",
"description": "",
"description_tooltip": null,
- "layout": "IPY_MODEL_b95ece9507db467fad710338bdf29177",
+ "layout": "IPY_MODEL_da3487b705264da9a8f92254e568b76e",
"max": 791656,
"min": 0,
"orientation": "horizontal",
- "style": "IPY_MODEL_34a31746a99c4916b1402a2829e71a98",
+ "style": "IPY_MODEL_9f378f21d7804f49ad9f72ccabb4a10b",
"value": 791656
}
},
- "68d85f6957ea4807a1fe7c82c9a7bc06": {
+ "b98e34b842054f99ae1ac5f96104321f": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HTMLModel",
"model_module_version": "1.5.0",
@@ -2492,13 +2491,13 @@
"_view_name": "HTMLView",
"description": "",
"description_tooltip": null,
- "layout": "IPY_MODEL_29b2a7a233a9484c92056034cc70b8ca",
+ "layout": "IPY_MODEL_ebb15c7aaf1d4b59a2186e2abbea2868",
"placeholder": "",
- "style": "IPY_MODEL_c9a72e2599e94e9e9bc2b4912d25877b",
- "value": " 792k/792k [00:00<00:00, 19.7MB/s]"
+ "style": "IPY_MODEL_6510cda1ab33418882a1e6811f826ed4",
+ "value": " 792k/792k [00:00<00:00, 9.67MB/s]"
}
},
- "cdfaf060f34a4d23afe97243d5f4c709": {
+ "a4ce8092283747e89e730a7e39e64834": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
@@ -2550,7 +2549,7 @@
"width": null
}
},
- "9411023294ab44b284894aebf3f8f589": {
+ "0aa55ed422a94e94b01c117598842a10": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
@@ -2602,7 +2601,7 @@
"width": null
}
},
- "d8bf78a3d7ea47a9824d6e01e70b0237": {
+ "d54619fbb71e441eb90d9c42145ba07b": {
"model_module": "@jupyter-widgets/controls",
"model_name": "DescriptionStyleModel",
"model_module_version": "1.5.0",
@@ -2617,7 +2616,7 @@
"description_width": ""
}
},
- "b95ece9507db467fad710338bdf29177": {
+ "da3487b705264da9a8f92254e568b76e": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
@@ -2669,7 +2668,7 @@
"width": null
}
},
- "34a31746a99c4916b1402a2829e71a98": {
+ "9f378f21d7804f49ad9f72ccabb4a10b": {
"model_module": "@jupyter-widgets/controls",
"model_name": "ProgressStyleModel",
"model_module_version": "1.5.0",
@@ -2685,7 +2684,7 @@
"description_width": ""
}
},
- "29b2a7a233a9484c92056034cc70b8ca": {
+ "ebb15c7aaf1d4b59a2186e2abbea2868": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
@@ -2737,7 +2736,7 @@
"width": null
}
},
- "c9a72e2599e94e9e9bc2b4912d25877b": {
+ "6510cda1ab33418882a1e6811f826ed4": {
"model_module": "@jupyter-widgets/controls",
"model_name": "DescriptionStyleModel",
"model_module_version": "1.5.0",
@@ -2752,7 +2751,7 @@
"description_width": ""
}
},
- "2c24af439f3e45db8a0e004686e912ed": {
+ "0b3c6eb43a5c4644adbc17ee2b06b079": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HBoxModel",
"model_module_version": "1.5.0",
@@ -2767,14 +2766,14 @@
"_view_name": "HBoxView",
"box_style": "",
"children": [
- "IPY_MODEL_dcb13b35232145fd85be1b6e4442cc5a",
- "IPY_MODEL_58037f9984bb414a9c6e56337d86215c",
- "IPY_MODEL_6e9379baaf2049658790e176ca279531"
+ "IPY_MODEL_fcb7ce49c0c14dc4a5dbbd9870334921",
+ "IPY_MODEL_2f58b16a741f4f1d822c71c17a1c5606",
+ "IPY_MODEL_35cbd0d168714ecc9f0c9236b3707d0a"
],
- "layout": "IPY_MODEL_772e39d516cf43fdbb1b3db001d53d77"
+ "layout": "IPY_MODEL_b9393265011640c493b2bd4de43a4aef"
}
},
- "dcb13b35232145fd85be1b6e4442cc5a": {
+ "fcb7ce49c0c14dc4a5dbbd9870334921": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HTMLModel",
"model_module_version": "1.5.0",
@@ -2789,13 +2788,13 @@
"_view_name": "HTMLView",
"description": "",
"description_tooltip": null,
- "layout": "IPY_MODEL_c08c1e0783324c53b7fc02912fa14af9",
+ "layout": "IPY_MODEL_eaeeca2372be4fe3868d2d3f42839bc2",
"placeholder": "",
- "style": "IPY_MODEL_9bcdda510c0147178f651b66450b48ac",
+ "style": "IPY_MODEL_079b78ca1493431880754da6fc4ac127",
"value": "Downloading (…)/main/tokenizer.json: 100%"
}
},
- "58037f9984bb414a9c6e56337d86215c": {
+ "2f58b16a741f4f1d822c71c17a1c5606": {
"model_module": "@jupyter-widgets/controls",
"model_name": "FloatProgressModel",
"model_module_version": "1.5.0",
@@ -2811,15 +2810,15 @@
"bar_style": "success",
"description": "",
"description_tooltip": null,
- "layout": "IPY_MODEL_18ab5e8088e04cdca93df7519156a59f",
+ "layout": "IPY_MODEL_6c7e4ab3930c4570a05a4e3d9db6782d",
"max": 2424064,
"min": 0,
"orientation": "horizontal",
- "style": "IPY_MODEL_f502a26154d840b89b5c61a2aae4f827",
+ "style": "IPY_MODEL_2ae3b00d50f04990b8c1839dfa705dc8",
"value": 2424064
}
},
- "6e9379baaf2049658790e176ca279531": {
+ "35cbd0d168714ecc9f0c9236b3707d0a": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HTMLModel",
"model_module_version": "1.5.0",
@@ -2834,13 +2833,13 @@
"_view_name": "HTMLView",
"description": "",
"description_tooltip": null,
- "layout": "IPY_MODEL_7beb993a979443dcb93d26ec6e6718c3",
+ "layout": "IPY_MODEL_cfcae44ed5734d7086ecb5028281cf9a",
"placeholder": "",
- "style": "IPY_MODEL_62e60fc862054e4d8d0d18cb1957cf6d",
- "value": " 2.42M/2.42M [00:01<00:00, 1.56MB/s]"
+ "style": "IPY_MODEL_281ca6dc827f41d3833ba1c60606529d",
+ "value": " 2.42M/2.42M [00:00<00:00, 3.93MB/s]"
}
},
- "772e39d516cf43fdbb1b3db001d53d77": {
+ "b9393265011640c493b2bd4de43a4aef": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
@@ -2892,7 +2891,7 @@
"width": null
}
},
- "c08c1e0783324c53b7fc02912fa14af9": {
+ "eaeeca2372be4fe3868d2d3f42839bc2": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
@@ -2944,7 +2943,7 @@
"width": null
}
},
- "9bcdda510c0147178f651b66450b48ac": {
+ "079b78ca1493431880754da6fc4ac127": {
"model_module": "@jupyter-widgets/controls",
"model_name": "DescriptionStyleModel",
"model_module_version": "1.5.0",
@@ -2959,7 +2958,7 @@
"description_width": ""
}
},
- "18ab5e8088e04cdca93df7519156a59f": {
+ "6c7e4ab3930c4570a05a4e3d9db6782d": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
@@ -3011,7 +3010,7 @@
"width": null
}
},
- "f502a26154d840b89b5c61a2aae4f827": {
+ "2ae3b00d50f04990b8c1839dfa705dc8": {
"model_module": "@jupyter-widgets/controls",
"model_name": "ProgressStyleModel",
"model_module_version": "1.5.0",
@@ -3027,7 +3026,7 @@
"description_width": ""
}
},
- "7beb993a979443dcb93d26ec6e6718c3": {
+ "cfcae44ed5734d7086ecb5028281cf9a": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
@@ -3079,7 +3078,7 @@
"width": null
}
},
- "62e60fc862054e4d8d0d18cb1957cf6d": {
+ "281ca6dc827f41d3833ba1c60606529d": {
"model_module": "@jupyter-widgets/controls",
"model_name": "DescriptionStyleModel",
"model_module_version": "1.5.0",
@@ -3094,7 +3093,7 @@
"description_width": ""
}
},
- "bd697213d4fa4c1d9119657c537e78fe": {
+ "bce6a704b2924287b8b9279d791b633b": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HBoxModel",
"model_module_version": "1.5.0",
@@ -3109,14 +3108,14 @@
"_view_name": "HBoxView",
"box_style": "",
"children": [
- "IPY_MODEL_67f9f97815354675bf3bd435f2ed0436",
- "IPY_MODEL_27bd6c78e7f74ff385509e9856c2b8d0",
- "IPY_MODEL_34f670acaa3542eebc8c19018e900ce3"
+ "IPY_MODEL_b1dae5dc568446b0ba896b3abe3afb49",
+ "IPY_MODEL_29ff3a3e656a489182943da91cd73813",
+ "IPY_MODEL_585cf66f9f3648e0b950ca04eb17cc63"
],
- "layout": "IPY_MODEL_ec2d082874844b6daf8542824bfde1a0"
+ "layout": "IPY_MODEL_71e629333d5d4009bc8072b9f12c0cee"
}
},
- "67f9f97815354675bf3bd435f2ed0436": {
+ "b1dae5dc568446b0ba896b3abe3afb49": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HTMLModel",
"model_module_version": "1.5.0",
@@ -3131,13 +3130,13 @@
"_view_name": "HTMLView",
"description": "",
"description_tooltip": null,
- "layout": "IPY_MODEL_b9df5fc8959447449d873bd17e6696f7",
+ "layout": "IPY_MODEL_d5438b0c54104ddd99ed097fa65bc21c",
"placeholder": "",
- "style": "IPY_MODEL_f8489ecaa1a844369bcb427c5f4c95e6",
+ "style": "IPY_MODEL_224c2c07bdc5444aaddf46ca6325e681",
"value": "Downloading (…)cial_tokens_map.json: 100%"
}
},
- "27bd6c78e7f74ff385509e9856c2b8d0": {
+ "29ff3a3e656a489182943da91cd73813": {
"model_module": "@jupyter-widgets/controls",
"model_name": "FloatProgressModel",
"model_module_version": "1.5.0",
@@ -3153,15 +3152,15 @@
"bar_style": "success",
"description": "",
"description_tooltip": null,
- "layout": "IPY_MODEL_b21e65a9dff040f4a045580d9989ac20",
+ "layout": "IPY_MODEL_197d80f118764b65b29ad5049edd0087",
"max": 2201,
"min": 0,
"orientation": "horizontal",
- "style": "IPY_MODEL_0efa19170c9e4de891e328365543c916",
+ "style": "IPY_MODEL_e0326b59a1334117bbe6ccb06c1f4020",
"value": 2201
}
},
- "34f670acaa3542eebc8c19018e900ce3": {
+ "585cf66f9f3648e0b950ca04eb17cc63": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HTMLModel",
"model_module_version": "1.5.0",
@@ -3176,13 +3175,13 @@
"_view_name": "HTMLView",
"description": "",
"description_tooltip": null,
- "layout": "IPY_MODEL_8c6fa802ddd5491581c092e5422bfeab",
+ "layout": "IPY_MODEL_6fd86b989a354a2696c8b9e880109a95",
"placeholder": "",
- "style": "IPY_MODEL_42cfc2ada7ac408fab39251add66f6ef",
- "value": " 2.20k/2.20k [00:00<00:00, 67.2kB/s]"
+ "style": "IPY_MODEL_2caff09a31ad46f59e717e25462b12d6",
+ "value": " 2.20k/2.20k [00:00<00:00, 125kB/s]"
}
},
- "ec2d082874844b6daf8542824bfde1a0": {
+ "71e629333d5d4009bc8072b9f12c0cee": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
@@ -3234,7 +3233,7 @@
"width": null
}
},
- "b9df5fc8959447449d873bd17e6696f7": {
+ "d5438b0c54104ddd99ed097fa65bc21c": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
@@ -3286,7 +3285,7 @@
"width": null
}
},
- "f8489ecaa1a844369bcb427c5f4c95e6": {
+ "224c2c07bdc5444aaddf46ca6325e681": {
"model_module": "@jupyter-widgets/controls",
"model_name": "DescriptionStyleModel",
"model_module_version": "1.5.0",
@@ -3301,7 +3300,7 @@
"description_width": ""
}
},
- "b21e65a9dff040f4a045580d9989ac20": {
+ "197d80f118764b65b29ad5049edd0087": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
@@ -3353,7 +3352,7 @@
"width": null
}
},
- "0efa19170c9e4de891e328365543c916": {
+ "e0326b59a1334117bbe6ccb06c1f4020": {
"model_module": "@jupyter-widgets/controls",
"model_name": "ProgressStyleModel",
"model_module_version": "1.5.0",
@@ -3369,7 +3368,7 @@
"description_width": ""
}
},
- "8c6fa802ddd5491581c092e5422bfeab": {
+ "6fd86b989a354a2696c8b9e880109a95": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
@@ -3421,7 +3420,7 @@
"width": null
}
},
- "42cfc2ada7ac408fab39251add66f6ef": {
+ "2caff09a31ad46f59e717e25462b12d6": {
"model_module": "@jupyter-widgets/controls",
"model_name": "DescriptionStyleModel",
"model_module_version": "1.5.0",
@@ -3436,7 +3435,7 @@
"description_width": ""
}
},
- "3747d0aa68d642449ff32b7efd47d497": {
+ "8e60f2b1a9f7455db02eb846af52df63": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HBoxModel",
"model_module_version": "1.5.0",
@@ -3451,14 +3450,14 @@
"_view_name": "HBoxView",
"box_style": "",
"children": [
- "IPY_MODEL_2a84ccf3660a4e24b37bfc1d952f06d9",
- "IPY_MODEL_43b98452768846eb9b773839a4681cc6",
- "IPY_MODEL_2dfbcef644a84b558ce99b2ddaf091b6"
+ "IPY_MODEL_71ff180cc81a4376b6a27455ed5cba26",
+ "IPY_MODEL_4dc7c026d3e5469da3ada03bf77d7019",
+ "IPY_MODEL_279308acf5be418ab7f25c3501739c9d"
],
- "layout": "IPY_MODEL_9dd02373a1994433a49e0015b76dd858"
+ "layout": "IPY_MODEL_5c4c0f7bfb6c4a518cdfd3f1d70e77d5"
}
},
- "2a84ccf3660a4e24b37bfc1d952f06d9": {
+ "71ff180cc81a4376b6a27455ed5cba26": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HTMLModel",
"model_module_version": "1.5.0",
@@ -3473,13 +3472,13 @@
"_view_name": "HTMLView",
"description": "",
"description_tooltip": null,
- "layout": "IPY_MODEL_42a620dfccb4416c95fbd7a76637dc73",
+ "layout": "IPY_MODEL_7182f8c40174456db2d6f974e1a672a9",
"placeholder": "",
- "style": "IPY_MODEL_9d953b41e24c4263b18e1ff2174eb797",
+ "style": "IPY_MODEL_f34bf1f4156b4dec8990f16cbceccb00",
"value": "Downloading (…)lve/main/config.json: 100%"
}
},
- "43b98452768846eb9b773839a4681cc6": {
+ "4dc7c026d3e5469da3ada03bf77d7019": {
"model_module": "@jupyter-widgets/controls",
"model_name": "FloatProgressModel",
"model_module_version": "1.5.0",
@@ -3495,15 +3494,15 @@
"bar_style": "success",
"description": "",
"description_tooltip": null,
- "layout": "IPY_MODEL_cb409960af114fa690bac72c1d51d2ab",
+ "layout": "IPY_MODEL_bcf3f636355347338e1d57c191e2349f",
"max": 1404,
"min": 0,
"orientation": "horizontal",
- "style": "IPY_MODEL_995a94c35b4c441b86598d1976281711",
+ "style": "IPY_MODEL_e36598bd61874b4eb737d248df7c1212",
"value": 1404
}
},
- "2dfbcef644a84b558ce99b2ddaf091b6": {
+ "279308acf5be418ab7f25c3501739c9d": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HTMLModel",
"model_module_version": "1.5.0",
@@ -3518,13 +3517,13 @@
"_view_name": "HTMLView",
"description": "",
"description_tooltip": null,
- "layout": "IPY_MODEL_4ea2ccb5fa264dd5a042f570c22db7de",
+ "layout": "IPY_MODEL_f9c113d3c4f64aee969c897451b4522e",
"placeholder": "",
- "style": "IPY_MODEL_4d5668e5b66d4993b935b077a1dc281c",
- "value": " 1.40k/1.40k [00:00<00:00, 54.0kB/s]"
+ "style": "IPY_MODEL_fc647c0c0bd14b87b59d539db3793d0a",
+ "value": " 1.40k/1.40k [00:00<00:00, 24.5kB/s]"
}
},
- "9dd02373a1994433a49e0015b76dd858": {
+ "5c4c0f7bfb6c4a518cdfd3f1d70e77d5": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
@@ -3576,7 +3575,7 @@
"width": null
}
},
- "42a620dfccb4416c95fbd7a76637dc73": {
+ "7182f8c40174456db2d6f974e1a672a9": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
@@ -3628,7 +3627,7 @@
"width": null
}
},
- "9d953b41e24c4263b18e1ff2174eb797": {
+ "f34bf1f4156b4dec8990f16cbceccb00": {
"model_module": "@jupyter-widgets/controls",
"model_name": "DescriptionStyleModel",
"model_module_version": "1.5.0",
@@ -3643,7 +3642,7 @@
"description_width": ""
}
},
- "cb409960af114fa690bac72c1d51d2ab": {
+ "bcf3f636355347338e1d57c191e2349f": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
@@ -3695,7 +3694,7 @@
"width": null
}
},
- "995a94c35b4c441b86598d1976281711": {
+ "e36598bd61874b4eb737d248df7c1212": {
"model_module": "@jupyter-widgets/controls",
"model_name": "ProgressStyleModel",
"model_module_version": "1.5.0",
@@ -3711,7 +3710,7 @@
"description_width": ""
}
},
- "4ea2ccb5fa264dd5a042f570c22db7de": {
+ "f9c113d3c4f64aee969c897451b4522e": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
@@ -3763,7 +3762,7 @@
"width": null
}
},
- "4d5668e5b66d4993b935b077a1dc281c": {
+ "fc647c0c0bd14b87b59d539db3793d0a": {
"model_module": "@jupyter-widgets/controls",
"model_name": "DescriptionStyleModel",
"model_module_version": "1.5.0",
@@ -3778,7 +3777,7 @@
"description_width": ""
}
},
- "cf36c750119449e8a16aa97a9b66a124": {
+ "3fcb6b4a0c454d59a6d5503cec84ba37": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HBoxModel",
"model_module_version": "1.5.0",
@@ -3793,14 +3792,14 @@
"_view_name": "HBoxView",
"box_style": "",
"children": [
- "IPY_MODEL_0de691bf20804830ba5e6710c205c9ac",
- "IPY_MODEL_7ee532c002784554b12fede964c6c05a",
- "IPY_MODEL_25e5c76c84a8414495b61663250825aa"
+ "IPY_MODEL_17d4993dc58949ca87a852e7e6c02e0c",
+ "IPY_MODEL_db24a85aa3e24a2c9275b9aa4ac78faa",
+ "IPY_MODEL_48a5bb74641a4a2fba370c0ddad1f6cb"
],
- "layout": "IPY_MODEL_12bd0cd379754967bfd5481d5836b7a4"
+ "layout": "IPY_MODEL_1b0971b224444e2c8ddbf817f2f02131"
}
},
- "0de691bf20804830ba5e6710c205c9ac": {
+ "17d4993dc58949ca87a852e7e6c02e0c": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HTMLModel",
"model_module_version": "1.5.0",
@@ -3815,13 +3814,13 @@
"_view_name": "HTMLView",
"description": "",
"description_tooltip": null,
- "layout": "IPY_MODEL_d55d326ffbdc420da0a399c141f7fb56",
+ "layout": "IPY_MODEL_07c9e3207eb04c5fb004744c3e4eb3b2",
"placeholder": "",
- "style": "IPY_MODEL_092323b59b734eada8d88197d9f0eb72",
+ "style": "IPY_MODEL_957e7a116bad4dee93ab449d7766d8ba",
"value": "Downloading (…)"pytorch_model.bin";: 100%"
}
},
- "7ee532c002784554b12fede964c6c05a": {
+ "db24a85aa3e24a2c9275b9aa4ac78faa": {
"model_module": "@jupyter-widgets/controls",
"model_name": "FloatProgressModel",
"model_module_version": "1.5.0",
@@ -3837,15 +3836,15 @@
"bar_style": "success",
"description": "",
"description_tooltip": null,
- "layout": "IPY_MODEL_622df288b2ae4f62b776cb101de18b9f",
+ "layout": "IPY_MODEL_1a2ed54b1c584fa3bd2e0517a878790f",
"max": 990402637,
"min": 0,
"orientation": "horizontal",
- "style": "IPY_MODEL_c72abd216b9444ef9bdb0f8a0a6771b0",
+ "style": "IPY_MODEL_444add600a24462aa2272f2758ddb99d",
"value": 990402637
}
},
- "25e5c76c84a8414495b61663250825aa": {
+ "48a5bb74641a4a2fba370c0ddad1f6cb": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HTMLModel",
"model_module_version": "1.5.0",
@@ -3860,13 +3859,13 @@
"_view_name": "HTMLView",
"description": "",
"description_tooltip": null,
- "layout": "IPY_MODEL_03d5f2402e464b7cb5244db0f824df1d",
+ "layout": "IPY_MODEL_98a9c4dc9bf349d1a8cf985c6a132530",
"placeholder": "",
- "style": "IPY_MODEL_4a6e196f590d4b329e0edefc910d4730",
- "value": " 990M/990M [00:09<00:00, 135MB/s]"
+ "style": "IPY_MODEL_4d94cb68eed54ffd97cc8272f70a92f3",
+ "value": " 990M/990M [00:11<00:00, 86.0MB/s]"
}
},
- "12bd0cd379754967bfd5481d5836b7a4": {
+ "1b0971b224444e2c8ddbf817f2f02131": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
@@ -3918,7 +3917,7 @@
"width": null
}
},
- "d55d326ffbdc420da0a399c141f7fb56": {
+ "07c9e3207eb04c5fb004744c3e4eb3b2": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
@@ -3970,7 +3969,7 @@
"width": null
}
},
- "092323b59b734eada8d88197d9f0eb72": {
+ "957e7a116bad4dee93ab449d7766d8ba": {
"model_module": "@jupyter-widgets/controls",
"model_name": "DescriptionStyleModel",
"model_module_version": "1.5.0",
@@ -3985,7 +3984,7 @@
"description_width": ""
}
},
- "622df288b2ae4f62b776cb101de18b9f": {
+ "1a2ed54b1c584fa3bd2e0517a878790f": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
@@ -4037,7 +4036,7 @@
"width": null
}
},
- "c72abd216b9444ef9bdb0f8a0a6771b0": {
+ "444add600a24462aa2272f2758ddb99d": {
"model_module": "@jupyter-widgets/controls",
"model_name": "ProgressStyleModel",
"model_module_version": "1.5.0",
@@ -4053,7 +4052,7 @@
"description_width": ""
}
},
- "03d5f2402e464b7cb5244db0f824df1d": {
+ "98a9c4dc9bf349d1a8cf985c6a132530": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
@@ -4105,7 +4104,7 @@
"width": null
}
},
- "4a6e196f590d4b329e0edefc910d4730": {
+ "4d94cb68eed54ffd97cc8272f70a92f3": {
"model_module": "@jupyter-widgets/controls",
"model_name": "DescriptionStyleModel",
"model_module_version": "1.5.0",
@@ -4120,7 +4119,7 @@
"description_width": ""
}
},
- "9a04f6723e2a40288eb42eea0134dfaf": {
+ "c2a8099dd85e42599911991b467a7afe": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HBoxModel",
"model_module_version": "1.5.0",
@@ -4135,14 +4134,14 @@
"_view_name": "HBoxView",
"box_style": "",
"children": [
- "IPY_MODEL_4065d0eed87e4d268de8f4536287e225",
- "IPY_MODEL_bebca147a83446abaf19c3e3db11744e",
- "IPY_MODEL_cf525a599ca245b19204bfff3fa1bd11"
+ "IPY_MODEL_72d0effc5d0948378103da4b2c8da5ae",
+ "IPY_MODEL_cf3ac6e0e69643639d6b0a2577fff71a",
+ "IPY_MODEL_d8f4949af74342d3b72200484ee3f1fb"
],
- "layout": "IPY_MODEL_b60759f0730343849ef3e51d2c8be38c"
+ "layout": "IPY_MODEL_ff42d87d84694bb2a6a7e63e43750029"
}
},
- "4065d0eed87e4d268de8f4536287e225": {
+ "72d0effc5d0948378103da4b2c8da5ae": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HTMLModel",
"model_module_version": "1.5.0",
@@ -4157,13 +4156,13 @@
"_view_name": "HTMLView",
"description": "",
"description_tooltip": null,
- "layout": "IPY_MODEL_dcc795e3fac0401b9a4d2aac3bd6e8cc",
+ "layout": "IPY_MODEL_ae619521ac64447b91b9fb26c46e696a",
"placeholder": "",
- "style": "IPY_MODEL_ed7ca6da408842b38a466097ec9d4616",
+ "style": "IPY_MODEL_62a20c9c11f4452389dfdde24fa90d03",
"value": "Downloading (…)neration_config.json: 100%"
}
},
- "bebca147a83446abaf19c3e3db11744e": {
+ "cf3ac6e0e69643639d6b0a2577fff71a": {
"model_module": "@jupyter-widgets/controls",
"model_name": "FloatProgressModel",
"model_module_version": "1.5.0",
@@ -4179,15 +4178,15 @@
"bar_style": "success",
"description": "",
"description_tooltip": null,
- "layout": "IPY_MODEL_0335f29f40564adf9b577707dfb40aa9",
+ "layout": "IPY_MODEL_cb94c6469891495db93c332e2b707299",
"max": 147,
"min": 0,
"orientation": "horizontal",
- "style": "IPY_MODEL_a200da1478fa46a19695a5b2f2c77fd1",
+ "style": "IPY_MODEL_4e0b6f1f2b2f497d9b6e0183b0bc7ade",
"value": 147
}
},
- "cf525a599ca245b19204bfff3fa1bd11": {
+ "d8f4949af74342d3b72200484ee3f1fb": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HTMLModel",
"model_module_version": "1.5.0",
@@ -4202,13 +4201,13 @@
"_view_name": "HTMLView",
"description": "",
"description_tooltip": null,
- "layout": "IPY_MODEL_e21e75bbbc4149b4ac85fece44aee355",
+ "layout": "IPY_MODEL_999d0e74507b4acfae447018abb03323",
"placeholder": "",
- "style": "IPY_MODEL_c014c271cd374f62a0d113efca14001a",
- "value": " 147/147 [00:00<00:00, 6.16kB/s]"
+ "style": "IPY_MODEL_eaa726bb3b9d45d29c011053e844a97e",
+ "value": " 147/147 [00:00<00:00, 4.33kB/s]"
}
},
- "b60759f0730343849ef3e51d2c8be38c": {
+ "ff42d87d84694bb2a6a7e63e43750029": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
@@ -4260,7 +4259,7 @@
"width": null
}
},
- "dcc795e3fac0401b9a4d2aac3bd6e8cc": {
+ "ae619521ac64447b91b9fb26c46e696a": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
@@ -4312,7 +4311,7 @@
"width": null
}
},
- "ed7ca6da408842b38a466097ec9d4616": {
+ "62a20c9c11f4452389dfdde24fa90d03": {
"model_module": "@jupyter-widgets/controls",
"model_name": "DescriptionStyleModel",
"model_module_version": "1.5.0",
@@ -4327,7 +4326,7 @@
"description_width": ""
}
},
- "0335f29f40564adf9b577707dfb40aa9": {
+ "cb94c6469891495db93c332e2b707299": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
@@ -4379,7 +4378,7 @@
"width": null
}
},
- "a200da1478fa46a19695a5b2f2c77fd1": {
+ "4e0b6f1f2b2f497d9b6e0183b0bc7ade": {
"model_module": "@jupyter-widgets/controls",
"model_name": "ProgressStyleModel",
"model_module_version": "1.5.0",
@@ -4395,7 +4394,7 @@
"description_width": ""
}
},
- "e21e75bbbc4149b4ac85fece44aee355": {
+ "999d0e74507b4acfae447018abb03323": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
@@ -4447,7 +4446,7 @@
"width": null
}
},
- "c014c271cd374f62a0d113efca14001a": {
+ "eaa726bb3b9d45d29c011053e844a97e": {
"model_module": "@jupyter-widgets/controls",
"model_name": "DescriptionStyleModel",
"model_module_version": "1.5.0",
@@ -4463,7 +4462,8 @@
}
}
}
- }
+ },
+ "accelerator": "GPU"
},
"cells": [
{
@@ -4483,7 +4483,7 @@
"base_uri": "https://localhost:8080/"
},
"id": "8l0hzptKNiZS",
- "outputId": "6ebbbe8e-00ec-4108-d209-e7dd267f6d1e"
+ "outputId": "f5a51cde-6e0a-46dd-a5bd-682bdd4f173b"
},
"outputs": [
{
@@ -4493,57 +4493,57 @@
"Looking in indexes: https://pypi.org/simple, https://us-python.pkg.dev/colab-wheels/public/simple/\n",
"Collecting transformers\n",
" Downloading transformers-4.26.1-py3-none-any.whl (6.3 MB)\n",
- "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m6.3/6.3 MB\u001b[0m \u001b[31m47.0 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m6.3/6.3 MB\u001b[0m \u001b[31m83.6 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
"\u001b[?25hCollecting datasets\n",
" Downloading datasets-2.9.0-py3-none-any.whl (462 kB)\n",
- "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m462.8/462.8 KB\u001b[0m \u001b[31m22.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m462.8/462.8 KB\u001b[0m \u001b[31m51.4 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
"\u001b[?25hRequirement already satisfied: torch in /usr/local/lib/python3.8/dist-packages (1.13.1+cu116)\n",
"Collecting sentencepiece\n",
" Downloading sentencepiece-0.1.97-cp38-cp38-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (1.3 MB)\n",
- "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m1.3/1.3 MB\u001b[0m \u001b[31m15.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
- "\u001b[?25hRequirement already satisfied: pyyaml>=5.1 in /usr/local/lib/python3.8/dist-packages (from transformers) (6.0)\n",
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m1.3/1.3 MB\u001b[0m \u001b[31m81.3 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+ "\u001b[?25hRequirement already satisfied: filelock in /usr/local/lib/python3.8/dist-packages (from transformers) (3.9.0)\n",
+ "Requirement already satisfied: tqdm>=4.27 in /usr/local/lib/python3.8/dist-packages (from transformers) (4.64.1)\n",
+ "Requirement already satisfied: numpy>=1.17 in /usr/local/lib/python3.8/dist-packages (from transformers) (1.21.6)\n",
"Requirement already satisfied: regex!=2019.12.17 in /usr/local/lib/python3.8/dist-packages (from transformers) (2022.6.2)\n",
+ "Requirement already satisfied: requests in /usr/local/lib/python3.8/dist-packages (from transformers) (2.25.1)\n",
+ "Requirement already satisfied: pyyaml>=5.1 in /usr/local/lib/python3.8/dist-packages (from transformers) (6.0)\n",
"Collecting huggingface-hub<1.0,>=0.11.0\n",
" Downloading huggingface_hub-0.12.0-py3-none-any.whl (190 kB)\n",
- "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m190.3/190.3 KB\u001b[0m \u001b[31m13.0 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m190.3/190.3 KB\u001b[0m \u001b[31m26.6 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
"\u001b[?25hCollecting tokenizers!=0.11.3,<0.14,>=0.11.1\n",
" Downloading tokenizers-0.13.2-cp38-cp38-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (7.6 MB)\n",
- "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m7.6/7.6 MB\u001b[0m \u001b[31m56.1 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
- "\u001b[?25hRequirement already satisfied: filelock in /usr/local/lib/python3.8/dist-packages (from transformers) (3.9.0)\n",
- "Requirement already satisfied: requests in /usr/local/lib/python3.8/dist-packages (from transformers) (2.25.1)\n",
- "Requirement already satisfied: tqdm>=4.27 in /usr/local/lib/python3.8/dist-packages (from transformers) (4.64.1)\n",
- "Requirement already satisfied: packaging>=20.0 in /usr/local/lib/python3.8/dist-packages (from transformers) (23.0)\n",
- "Requirement already satisfied: numpy>=1.17 in /usr/local/lib/python3.8/dist-packages (from transformers) (1.21.6)\n",
- "Collecting multiprocess\n",
- " Downloading multiprocess-0.70.14-py38-none-any.whl (132 kB)\n",
- "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m132.0/132.0 KB\u001b[0m \u001b[31m4.6 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
- "\u001b[?25hRequirement already satisfied: dill<0.3.7 in /usr/local/lib/python3.8/dist-packages (from datasets) (0.3.6)\n",
- "Collecting xxhash\n",
- " Downloading xxhash-3.2.0-cp38-cp38-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (213 kB)\n",
- "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m213.0/213.0 KB\u001b[0m \u001b[31m8.7 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
- "\u001b[?25hRequirement already satisfied: pyarrow>=6.0.0 in /usr/local/lib/python3.8/dist-packages (from datasets) (9.0.0)\n",
- "Requirement already satisfied: pandas in /usr/local/lib/python3.8/dist-packages (from datasets) (1.3.5)\n",
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m7.6/7.6 MB\u001b[0m \u001b[31m87.7 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+ "\u001b[?25hRequirement already satisfied: packaging>=20.0 in /usr/local/lib/python3.8/dist-packages (from transformers) (23.0)\n",
+ "Requirement already satisfied: dill<0.3.7 in /usr/local/lib/python3.8/dist-packages (from datasets) (0.3.6)\n",
"Collecting responses<0.19\n",
" Downloading responses-0.18.0-py3-none-any.whl (38 kB)\n",
- "Requirement already satisfied: aiohttp in /usr/local/lib/python3.8/dist-packages (from datasets) (3.8.3)\n",
"Requirement already satisfied: fsspec[http]>=2021.11.1 in /usr/local/lib/python3.8/dist-packages (from datasets) (2023.1.0)\n",
- "Requirement already satisfied: typing-extensions in /usr/local/lib/python3.8/dist-packages (from torch) (4.4.0)\n",
+ "Requirement already satisfied: pyarrow>=6.0.0 in /usr/local/lib/python3.8/dist-packages (from datasets) (9.0.0)\n",
+ "Collecting xxhash\n",
+ " Downloading xxhash-3.2.0-cp38-cp38-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (213 kB)\n",
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m213.0/213.0 KB\u001b[0m \u001b[31m28.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+ "\u001b[?25hRequirement already satisfied: pandas in /usr/local/lib/python3.8/dist-packages (from datasets) (1.3.5)\n",
+ "Requirement already satisfied: aiohttp in /usr/local/lib/python3.8/dist-packages (from datasets) (3.8.3)\n",
+ "Collecting multiprocess\n",
+ " Downloading multiprocess-0.70.14-py38-none-any.whl (132 kB)\n",
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m132.0/132.0 KB\u001b[0m \u001b[31m18.6 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+ "\u001b[?25hRequirement already satisfied: typing-extensions in /usr/local/lib/python3.8/dist-packages (from torch) (4.4.0)\n",
+ "Requirement already satisfied: multidict<7.0,>=4.5 in /usr/local/lib/python3.8/dist-packages (from aiohttp->datasets) (6.0.4)\n",
+ "Requirement already satisfied: charset-normalizer<3.0,>=2.0 in /usr/local/lib/python3.8/dist-packages (from aiohttp->datasets) (2.1.1)\n",
+ "Requirement already satisfied: yarl<2.0,>=1.0 in /usr/local/lib/python3.8/dist-packages (from aiohttp->datasets) (1.8.2)\n",
"Requirement already satisfied: attrs>=17.3.0 in /usr/local/lib/python3.8/dist-packages (from aiohttp->datasets) (22.2.0)\n",
"Requirement already satisfied: async-timeout<5.0,>=4.0.0a3 in /usr/local/lib/python3.8/dist-packages (from aiohttp->datasets) (4.0.2)\n",
- "Requirement already satisfied: yarl<2.0,>=1.0 in /usr/local/lib/python3.8/dist-packages (from aiohttp->datasets) (1.8.2)\n",
- "Requirement already satisfied: charset-normalizer<3.0,>=2.0 in /usr/local/lib/python3.8/dist-packages (from aiohttp->datasets) (2.1.1)\n",
- "Requirement already satisfied: multidict<7.0,>=4.5 in /usr/local/lib/python3.8/dist-packages (from aiohttp->datasets) (6.0.4)\n",
"Requirement already satisfied: aiosignal>=1.1.2 in /usr/local/lib/python3.8/dist-packages (from aiohttp->datasets) (1.3.1)\n",
"Requirement already satisfied: frozenlist>=1.1.1 in /usr/local/lib/python3.8/dist-packages (from aiohttp->datasets) (1.3.3)\n",
- "Requirement already satisfied: urllib3<1.27,>=1.21.1 in /usr/local/lib/python3.8/dist-packages (from requests->transformers) (1.24.3)\n",
- "Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.8/dist-packages (from requests->transformers) (2022.12.7)\n",
- "Requirement already satisfied: chardet<5,>=3.0.2 in /usr/local/lib/python3.8/dist-packages (from requests->transformers) (4.0.0)\n",
"Requirement already satisfied: idna<3,>=2.5 in /usr/local/lib/python3.8/dist-packages (from requests->transformers) (2.10)\n",
+ "Requirement already satisfied: urllib3<1.27,>=1.21.1 in /usr/local/lib/python3.8/dist-packages (from requests->transformers) (1.24.3)\n",
+ "Requirement already satisfied: chardet<5,>=3.0.2 in /usr/local/lib/python3.8/dist-packages (from requests->transformers) (4.0.0)\n",
+ "Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.8/dist-packages (from requests->transformers) (2022.12.7)\n",
"Collecting urllib3<1.27,>=1.21.1\n",
" Downloading urllib3-1.26.14-py2.py3-none-any.whl (140 kB)\n",
- "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m140.6/140.6 KB\u001b[0m \u001b[31m9.7 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
- "\u001b[?25hRequirement already satisfied: python-dateutil>=2.7.3 in /usr/local/lib/python3.8/dist-packages (from pandas->datasets) (2.8.2)\n",
- "Requirement already satisfied: pytz>=2017.3 in /usr/local/lib/python3.8/dist-packages (from pandas->datasets) (2022.7.1)\n",
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m140.6/140.6 KB\u001b[0m \u001b[31m19.3 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
+ "\u001b[?25hRequirement already satisfied: pytz>=2017.3 in /usr/local/lib/python3.8/dist-packages (from pandas->datasets) (2022.7.1)\n",
+ "Requirement already satisfied: python-dateutil>=2.7.3 in /usr/local/lib/python3.8/dist-packages (from pandas->datasets) (2.8.2)\n",
"Requirement already satisfied: six>=1.5 in /usr/local/lib/python3.8/dist-packages (from python-dateutil>=2.7.3->pandas->datasets) (1.15.0)\n",
"Installing collected packages: tokenizers, sentencepiece, xxhash, urllib3, multiprocess, responses, huggingface-hub, transformers, datasets\n",
" Attempting uninstall: urllib3\n",
@@ -4586,78 +4586,78 @@
"metadata": {
"colab": {
"base_uri": "https://localhost:8080/",
- "height": 244,
+ "height": 231,
"referenced_widgets": [
- "e4bb6f2f32de48d4b1f6d7ecf97ce376",
- "3305b30f1bfa48e9b0c1ba3add06094e",
- "a343619acbb745baa6aa561271ec8815",
- "c493fc54d9eb421f96d6e8519c8a1b0e",
- "12fd6daa8e604ecd9ad731b6296815da",
- "805f497aa3304353a1be8b4cc87bfb54",
- "594a6d13f81f479eb00fa45fd4094146",
- "236979048eb8461f9b7d8c4103905eed",
- "4620faf461ca449a88de45e86467e265",
- "8dc2f0f2e66741edbccab7abaaf634ce",
- "0d49bfb55dfd4090ba57c544eaa97902",
- "4084f218fca64fc9b765e04d0cc073ac",
- "fec67d95a5904ac199f6648a34ef1ff9",
- "a734d44f6baf4a5f8dfda576c09fffca",
- "3fc2d009da594365854aa11be804b388",
- "45c7d35932ec44bcb2ccdc73f0ae6b46",
- "0c1c3db046f24599b27daa44217f48d2",
- "c3f9ed611a154e22b875d0696ef6022d",
- "7fd51c34909b41a8884fa358cccdbf48",
- "9d9edc5471de40c2b7c2b9156637997d",
- "02c64bf3ff95438cb43c7dc52034cc43",
- "f0b71ecb6b1c4d1190ca899af7d3e82c",
- "8cae9c49e18f43248072b5e059429f6d",
- "88c8adca128b44c1bbbec437630c2074",
- "0f73f5e2c8af41eaae5f1c27f212da8b",
- "255b4480e11f4b3e892a5d2dc6abfd4b",
- "a96eab6312f6447b9eff3f914c5a6827",
- "063059d53dc942d1aee9e3fe2f27687d",
- "ca50704df2cc430fae6b5902c5399414",
- "64f5cdd8d1c14be79278ee4de89993d1",
- "f065dcd7d1d34cb6806f2eb28bb3cd6f",
- "67663505c87640b58e04d3ce028537ea",
- "f5a17bc6f9f94b2ca119528b0ca2d456",
- "ec0f16c3cbb14d9287e148887127219b",
- "ba832204e1d4413f8b8a15e10bac7d95",
- "8179dbec98b7466ea2195affb0568498",
- "7e9abda7b55c459b8a9888edaf1cc116",
- "64c8860ae16848af9b04bb41955a8446",
- "64fe250082bf4d4fb126a319920d2f0a",
- "0b278b6f5da94921afbacb873c15d9c9",
- "b688bc7f34e941488831da5d4aed9396",
- "44cec66cbaeb49abb26dbfc5420ceacb",
- "67a750dcfa8b44499956572fda3dbacf",
- "edad6f2eb6704468bd06006c50697f86",
- "699a1bdf38ca48e2affc3c6bd771852f",
- "4e5a92d4acdc43d487290ffd8a842ea5",
- "8bc8c44b6324478a8209094f9b7e9ccd",
- "e95f31e693674a0aae8de0e167a49daf",
- "069a68aed2bb4d37a00c9c0feedd3e17",
- "9930f171a6db47939e996016cb49fe20",
- "ddd0c0abba074aa7a33b5c825ccf8760",
- "8bbb7307312648b0afb901f701a4e466",
- "4a2eb48d3583446598fdd1b7175c96fd",
- "b3eae90c5aea409ab1a2c541948658f8",
- "41b5186c2e194402a1e18f1c1a9f18a4",
- "3c84850ebe3e45d297d3bfa8a12f1b86",
- "8a5f71a073ca4b0cb929ba3cf31fd296",
- "b5be73849b61415fb9187d011261be1e",
- "46a51fbd984344b1958889c608ea04ed",
- "0d25092adebd4f94b1799df263ccaf55",
- "e4814d2ee2df4f6a9f411b134ebca546",
- "09669f6ac72b45689e082b4fb489a23f",
- "7afda94f85794acf882856b760a3eb63",
- "a70df5e47adb4a4d8b80a543dedfd708",
- "140058b69379422797bdc22374192bd6",
- "8aabd23e2fa242e4b8cf4ef43fbebe2e"
+ "a8e120a9a97d45d59fcf275af25a591e",
+ "e665879731604133a593e13155f4e03b",
+ "d451aa9d81ca4d5ea901297e702762c0",
+ "a9edac4d193f4930aa691fa496badc64",
+ "a21e8fec1d92496a835ae8ad71c287ab",
+ "d168c852a75a43f5addcfbc75c48ec14",
+ "589f9c90c98b48bda9ecb020cb384eab",
+ "e35fb285260b4b86aa9854eac11a6dfd",
+ "f505b8ea01ff4e2f90edf1d08c5096b1",
+ "0baf1fcb54e945679e3591276182aa9e",
+ "2d57d4b6086e47e1a7d6a9a1375cc49f",
+ "564f30aef6c34efa952fdd1402627d13",
+ "0ee3c4b36db247d09e7fb9e68e856abb",
+ "03ee22d44e2141d99e54bbd59246b328",
+ "19465851c65e445fbaed11e33ac09098",
+ "6a7e920546444da7bf855620f00c45e0",
+ "e8b69414b5004f489f5c6793b6cc0746",
+ "474f0c044be14860b6a38321281d0d1f",
+ "f2861641cda34f2786112b28bac2b36f",
+ "f07c5cffb60c4a89bb29c49811d73aba",
+ "e502595b7e6b45498d2018e62e6fa6f2",
+ "80b9042089364fae8e0cffc7a49203c1",
+ "ae89e755c6e64ab2a3101913d08820ef",
+ "5181e91045d240308e1371af2a560d56",
+ "3551b2e33fac44f38988c07fc5819b23",
+ "9a418f8782a842898d730f8cbc4fe311",
+ "c9d1c36d765345e183d4cdf911ad07b3",
+ "75a75524abc04743a7533f9030769bb2",
+ "84e9b5aef48c4d429742d0fde6fc125e",
+ "24492355887d405b98f8f42c4be836b6",
+ "5c7cbcd333f145488ab9411512467c19",
+ "6cc08744eb594bbc913da9fc2a15c939",
+ "17c7c64eafb14d168bd386cae79902aa",
+ "db79fbdb9e25432a8f95221cc0bed971",
+ "3c14418eb66d4392bcaa64ca3394084c",
+ "3144d6d798df44afacc4f34bed90f0e4",
+ "9259558984d847ae99435ef4e312e3b7",
+ "1b05d118f33949dfa5daf732520f9c62",
+ "dc652b3692ed4da6b3fd959acb773b66",
+ "ce7027fdd804415db2c60560be3c66e9",
+ "3ab3add96759441eba1571795b0edaae",
+ "d88268e0bb52404e86a37b01fdac5957",
+ "dae3457866114776818227ec44284ced",
+ "2aab0424351e4b9594cdcf631632c690",
+ "6fd330314de74ccc983da44783bcac7d",
+ "209778054761411190cf91741a43b2d3",
+ "5d45d48713924a8d805368867c7bb5e0",
+ "fa0715f8876c401ba6a2681d0abf7e5a",
+ "b6afff9e8ee44d42814dc84670ed999f",
+ "7b636bb9a4724d2783148aa8d6aa791e",
+ "dd488415b19349d8a5306153907ba902",
+ "174930418d51405f969eaa6b5aa67dde",
+ "75f8a0de12974b84a4b8bde1a16c33c4",
+ "101281b2ecf441a39abc9d4e49398e43",
+ "20ad8bc6a1c94be090190ea3de64a10f",
+ "99cbe58514e3460398f032b93a57d068",
+ "797dcecef4874b9f8de64e643661c637",
+ "9d97e656e72d4f99a2b4669e811918cd",
+ "df4a5058866c4ec8875cfb5189c738c5",
+ "fcd408ec35cd44f1b7309931256adfaa",
+ "2ab3431929a540609d0edac159d63d41",
+ "fa0e9bb620c04cca998be8929f50c4d8",
+ "4d131181a5fa4f0880946ef5cd984790",
+ "2f3024af40c346a188793eeddff5848b",
+ "914ceee224b244b9ac0492305fb1fb24",
+ "5e394d73c2df4d34b39989cd1b24dc57"
]
},
"id": "cCiAuRqrOkvV",
- "outputId": "394df630-e545-4005-b3a4-82b0341b210b"
+ "outputId": "0a6da048-12e3-41b6-b623-d21cb246030c"
},
"execution_count": 3,
"outputs": [
@@ -4670,7 +4670,7 @@
"application/vnd.jupyter.widget-view+json": {
"version_major": 2,
"version_minor": 0,
- "model_id": "e4bb6f2f32de48d4b1f6d7ecf97ce376"
+ "model_id": "a8e120a9a97d45d59fcf275af25a591e"
}
},
"metadata": {}
@@ -4684,7 +4684,7 @@
"application/vnd.jupyter.widget-view+json": {
"version_major": 2,
"version_minor": 0,
- "model_id": "4084f218fca64fc9b765e04d0cc073ac"
+ "model_id": "564f30aef6c34efa952fdd1402627d13"
}
},
"metadata": {}
@@ -4698,7 +4698,7 @@
"application/vnd.jupyter.widget-view+json": {
"version_major": 2,
"version_minor": 0,
- "model_id": "8cae9c49e18f43248072b5e059429f6d"
+ "model_id": "ae89e755c6e64ab2a3101913d08820ef"
}
},
"metadata": {}
@@ -4719,7 +4719,7 @@
"application/vnd.jupyter.widget-view+json": {
"version_major": 2,
"version_minor": 0,
- "model_id": "ec0f16c3cbb14d9287e148887127219b"
+ "model_id": "db79fbdb9e25432a8f95221cc0bed971"
}
},
"metadata": {}
@@ -4733,7 +4733,7 @@
"application/vnd.jupyter.widget-view+json": {
"version_major": 2,
"version_minor": 0,
- "model_id": "699a1bdf38ca48e2affc3c6bd771852f"
+ "model_id": "6fd330314de74ccc983da44783bcac7d"
}
},
"metadata": {}
@@ -4754,7 +4754,7 @@
"application/vnd.jupyter.widget-view+json": {
"version_major": 2,
"version_minor": 0,
- "model_id": "3c84850ebe3e45d297d3bfa8a12f1b86"
+ "model_id": "99cbe58514e3460398f032b93a57d068"
}
},
"metadata": {}
@@ -4764,14 +4764,14 @@
{
"cell_type": "code",
"source": [
- "dataset['train'][123]"
+ "dataset['train'][0]"
],
"metadata": {
"colab": {
"base_uri": "https://localhost:8080/"
},
"id": "JKFHPko3OnAV",
- "outputId": "423375ec-0be7-431b-8a65-f531df1d94d8"
+ "outputId": "e9aeffd1-9049-48fc-e59c-0ff8c43cd0f4"
},
"execution_count": 4,
"outputs": [
@@ -4779,8 +4779,8 @@
"output_type": "execute_result",
"data": {
"text/plain": [
- "{'sms': 'Todays Voda numbers ending 7548 are selected to receive a $350 award. If you have a match please call 08712300220 quoting claim code 4041 standard rates app\\n',\n",
- " 'label': 1}"
+ "{'sms': 'Go until jurong point, crazy.. Available only in bugis n great world la e buffet... Cine there got amore wat...\\n',\n",
+ " 'label': 0}"
]
},
"metadata": {},
@@ -4791,7 +4791,7 @@
{
"cell_type": "markdown",
"source": [
- "# Modyfikacja datasetu - klasyfikacja zero-shot"
+ "# Przygotowanie datasetu"
],
"metadata": {
"id": "l140vJrgYxPr"
@@ -4803,13 +4803,13 @@
"parsed_dataset = []\n",
"\n",
"for row in dataset['train']:\n",
- " text = \"Answer the question in one word - true if provided text is spam or false, if provided text is not spam.\\n Q: Is this text spam? \\nText: \" + row['sms'] + \"A: \"\n",
+ " text = row['sms'].replace(\"\\n\", \"\")\n",
" new_row = {}\n",
" new_row['sms'] = text\n",
" if row['label'] == 0:\n",
- " new_row['label'] = \"true\"\n",
+ " new_row['label'] = \"False\"\n",
" else:\n",
- " new_row['label'] = \"false\"\n",
+ " new_row['label'] = \"True\"\n",
" parsed_dataset.append(new_row)\n",
"\n",
"parsed_dataset[0]"
@@ -4819,7 +4819,7 @@
"base_uri": "https://localhost:8080/"
},
"id": "1boUF-YiY3_y",
- "outputId": "a7ecfad8-7c97-4de2-8852-80b28ea7c965"
+ "outputId": "d0088428-9014-43bf-e5d1-920042374797"
},
"execution_count": 5,
"outputs": [
@@ -4827,8 +4827,8 @@
"output_type": "execute_result",
"data": {
"text/plain": [
- "{'sms': 'Answer the question in one word - true if provided text is spam or false, if provided text is not spam.\\n Q: Is this text spam? \\nText: Go until jurong point, crazy.. Available only in bugis n great world la e buffet... Cine there got amore wat...\\nA: ',\n",
- " 'label': 'true'}"
+ "{'sms': 'Go until jurong point, crazy.. Available only in bugis n great world la e buffet... Cine there got amore wat...',\n",
+ " 'label': 'False'}"
]
},
"metadata": {},
@@ -4866,54 +4866,54 @@
"base_uri": "https://localhost:8080/",
"height": 145,
"referenced_widgets": [
- "040698c1b4be4adebfe751751a64c11d",
- "11b4ddede4494fe093329c50097b7df5",
- "7986c625c9c34d039fad240333d0da08",
- "b35a6f8e81184f81990a0111cc5c6ca8",
- "2968992398a94adeb626eec2f45a8699",
- "c9f8f67483fb45c8a6b59fceae40fe42",
- "c5a862e7d71c430c865fa87dc21b1f6d",
- "d69171bdd6544c8ab9e96f3f3dfe7f92",
- "9cca59c67c5f452eb1d9e8dd22296968",
- "0f18ab0690ce4bc3b9b7c2f4d10c2049",
- "af26b98c1e3440daa11e104ed1c8b7e4",
- "be9060616d68475ea2e4674f7e460566",
- "264afd978de54dbeaa1b711e4c0b1c07",
- "bbcefda6eea74b8ea8313e4f7167df65",
- "68d85f6957ea4807a1fe7c82c9a7bc06",
- "cdfaf060f34a4d23afe97243d5f4c709",
- "9411023294ab44b284894aebf3f8f589",
- "d8bf78a3d7ea47a9824d6e01e70b0237",
- "b95ece9507db467fad710338bdf29177",
- "34a31746a99c4916b1402a2829e71a98",
- "29b2a7a233a9484c92056034cc70b8ca",
- "c9a72e2599e94e9e9bc2b4912d25877b",
- "2c24af439f3e45db8a0e004686e912ed",
- "dcb13b35232145fd85be1b6e4442cc5a",
- "58037f9984bb414a9c6e56337d86215c",
- "6e9379baaf2049658790e176ca279531",
- "772e39d516cf43fdbb1b3db001d53d77",
- "c08c1e0783324c53b7fc02912fa14af9",
- "9bcdda510c0147178f651b66450b48ac",
- "18ab5e8088e04cdca93df7519156a59f",
- "f502a26154d840b89b5c61a2aae4f827",
- "7beb993a979443dcb93d26ec6e6718c3",
- "62e60fc862054e4d8d0d18cb1957cf6d",
- "bd697213d4fa4c1d9119657c537e78fe",
- "67f9f97815354675bf3bd435f2ed0436",
- "27bd6c78e7f74ff385509e9856c2b8d0",
- "34f670acaa3542eebc8c19018e900ce3",
- "ec2d082874844b6daf8542824bfde1a0",
- "b9df5fc8959447449d873bd17e6696f7",
- "f8489ecaa1a844369bcb427c5f4c95e6",
- "b21e65a9dff040f4a045580d9989ac20",
- "0efa19170c9e4de891e328365543c916",
- "8c6fa802ddd5491581c092e5422bfeab",
- "42cfc2ada7ac408fab39251add66f6ef"
+ "6fb269ceeada49c19adf46819664fa98",
+ "341f67fcddff4a91813fb1331fd63c3e",
+ "33c7a0d0629342288601999a3b11d71c",
+ "87d7f2540c724ba88b6f972049043702",
+ "36111c073ea34489886c767532713233",
+ "c05a5532720d47e39e6cb710617aab67",
+ "458619b05af848fe8f40fac408e4c521",
+ "3cf20c5c605b46e1bc4890769cdeffe3",
+ "15c19b89e55243cc88e77c56895d56b4",
+ "b4dd2e86dd6a4d579f315293d4b0ba21",
+ "60577d05c1ad4acea832bd4e34efa6f4",
+ "4f67d0fe28914c1bb3d1057225c409cd",
+ "f384fc9cd7f2428fad3b6d10ffac7efd",
+ "36838c7736594b1b83f3046c8f0cc265",
+ "b98e34b842054f99ae1ac5f96104321f",
+ "a4ce8092283747e89e730a7e39e64834",
+ "0aa55ed422a94e94b01c117598842a10",
+ "d54619fbb71e441eb90d9c42145ba07b",
+ "da3487b705264da9a8f92254e568b76e",
+ "9f378f21d7804f49ad9f72ccabb4a10b",
+ "ebb15c7aaf1d4b59a2186e2abbea2868",
+ "6510cda1ab33418882a1e6811f826ed4",
+ "0b3c6eb43a5c4644adbc17ee2b06b079",
+ "fcb7ce49c0c14dc4a5dbbd9870334921",
+ "2f58b16a741f4f1d822c71c17a1c5606",
+ "35cbd0d168714ecc9f0c9236b3707d0a",
+ "b9393265011640c493b2bd4de43a4aef",
+ "eaeeca2372be4fe3868d2d3f42839bc2",
+ "079b78ca1493431880754da6fc4ac127",
+ "6c7e4ab3930c4570a05a4e3d9db6782d",
+ "2ae3b00d50f04990b8c1839dfa705dc8",
+ "cfcae44ed5734d7086ecb5028281cf9a",
+ "281ca6dc827f41d3833ba1c60606529d",
+ "bce6a704b2924287b8b9279d791b633b",
+ "b1dae5dc568446b0ba896b3abe3afb49",
+ "29ff3a3e656a489182943da91cd73813",
+ "585cf66f9f3648e0b950ca04eb17cc63",
+ "71e629333d5d4009bc8072b9f12c0cee",
+ "d5438b0c54104ddd99ed097fa65bc21c",
+ "224c2c07bdc5444aaddf46ca6325e681",
+ "197d80f118764b65b29ad5049edd0087",
+ "e0326b59a1334117bbe6ccb06c1f4020",
+ "6fd86b989a354a2696c8b9e880109a95",
+ "2caff09a31ad46f59e717e25462b12d6"
]
},
"id": "q5Jz0E_oPMBr",
- "outputId": "c71131a5-4737-4354-e58f-17aa88116348"
+ "outputId": "b3c09e2f-577b-49e9-8ae7-cc9cede74cc8"
},
"execution_count": 7,
"outputs": [
@@ -4926,7 +4926,7 @@
"application/vnd.jupyter.widget-view+json": {
"version_major": 2,
"version_minor": 0,
- "model_id": "040698c1b4be4adebfe751751a64c11d"
+ "model_id": "6fb269ceeada49c19adf46819664fa98"
}
},
"metadata": {}
@@ -4940,7 +4940,7 @@
"application/vnd.jupyter.widget-view+json": {
"version_major": 2,
"version_minor": 0,
- "model_id": "be9060616d68475ea2e4674f7e460566"
+ "model_id": "4f67d0fe28914c1bb3d1057225c409cd"
}
},
"metadata": {}
@@ -4954,7 +4954,7 @@
"application/vnd.jupyter.widget-view+json": {
"version_major": 2,
"version_minor": 0,
- "model_id": "2c24af439f3e45db8a0e004686e912ed"
+ "model_id": "0b3c6eb43a5c4644adbc17ee2b06b079"
}
},
"metadata": {}
@@ -4968,7 +4968,7 @@
"application/vnd.jupyter.widget-view+json": {
"version_major": 2,
"version_minor": 0,
- "model_id": "bd697213d4fa4c1d9119657c537e78fe"
+ "model_id": "bce6a704b2924287b8b9279d791b633b"
}
},
"metadata": {}
@@ -4979,7 +4979,7 @@
"cell_type": "code",
"source": [
"sms = parsed_dataset[0]['sms']\n",
- "print('Original: \\n', sms)\n",
+ "print('Original: ', sms)\n",
"print('Tokenized: ', tokenizer.tokenize(sms))\n",
"print('Token IDs: ', tokenizer.convert_tokens_to_ids(tokenizer.tokenize(sms)))"
],
@@ -4988,7 +4988,7 @@
"base_uri": "https://localhost:8080/"
},
"id": "dfxJQpoePsvI",
- "outputId": "2ce963db-ed94-467a-e859-fd0515849ee2"
+ "outputId": "00e742fc-45d6-49d8-b5a5-f42f7c8f5037"
},
"execution_count": 8,
"outputs": [
@@ -4996,13 +4996,9 @@
"output_type": "stream",
"name": "stdout",
"text": [
- "Original: \n",
- " Answer the question in one word - true if provided text is spam or false, if provided text is not spam.\n",
- " Q: Is this text spam? \n",
- "Text: Go until jurong point, crazy.. Available only in bugis n great world la e buffet... Cine there got amore wat...\n",
- "A: \n",
- "Tokenized: ['▁Answer', '▁the', '▁question', '▁in', '▁one', '▁word', '▁', '-', '▁true', '▁', 'if', '▁provided', '▁text', '▁is', '▁spam', '▁or', '▁false', ',', '▁', 'if', '▁provided', '▁text', '▁is', '▁not', '▁spam', '.', '▁Q', ':', '▁I', 's', '▁this', '▁text', '▁spam', '?', '▁Text', ':', '▁Go', '▁until', '▁jur', 'ong', '▁point', ',', '▁crazy', '.', '.', '▁Available', '▁only', '▁in', '▁bug', 'is', '▁', 'n', '▁great', '▁world', '▁la', '▁', 'e', '▁buffet', '...', '▁Cine', '▁there', '▁got', '▁', 'a', 'more', '▁wa', 't', '...', '▁A', ':', '▁']\n",
- "Token IDs: [11801, 8, 822, 16, 80, 1448, 3, 18, 1176, 3, 99, 937, 1499, 19, 13655, 42, 6136, 6, 3, 99, 937, 1499, 19, 59, 13655, 5, 1593, 10, 27, 7, 48, 1499, 13655, 58, 5027, 10, 1263, 552, 10081, 2444, 500, 6, 6139, 5, 5, 8144, 163, 16, 8143, 159, 3, 29, 248, 296, 50, 3, 15, 15385, 233, 17270, 132, 530, 3, 9, 3706, 8036, 17, 233, 71, 10, 3]\n"
+ "Original: Go until jurong point, crazy.. Available only in bugis n great world la e buffet... Cine there got amore wat...\n",
+ "Tokenized: ['▁Go', '▁until', '▁jur', 'ong', '▁point', ',', '▁crazy', '.', '.', '▁Available', '▁only', '▁in', '▁bug', 'is', '▁', 'n', '▁great', '▁world', '▁la', '▁', 'e', '▁buffet', '...', '▁Cine', '▁there', '▁got', '▁', 'a', 'more', '▁wa', 't', '...']\n",
+ "Token IDs: [1263, 552, 10081, 2444, 500, 6, 6139, 5, 5, 8144, 163, 16, 8143, 159, 3, 29, 248, 296, 50, 3, 15, 15385, 233, 17270, 132, 530, 3, 9, 3706, 8036, 17, 233]\n"
]
}
]
@@ -5010,7 +5006,7 @@
{
"cell_type": "markdown",
"source": [
- "# Check maximum lenght of a sentence"
+ "# Few shot learning"
],
"metadata": {
"id": "UpluhM8cU5Ir"
@@ -5019,28 +5015,28 @@
{
"cell_type": "code",
"source": [
- "max_len = 0\n",
- "\n",
- "for sentence in parsed_dataset:\n",
- " input_ids = tokenizer.encode(sentence['sms'], add_special_tokens=True)\n",
- " max_len = max(max_len, len(input_ids))\n",
- "\n",
- "print('Max sentence length: ', max_len)"
+ "print(parsed_dataset[0]) #0\n",
+ "print(parsed_dataset[123]) #1\n",
+ "print(parsed_dataset[2000]) #0\n",
+ "print(parsed_dataset[3002]) #1"
],
"metadata": {
"colab": {
"base_uri": "https://localhost:8080/"
},
"id": "7uNUkixPU85O",
- "outputId": "352b31bb-164e-42a8-a8b0-6be9d3eca0c4"
+ "outputId": "9c2c8ef6-30c3-4043-b1a8-f33715d10334"
},
- "execution_count": 12,
+ "execution_count": 9,
"outputs": [
{
"output_type": "stream",
"name": "stdout",
"text": [
- "Max sentence length: 377\n"
+ "{'sms': 'Go until jurong point, crazy.. Available only in bugis n great world la e buffet... Cine there got amore wat...', 'label': 'False'}\n",
+ "{'sms': 'Todays Voda numbers ending 7548 are selected to receive a $350 award. If you have a match please call 08712300220 quoting claim code 4041 standard rates app', 'label': 'True'}\n",
+ "{'sms': \"LMAO where's your fish memory when I need it?\", 'label': 'False'}\n",
+ "{'sms': 'This message is free. Welcome to the new & improved Sex & Dogging club! To unsubscribe from this service reply STOP. msgs@150p 18+only', 'label': 'True'}\n"
]
}
]
@@ -5048,285 +5044,40 @@
{
"cell_type": "code",
"source": [
- "max_label_len = 0\n",
+ "non_spam_1 = \"SMS: \" + parsed_dataset[0]['sms'] + \"\\nSpam: False\\n\\n\"\n",
+ "spam_1 = \"SMS: \" + parsed_dataset[123]['sms'] + \"\\nSpam: True\\n\\n\"\n",
+ "non_spam_2 = \"SMS: \" + parsed_dataset[2000]['sms'] + \"\\nSpam: False\\n\\n\"\n",
+ "spam_2 = \"SMS: \" + parsed_dataset[3002]['sms'] + \"\\nSpam: True\\n\\n\"\n",
"\n",
- "for sentence in parsed_dataset:\n",
- " input_ids = tokenizer.encode(sentence['label'], add_special_tokens=True)\n",
- " max_label_len = max(max_label_len, len(input_ids))\n",
- "\n",
- "print('Max sentence length: ', max_label_len)"
+ "few_shot_prefix = non_spam_1 + spam_1 + non_spam_2 + spam_2 + \"SMS: \"\n",
+ "print(few_shot_prefix)"
],
"metadata": {
"colab": {
"base_uri": "https://localhost:8080/"
},
"id": "lj0issBznZfK",
- "outputId": "53defde8-ed8d-4927-add4-5d7d63f737df"
+ "outputId": "a8aa4038-4145-4950-9d9f-91593a550d12"
},
- "execution_count": 13,
+ "execution_count": 10,
"outputs": [
{
"output_type": "stream",
"name": "stdout",
"text": [
- "Max sentence length: 2\n"
- ]
- }
- ]
- },
- {
- "cell_type": "markdown",
- "source": [
- "# Pre train tokenization"
- ],
- "metadata": {
- "id": "nfw62HdgSERb"
- }
- },
- {
- "cell_type": "code",
- "source": [
- "import torch"
- ],
- "metadata": {
- "id": "KTXYalS1VLqH"
- },
- "execution_count": 11,
- "outputs": []
- },
- {
- "cell_type": "code",
- "source": [
- "input_ids = []\n",
- "target_ids = []\n",
- "attention_masks = []\n",
- "\n",
- "for sentence in parsed_dataset:\n",
- " encoded_dict = tokenizer.encode_plus(\n",
- " sentence['sms'],\n",
- " add_special_tokens = True,\n",
- " max_length = 380,\n",
- " padding = 'max_length',\n",
- " truncation=True,\n",
- " return_attention_mask = True,\n",
- " return_tensors = 'pt',\n",
- " )\n",
- " \n",
- " encoded_target_dict = tokenizer.encode_plus(\n",
- " sentence['label'],\n",
- " add_special_tokens = True,\n",
- " max_length = 2,\n",
- " padding = 'max_length',\n",
- " truncation=True,\n",
- " return_attention_mask = True,\n",
- " return_tensors = 'pt',\n",
- " )\n",
- " \n",
- " input_ids.append(encoded_dict['input_ids'])\n",
- " target_ids.append(encoded_target_dict['input_ids'])\n",
- " attention_masks.append(encoded_dict['attention_mask'])\n",
- "\n",
- "input_ids = torch.cat(input_ids, dim=0)\n",
- "target_ids = torch.cat(target_ids, dim=0)\n",
- "attention_masks = torch.cat(attention_masks, dim=0)\n",
- "\n",
- "print('Original: ', parsed_dataset[0])\n",
- "print('Token IDs:', input_ids[0])\n",
- "print('Label token IDs:', target_ids[0])"
- ],
- "metadata": {
- "colab": {
- "base_uri": "https://localhost:8080/"
- },
- "id": "Z28QYfLnSGxR",
- "outputId": "eb9d48d0-cb2d-4596-c752-14b18f6e3590"
- },
- "execution_count": 14,
- "outputs": [
- {
- "output_type": "stream",
- "name": "stdout",
- "text": [
- "Original: {'sms': 'Answer the question in one word - true if provided text is spam or false, if provided text is not spam.\\n Q: Is this text spam? \\nText: Go until jurong point, crazy.. Available only in bugis n great world la e buffet... Cine there got amore wat...\\nA: ', 'label': 'true'}\n",
- "Token IDs: tensor([11801, 8, 822, 16, 80, 1448, 3, 18, 1176, 3,\n",
- " 99, 937, 1499, 19, 13655, 42, 6136, 6, 3, 99,\n",
- " 937, 1499, 19, 59, 13655, 5, 1593, 10, 27, 7,\n",
- " 48, 1499, 13655, 58, 5027, 10, 1263, 552, 10081, 2444,\n",
- " 500, 6, 6139, 5, 5, 8144, 163, 16, 8143, 159,\n",
- " 3, 29, 248, 296, 50, 3, 15, 15385, 233, 17270,\n",
- " 132, 530, 3, 9, 3706, 8036, 17, 233, 71, 10,\n",
- " 3, 1, 0, 0, 0, 0, 0, 0, 0, 0,\n",
- " 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,\n",
- " 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,\n",
- " 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,\n",
- " 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,\n",
- " 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,\n",
- " 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,\n",
- " 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,\n",
- " 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,\n",
- " 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,\n",
- " 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,\n",
- " 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,\n",
- " 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,\n",
- " 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,\n",
- " 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,\n",
- " 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,\n",
- " 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,\n",
- " 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,\n",
- " 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,\n",
- " 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,\n",
- " 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,\n",
- " 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,\n",
- " 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,\n",
- " 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,\n",
- " 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,\n",
- " 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,\n",
- " 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,\n",
- " 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,\n",
- " 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,\n",
- " 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,\n",
- " 0, 0, 0, 0, 0, 0, 0, 0, 0, 0])\n",
- "Label token IDs: tensor([1176, 1])\n"
- ]
- }
- ]
- },
- {
- "cell_type": "markdown",
- "source": [
- "# Split dataset"
- ],
- "metadata": {
- "id": "qD_t0y0KVVSy"
- }
- },
- {
- "cell_type": "code",
- "source": [
- "from torch.utils.data import TensorDataset, random_split"
- ],
- "metadata": {
- "id": "vN_SatRIVa4c"
- },
- "execution_count": 15,
- "outputs": []
- },
- {
- "cell_type": "code",
- "source": [
- "dataset = TensorDataset(input_ids, attention_masks, target_ids)\n",
- "\n",
- "test_size = 1000\n",
- "dataset_len = len(dataset)\n",
- "train_size = int(0.9 * (dataset_len-test_size))\n",
- "val_size = (dataset_len-test_size) - train_size\n",
- "\n",
- "test_dataset, train_dataset, val_dataset = random_split(dataset, [test_size, train_size, val_size])\n",
- "\n",
- "print('{:>5,} test samples'.format(test_size))\n",
- "print('{:>5,} training samples'.format(train_size))\n",
- "print('{:>5,} validation samples'.format(val_size))"
- ],
- "metadata": {
- "colab": {
- "base_uri": "https://localhost:8080/"
- },
- "id": "Mm6vc6lLVW3l",
- "outputId": "023efb5b-eab3-4675-9900-3918aedae90f"
- },
- "execution_count": 16,
- "outputs": [
- {
- "output_type": "stream",
- "name": "stdout",
- "text": [
- "1,000 test samples\n",
- "4,116 training samples\n",
- " 458 validation samples\n"
- ]
- }
- ]
- },
- {
- "cell_type": "markdown",
- "source": [
- "# Create train and validation loaders"
- ],
- "metadata": {
- "id": "bmgQOP4EVfA1"
- }
- },
- {
- "cell_type": "code",
- "source": [
- "from torch.utils.data import DataLoader, RandomSampler, SequentialSampler"
- ],
- "metadata": {
- "id": "CxnQ3cmIVlNh"
- },
- "execution_count": 17,
- "outputs": []
- },
- {
- "cell_type": "code",
- "source": [
- "batch_size = 8\n",
- "\n",
- "train_dataloader = DataLoader(\n",
- " train_dataset,\n",
- " sampler = RandomSampler(train_dataset),\n",
- " batch_size = batch_size\n",
- " )\n",
- "\n",
- "validation_dataloader = DataLoader(\n",
- " val_dataset,\n",
- " sampler = SequentialSampler(val_dataset),\n",
- " batch_size = batch_size\n",
- " )"
- ],
- "metadata": {
- "id": "0hcpO_onVjEC"
- },
- "execution_count": 18,
- "outputs": []
- },
- {
- "cell_type": "markdown",
- "source": [
- "# Device check"
- ],
- "metadata": {
- "id": "efwhqLyyVu9z"
- }
- },
- {
- "cell_type": "code",
- "source": [
- "if torch.cuda.is_available(): \n",
- " device = torch.device(\"cuda\")\n",
- "\n",
- " print('There are %d GPU(s) available.' % torch.cuda.device_count())\n",
- " print('We will use the GPU:', torch.cuda.get_device_name(0))\n",
- "\n",
- "else:\n",
- " print('No GPU available, using the CPU instead.')\n",
- " device = torch.device(\"cpu\")"
- ],
- "metadata": {
- "colab": {
- "base_uri": "https://localhost:8080/"
- },
- "id": "ANBCfNGnVwVk",
- "outputId": "6192e88f-5e61-4de6-b476-de9a6e3a59a6"
- },
- "execution_count": 19,
- "outputs": [
- {
- "output_type": "stream",
- "name": "stdout",
- "text": [
- "There are 1 GPU(s) available.\n",
- "We will use the GPU: Tesla T4\n"
+ "SMS: Go until jurong point, crazy.. Available only in bugis n great world la e buffet... Cine there got amore wat...\n",
+ "Spam: False\n",
+ "\n",
+ "SMS: Todays Voda numbers ending 7548 are selected to receive a $350 award. If you have a match please call 08712300220 quoting claim code 4041 standard rates app\n",
+ "Spam: True\n",
+ "\n",
+ "SMS: LMAO where's your fish memory when I need it?\n",
+ "Spam: False\n",
+ "\n",
+ "SMS: This message is free. Welcome to the new & improved Sex & Dogging club! To unsubscribe from this service reply STOP. msgs@150p 18+only\n",
+ "Spam: True\n",
+ "\n",
+ "SMS: \n"
]
}
]
@@ -5348,7 +5099,7 @@
"metadata": {
"id": "Eu-7Eed8WgN0"
},
- "execution_count": 20,
+ "execution_count": 11,
"outputs": []
},
{
@@ -5363,45 +5114,45 @@
"base_uri": "https://localhost:8080/",
"height": 1000,
"referenced_widgets": [
- "3747d0aa68d642449ff32b7efd47d497",
- "2a84ccf3660a4e24b37bfc1d952f06d9",
- "43b98452768846eb9b773839a4681cc6",
- "2dfbcef644a84b558ce99b2ddaf091b6",
- "9dd02373a1994433a49e0015b76dd858",
- "42a620dfccb4416c95fbd7a76637dc73",
- "9d953b41e24c4263b18e1ff2174eb797",
- "cb409960af114fa690bac72c1d51d2ab",
- "995a94c35b4c441b86598d1976281711",
- "4ea2ccb5fa264dd5a042f570c22db7de",
- "4d5668e5b66d4993b935b077a1dc281c",
- "cf36c750119449e8a16aa97a9b66a124",
- "0de691bf20804830ba5e6710c205c9ac",
- "7ee532c002784554b12fede964c6c05a",
- "25e5c76c84a8414495b61663250825aa",
- "12bd0cd379754967bfd5481d5836b7a4",
- "d55d326ffbdc420da0a399c141f7fb56",
- "092323b59b734eada8d88197d9f0eb72",
- "622df288b2ae4f62b776cb101de18b9f",
- "c72abd216b9444ef9bdb0f8a0a6771b0",
- "03d5f2402e464b7cb5244db0f824df1d",
- "4a6e196f590d4b329e0edefc910d4730",
- "9a04f6723e2a40288eb42eea0134dfaf",
- "4065d0eed87e4d268de8f4536287e225",
- "bebca147a83446abaf19c3e3db11744e",
- "cf525a599ca245b19204bfff3fa1bd11",
- "b60759f0730343849ef3e51d2c8be38c",
- "dcc795e3fac0401b9a4d2aac3bd6e8cc",
- "ed7ca6da408842b38a466097ec9d4616",
- "0335f29f40564adf9b577707dfb40aa9",
- "a200da1478fa46a19695a5b2f2c77fd1",
- "e21e75bbbc4149b4ac85fece44aee355",
- "c014c271cd374f62a0d113efca14001a"
+ "8e60f2b1a9f7455db02eb846af52df63",
+ "71ff180cc81a4376b6a27455ed5cba26",
+ "4dc7c026d3e5469da3ada03bf77d7019",
+ "279308acf5be418ab7f25c3501739c9d",
+ "5c4c0f7bfb6c4a518cdfd3f1d70e77d5",
+ "7182f8c40174456db2d6f974e1a672a9",
+ "f34bf1f4156b4dec8990f16cbceccb00",
+ "bcf3f636355347338e1d57c191e2349f",
+ "e36598bd61874b4eb737d248df7c1212",
+ "f9c113d3c4f64aee969c897451b4522e",
+ "fc647c0c0bd14b87b59d539db3793d0a",
+ "3fcb6b4a0c454d59a6d5503cec84ba37",
+ "17d4993dc58949ca87a852e7e6c02e0c",
+ "db24a85aa3e24a2c9275b9aa4ac78faa",
+ "48a5bb74641a4a2fba370c0ddad1f6cb",
+ "1b0971b224444e2c8ddbf817f2f02131",
+ "07c9e3207eb04c5fb004744c3e4eb3b2",
+ "957e7a116bad4dee93ab449d7766d8ba",
+ "1a2ed54b1c584fa3bd2e0517a878790f",
+ "444add600a24462aa2272f2758ddb99d",
+ "98a9c4dc9bf349d1a8cf985c6a132530",
+ "4d94cb68eed54ffd97cc8272f70a92f3",
+ "c2a8099dd85e42599911991b467a7afe",
+ "72d0effc5d0948378103da4b2c8da5ae",
+ "cf3ac6e0e69643639d6b0a2577fff71a",
+ "d8f4949af74342d3b72200484ee3f1fb",
+ "ff42d87d84694bb2a6a7e63e43750029",
+ "ae619521ac64447b91b9fb26c46e696a",
+ "62a20c9c11f4452389dfdde24fa90d03",
+ "cb94c6469891495db93c332e2b707299",
+ "4e0b6f1f2b2f497d9b6e0183b0bc7ade",
+ "999d0e74507b4acfae447018abb03323",
+ "eaa726bb3b9d45d29c011053e844a97e"
]
},
"id": "JKv9O8kfV2zZ",
- "outputId": "6893e79a-48f7-4713-c4a4-a9558acbcf7c"
+ "outputId": "c902fc89-7c47-4eca-da89-411bc5b5e501"
},
- "execution_count": 21,
+ "execution_count": 12,
"outputs": [
{
"output_type": "display_data",
@@ -5412,7 +5163,7 @@
"application/vnd.jupyter.widget-view+json": {
"version_major": 2,
"version_minor": 0,
- "model_id": "3747d0aa68d642449ff32b7efd47d497"
+ "model_id": "8e60f2b1a9f7455db02eb846af52df63"
}
},
"metadata": {}
@@ -5426,7 +5177,7 @@
"application/vnd.jupyter.widget-view+json": {
"version_major": 2,
"version_minor": 0,
- "model_id": "cf36c750119449e8a16aa97a9b66a124"
+ "model_id": "3fcb6b4a0c454d59a6d5503cec84ba37"
}
},
"metadata": {}
@@ -5440,7 +5191,7 @@
"application/vnd.jupyter.widget-view+json": {
"version_major": 2,
"version_minor": 0,
- "model_id": "9a04f6723e2a40288eb42eea0134dfaf"
+ "model_id": "c2a8099dd85e42599911991b467a7afe"
}
},
"metadata": {}
@@ -6192,7 +5943,7 @@
]
},
"metadata": {},
- "execution_count": 21
+ "execution_count": 12
}
]
},
@@ -6208,13 +5959,12 @@
{
"cell_type": "code",
"source": [
- "import datetime\n",
- "import numpy as np"
+ "import torch"
],
"metadata": {
- "id": "s-q6_F38bLVA"
+ "id": "rdWMg_KJZEZH"
},
- "execution_count": 22,
+ "execution_count": 13,
"outputs": []
},
{
@@ -6230,360 +5980,42 @@
" else:\n",
" results_false += 1.0\n",
"\n",
- " return results_ok / (results_ok + results_false)\n",
- "\n",
- "def format_time(elapsed):\n",
- " '''\n",
- " Takes a time in seconds and returns a string hh:mm:ss\n",
- " '''\n",
- " elapsed_rounded = int(round((elapsed)))\n",
- " return str(datetime.timedelta(seconds=elapsed_rounded))"
+ " return results_ok / (results_ok + results_false)"
],
"metadata": {
"id": "FzUi8908ax61"
},
- "execution_count": 23,
- "outputs": []
- },
- {
- "cell_type": "markdown",
- "source": [
- "# Init training"
- ],
- "metadata": {
- "id": "ucChBa-9bXJy"
- }
- },
- {
- "cell_type": "code",
- "source": [
- "from transformers import get_linear_schedule_with_warmup"
- ],
- "metadata": {
- "id": "c9e7rbGwbdEp"
- },
- "execution_count": 24,
+ "execution_count": 14,
"outputs": []
},
{
"cell_type": "code",
"source": [
- "optimizer = torch.optim.AdamW(model.parameters(),\n",
- " lr = 3e-4,\n",
- " eps = 1e-8\n",
- " )\n",
+ "if torch.cuda.is_available(): \n",
+ " device = torch.device(\"cuda\")\n",
"\n",
- "epochs = 4\n",
+ " print('There are %d GPU(s) available.' % torch.cuda.device_count())\n",
+ " print('We will use the GPU:', torch.cuda.get_device_name(0))\n",
"\n",
- "total_steps = len(train_dataloader) * epochs\n",
- "\n",
- "scheduler = get_linear_schedule_with_warmup(optimizer, \n",
- " num_warmup_steps = 0,\n",
- " num_training_steps = total_steps)"
- ],
- "metadata": {
- "id": "A7XUF4PNbYy8"
- },
- "execution_count": 25,
- "outputs": []
- },
- {
- "cell_type": "markdown",
- "source": [
- "# Training"
- ],
- "metadata": {
- "id": "DAzQWODja0A3"
- }
- },
- {
- "cell_type": "code",
- "source": [
- "import random\n",
- "import time"
- ],
- "metadata": {
- "id": "Hoa7NlU0bI7G"
- },
- "execution_count": 26,
- "outputs": []
- },
- {
- "cell_type": "code",
- "source": [
- "# This training code is based on the `run_glue.py` script here:\n",
- "# https://github.com/huggingface/transformers/blob/5bfcd0485ece086ebcbed2d008813037968a9e58/examples/run_glue.py#L128\n",
- "\n",
- "seed_val = 42\n",
- "\n",
- "random.seed(seed_val)\n",
- "np.random.seed(seed_val)\n",
- "torch.manual_seed(seed_val)\n",
- "torch.cuda.manual_seed_all(seed_val)\n",
- "\n",
- "training_stats = []\n",
- "total_t0 = time.time()\n",
- "\n",
- "for epoch_i in range(0, epochs):\n",
- " \n",
- " # ========================================\n",
- " # Training\n",
- " # ========================================\n",
- "\n",
- " print(\"\")\n",
- " print('======== Epoch {:} / {:} ========'.format(epoch_i + 1, epochs))\n",
- " print('Training...')\n",
- "\n",
- " t0 = time.time()\n",
- "\n",
- " total_train_loss = 0\n",
- " total_train_acc = 0\n",
- "\n",
- " model.train()\n",
- "\n",
- " for step, batch in enumerate(train_dataloader):\n",
- " if step % 40 == 0 and not step == 0:\n",
- " elapsed = format_time(time.time() - t0)\n",
- " print(' Batch {:>5,} of {:>5,}. Elapsed: {:}.'.format(step, len(train_dataloader), elapsed))\n",
- "\n",
- "\n",
- " b_input_ids = batch[0].to(device)\n",
- " b_input_mask = batch[1].to(device)\n",
- "\n",
- " y = batch[2].to(device)\n",
- " y_ids = y[:, :-1].contiguous()\n",
- " lm_labels = y[:, 1:].clone().detach()\n",
- " lm_labels[y[:, 1:] == tokenizer.pad_token_id] = -100\n",
- "\n",
- " model.zero_grad() \n",
- "\n",
- " outputs = model(\n",
- " input_ids=b_input_ids,\n",
- " attention_mask=b_input_mask,\n",
- " decoder_input_ids=y_ids,\n",
- " labels=lm_labels\n",
- " )\n",
- "\n",
- " generated_ids = model.generate(\n",
- " input_ids = b_input_ids,\n",
- " attention_mask = b_input_mask, \n",
- " max_length=2, \n",
- " num_beams=2,\n",
- " repetition_penalty=2.5, \n",
- " length_penalty=1.0, \n",
- " early_stopping=True\n",
- " )\n",
- "\n",
- " preds = [tokenizer.decode(g, skip_special_tokens=True, clean_up_tokenization_spaces=True) for g in generated_ids]\n",
- " target = [tokenizer.decode(t, skip_special_tokens=True, clean_up_tokenization_spaces=True) for t in y]\n",
- " total_train_acc += calculate_accuracy(preds, target) \n",
- "\n",
- " loss = outputs['loss']\n",
- " total_train_loss += loss.item()\n",
- "\n",
- " loss.backward()\n",
- " torch.nn.utils.clip_grad_norm_(model.parameters(), 1.0)\n",
- "\n",
- " optimizer.step()\n",
- " scheduler.step()\n",
- "\n",
- " avg_train_loss = total_train_loss / len(train_dataloader) \n",
- " avg_train_acc = total_train_acc / len(train_dataloader) \n",
- " \n",
- " training_time = format_time(time.time() - t0)\n",
- "\n",
- " print(\"\")\n",
- " print(\" Average training loss: {0:.2f}\".format(avg_train_loss))\n",
- " print(\" Average training acc: {0:.2f}\".format(avg_train_acc))\n",
- " print(\" Training epcoh took: {:}\".format(training_time))\n",
- " \n",
- " # ========================================\n",
- " # Validation\n",
- " # ========================================\n",
- "\n",
- " print(\"\")\n",
- " print(\"Running Validation...\")\n",
- "\n",
- " t0 = time.time()\n",
- " model.eval()\n",
- "\n",
- " total_eval_loss = 0\n",
- " total_eval_accuracy = 0\n",
- "\n",
- " for batch in validation_dataloader:\n",
- "\n",
- " b_input_ids = batch[0].to(device)\n",
- " b_input_mask = batch[1].to(device)\n",
- "\n",
- " y = batch[2].to(device)\n",
- " y_ids = y[:, :-1].contiguous()\n",
- " lm_labels = y[:, 1:].clone().detach()\n",
- " lm_labels[y[:, 1:] == tokenizer.pad_token_id] = -100\n",
- " \n",
- " with torch.no_grad(): \n",
- "\n",
- " outputs = model(\n",
- " input_ids=b_input_ids,\n",
- " attention_mask=b_input_mask,\n",
- " decoder_input_ids=y_ids,\n",
- " labels=lm_labels\n",
- " )\n",
- "\n",
- " loss = outputs['loss']\n",
- " total_eval_loss += loss.item()\n",
- "\n",
- " generated_ids = model.generate(\n",
- " input_ids = b_input_ids,\n",
- " attention_mask = b_input_mask, \n",
- " max_length=2, \n",
- " num_beams=2,\n",
- " repetition_penalty=2.5, \n",
- " length_penalty=1.0, \n",
- " early_stopping=True\n",
- " )\n",
- "\n",
- " preds = [tokenizer.decode(g, skip_special_tokens=True, clean_up_tokenization_spaces=True) for g in generated_ids]\n",
- " target = [tokenizer.decode(t, skip_special_tokens=True, clean_up_tokenization_spaces=True) for t in y]\n",
- " total_eval_accuracy += calculate_accuracy(preds, target) \n",
- "\n",
- " avg_val_loss = total_eval_loss / len(validation_dataloader)\n",
- "\n",
- " avg_val_accuracy = total_eval_accuracy / len(validation_dataloader)\n",
- " print(\" Accuracy: {0:.2f}\".format(avg_val_accuracy))\n",
- " \n",
- " validation_time = format_time(time.time() - t0)\n",
- " print(\" Validation took: {:}\".format(validation_time))\n",
- " print(\" Validation Loss: {0:.2f}\".format(avg_val_loss))\n",
- "\n",
- " training_stats.append(\n",
- " {\n",
- " 'epoch': epoch_i + 1,\n",
- " 'Training Loss': avg_train_loss,\n",
- " 'Training Accur.': avg_train_acc,\n",
- " 'Valid. Loss': avg_val_loss,\n",
- " 'Valid. Accur.': avg_val_accuracy,\n",
- " 'Training Time': training_time,\n",
- " 'Validation Time': validation_time\n",
- " }\n",
- " )\n",
- "\n",
- "print(\"\")\n",
- "print(\"Training complete!\")\n",
- "\n",
- "print(\"Total training took {:} (h:mm:ss)\".format(format_time(time.time()-total_t0)))"
+ "else:\n",
+ " print('No GPU available, using the CPU instead.')\n",
+ " device = torch.device(\"cpu\")"
],
"metadata": {
"colab": {
"base_uri": "https://localhost:8080/"
},
- "id": "xsHxfslka1u5",
- "outputId": "28c30ee0-6f41-4ede-eb3a-eebd4269c332"
+ "id": "86i7iRmtW-6L",
+ "outputId": "109072a9-ff0c-4ac0-fc74-4de30065af95"
},
- "execution_count": 27,
+ "execution_count": 15,
"outputs": [
{
"output_type": "stream",
"name": "stdout",
"text": [
- "\n",
- "======== Epoch 1 / 4 ========\n",
- "Training...\n",
- " Batch 40 of 515. Elapsed: 0:00:46.\n",
- " Batch 80 of 515. Elapsed: 0:01:30.\n",
- " Batch 120 of 515. Elapsed: 0:02:14.\n",
- " Batch 160 of 515. Elapsed: 0:02:59.\n",
- " Batch 200 of 515. Elapsed: 0:03:44.\n",
- " Batch 240 of 515. Elapsed: 0:04:28.\n",
- " Batch 280 of 515. Elapsed: 0:05:13.\n",
- " Batch 320 of 515. Elapsed: 0:05:57.\n",
- " Batch 360 of 515. Elapsed: 0:06:42.\n",
- " Batch 400 of 515. Elapsed: 0:07:26.\n",
- " Batch 440 of 515. Elapsed: 0:08:11.\n",
- " Batch 480 of 515. Elapsed: 0:08:55.\n",
- "\n",
- " Average training loss: 0.01\n",
- " Average training acc: 0.59\n",
- " Training epcoh took: 0:09:34\n",
- "\n",
- "Running Validation...\n",
- " Accuracy: 0.47\n",
- " Validation took: 0:00:31\n",
- " Validation Loss: 0.00\n",
- "\n",
- "======== Epoch 2 / 4 ========\n",
- "Training...\n",
- " Batch 40 of 515. Elapsed: 0:00:44.\n",
- " Batch 80 of 515. Elapsed: 0:01:29.\n",
- " Batch 120 of 515. Elapsed: 0:02:13.\n",
- " Batch 160 of 515. Elapsed: 0:02:58.\n",
- " Batch 200 of 515. Elapsed: 0:03:42.\n",
- " Batch 240 of 515. Elapsed: 0:04:27.\n",
- " Batch 280 of 515. Elapsed: 0:05:11.\n",
- " Batch 320 of 515. Elapsed: 0:05:56.\n",
- " Batch 360 of 515. Elapsed: 0:06:40.\n",
- " Batch 400 of 515. Elapsed: 0:07:25.\n",
- " Batch 440 of 515. Elapsed: 0:08:09.\n",
- " Batch 480 of 515. Elapsed: 0:08:54.\n",
- "\n",
- " Average training loss: 0.00\n",
- " Average training acc: 0.59\n",
- " Training epcoh took: 0:09:32\n",
- "\n",
- "Running Validation...\n",
- " Accuracy: 0.46\n",
- " Validation took: 0:00:31\n",
- " Validation Loss: 0.00\n",
- "\n",
- "======== Epoch 3 / 4 ========\n",
- "Training...\n",
- " Batch 40 of 515. Elapsed: 0:00:44.\n",
- " Batch 80 of 515. Elapsed: 0:01:34.\n",
- " Batch 120 of 515. Elapsed: 0:02:20.\n",
- " Batch 160 of 515. Elapsed: 0:03:05.\n",
- " Batch 200 of 515. Elapsed: 0:03:49.\n",
- " Batch 240 of 515. Elapsed: 0:04:34.\n",
- " Batch 280 of 515. Elapsed: 0:05:18.\n",
- " Batch 320 of 515. Elapsed: 0:06:03.\n",
- " Batch 360 of 515. Elapsed: 0:06:47.\n",
- " Batch 400 of 515. Elapsed: 0:07:32.\n",
- " Batch 440 of 515. Elapsed: 0:08:16.\n",
- " Batch 480 of 515. Elapsed: 0:09:00.\n",
- "\n",
- " Average training loss: 0.00\n",
- " Average training acc: 0.59\n",
- " Training epcoh took: 0:09:39\n",
- "\n",
- "Running Validation...\n",
- " Accuracy: 0.46\n",
- " Validation took: 0:00:31\n",
- " Validation Loss: 0.00\n",
- "\n",
- "======== Epoch 4 / 4 ========\n",
- "Training...\n",
- " Batch 40 of 515. Elapsed: 0:00:45.\n",
- " Batch 80 of 515. Elapsed: 0:01:29.\n",
- " Batch 120 of 515. Elapsed: 0:02:14.\n",
- " Batch 160 of 515. Elapsed: 0:02:58.\n",
- " Batch 200 of 515. Elapsed: 0:03:42.\n",
- " Batch 240 of 515. Elapsed: 0:04:27.\n",
- " Batch 280 of 515. Elapsed: 0:05:11.\n",
- " Batch 320 of 515. Elapsed: 0:05:56.\n",
- " Batch 360 of 515. Elapsed: 0:06:40.\n",
- " Batch 400 of 515. Elapsed: 0:07:24.\n",
- " Batch 440 of 515. Elapsed: 0:08:09.\n",
- " Batch 480 of 515. Elapsed: 0:08:53.\n",
- "\n",
- " Average training loss: 0.00\n",
- " Average training acc: 0.58\n",
- " Training epcoh took: 0:09:32\n",
- "\n",
- "Running Validation...\n",
- " Accuracy: 0.46\n",
- " Validation took: 0:00:31\n",
- " Validation Loss: 0.00\n",
- "\n",
- "Training complete!\n",
- "Total training took 0:40:22 (h:mm:ss)\n"
+ "There are 1 GPU(s) available.\n",
+ "We will use the GPU: Tesla T4\n"
]
}
]
@@ -6591,341 +6023,46 @@
{
"cell_type": "markdown",
"source": [
- "# Train summary"
+ "# Predykcja"
],
"metadata": {
- "id": "xIpFPoRb91Or"
+ "id": "H_YI3bS3VHQE"
}
},
{
"cell_type": "code",
"source": [
- "import pandas as pd\n",
+ "parsed_dataset = parsed_dataset[1:123] + parsed_dataset[124:2000] + parsed_dataset[2001:3002] + parsed_dataset[3003:]\n",
+ "predictions = []\n",
+ "expected = []\n",
"\n",
- "pd.set_option('precision', 2)\n",
- "df_stats = pd.DataFrame(data=training_stats)\n",
+ "for row in parsed_dataset:\n",
+ " input_text = few_shot_prefix + row['sms'] + \"\\nSpam: \"\n",
+ " input_ids = tokenizer(input_text, return_tensors=\"pt\").input_ids.to(device)\n",
"\n",
- "df_stats = df_stats.set_index('epoch')\n",
- "df_stats"
- ],
- "metadata": {
- "colab": {
- "base_uri": "https://localhost:8080/",
- "height": 206
- },
- "id": "GjYqBrrO93Oh",
- "outputId": "0087ee68-c017-41fd-db84-ca6e0d25fb12"
- },
- "execution_count": 28,
- "outputs": [
- {
- "output_type": "execute_result",
- "data": {
- "text/plain": [
- " Training Loss Training Accur. Valid. Loss Valid. Accur. \\\n",
- "epoch \n",
- "1 5.27e-03 0.59 0.0 0.47 \n",
- "2 2.74e-08 0.59 0.0 0.46 \n",
- "3 1.58e-08 0.59 0.0 0.46 \n",
- "4 1.55e-08 0.58 0.0 0.46 \n",
- "\n",
- " Training Time Validation Time \n",
- "epoch \n",
- "1 0:09:34 0:00:31 \n",
- "2 0:09:32 0:00:31 \n",
- "3 0:09:39 0:00:31 \n",
- "4 0:09:32 0:00:31 "
- ],
- "text/html": [
- "\n",
- "
\n",
- "
\n",
- "
\n",
- "\n",
- "
\n",
- " \n",
- " \n",
- " | \n",
- " Training Loss | \n",
- " Training Accur. | \n",
- " Valid. Loss | \n",
- " Valid. Accur. | \n",
- " Training Time | \n",
- " Validation Time | \n",
- "
\n",
- " \n",
- " epoch | \n",
- " | \n",
- " | \n",
- " | \n",
- " | \n",
- " | \n",
- " | \n",
- "
\n",
- " \n",
- " \n",
- " \n",
- " 1 | \n",
- " 5.27e-03 | \n",
- " 0.59 | \n",
- " 0.0 | \n",
- " 0.47 | \n",
- " 0:09:34 | \n",
- " 0:00:31 | \n",
- "
\n",
- " \n",
- " 2 | \n",
- " 2.74e-08 | \n",
- " 0.59 | \n",
- " 0.0 | \n",
- " 0.46 | \n",
- " 0:09:32 | \n",
- " 0:00:31 | \n",
- "
\n",
- " \n",
- " 3 | \n",
- " 1.58e-08 | \n",
- " 0.59 | \n",
- " 0.0 | \n",
- " 0.46 | \n",
- " 0:09:39 | \n",
- " 0:00:31 | \n",
- "
\n",
- " \n",
- " 4 | \n",
- " 1.55e-08 | \n",
- " 0.58 | \n",
- " 0.0 | \n",
- " 0.46 | \n",
- " 0:09:32 | \n",
- " 0:00:31 | \n",
- "
\n",
- " \n",
- "
\n",
- "
\n",
- "
\n",
- " \n",
- " \n",
- "\n",
- " \n",
- "
\n",
- "
\n",
- " "
- ]
- },
- "metadata": {},
- "execution_count": 28
- }
- ]
- },
- {
- "cell_type": "code",
- "source": [
- "import matplotlib.pyplot as plt\n",
- "%matplotlib inline\n",
+ " generated_ids = model.generate(input_ids, do_sample=True, temperature=0.9, max_length=200)\n",
+ " generated_text = tokenizer.decode(generated_ids[0], skip_special_tokens=True, clean_up_tokenization_spaces=True)\n",
+ " \n",
+ " predictions.append(generated_text)\n",
+ " expected.append(row['label'])\n",
"\n",
- "import seaborn as sns\n",
- "\n",
- "sns.set(style='darkgrid')\n",
- "\n",
- "sns.set(font_scale=1.5)\n",
- "plt.rcParams[\"figure.figsize\"] = (12,6)\n",
- "\n",
- "plt.plot(df_stats['Training Loss'], 'b-o', label=\"Training\")\n",
- "plt.plot(df_stats['Valid. Loss'], 'g-o', label=\"Validation\")\n",
- "\n",
- "plt.title(\"Training & Validation Loss\")\n",
- "plt.xlabel(\"Epoch\")\n",
- "plt.ylabel(\"Loss\")\n",
- "plt.legend()\n",
- "plt.xticks([1, 2, 3, 4])\n",
- "\n",
- "plt.show()"
- ],
- "metadata": {
- "colab": {
- "base_uri": "https://localhost:8080/",
- "height": 427
- },
- "id": "Xk3gzkeU96v3",
- "outputId": "aa447af5-09f3-4bc2-e234-8a74bba87c05"
- },
- "execution_count": 29,
- "outputs": [
- {
- "output_type": "display_data",
- "data": {
- "text/plain": [
- "