Przetwarzanie_tekstu/projekt/FLAN-T5_experiments/Ver_4_FLAN-T5_sms_spam.ipynb

1 line
200 KiB
Plaintext
Raw Blame History

This file contains invisible Unicode characters

This file contains invisible Unicode characters that are indistinguishable to humans but may be processed differently by a computer. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

{"nbformat":4,"nbformat_minor":0,"metadata":{"colab":{"provenance":[]},"kernelspec":{"name":"python3","display_name":"Python 3"},"language_info":{"name":"python"},"gpuClass":"standard","widgets":{"application/vnd.jupyter.widget-state+json":{"68bd37fea6b9499daec358ce41d9d678":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_c2be6591c7ff4d4daf26ccd12f1844af","IPY_MODEL_adf02588e5184537a93169222740dd3d","IPY_MODEL_622e16eeafb74e939e0c69d492aa604e"],"layout":"IPY_MODEL_18d424bf759a4996984075b098834129"}},"c2be6591c7ff4d4daf26ccd12f1844af":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_48546da0c5504023b1209c01b25d4e4c","placeholder":"","style":"IPY_MODEL_c95964f713a8408593c599c189dc4ad7","value":"Downloading builder script: 
100%"}},"adf02588e5184537a93169222740dd3d":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_61c14a3d13524b4aa5ed7942390fb1da","max":3208,"min":0,"orientation":"horizontal","style":"IPY_MODEL_c1104de7b8db49789ec58adfc7bfe215","value":3208}},"622e16eeafb74e939e0c69d492aa604e":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_e3eb39ab40684052b3558938d2955d1b","placeholder":"","style":"IPY_MODEL_5ad9640c999948cf930de2c024c7c81c","value":" 3.21k/3.21k [00:00&lt;00:00, 
157kB/s]"}},"18d424bf759a4996984075b098834129":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"48546da0c5504023b1209c01b25d4e4c":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"o
verflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"c95964f713a8408593c599c189dc4ad7":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"61c14a3d13524b4aa5ed7942390fb1da":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"c1104de7b8db49789ec58adfc7bfe215":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"e3eb39ab40684052b3558938d2955d1b":{"model_mo
dule":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"5ad9640c999948cf930de2c024c7c81c":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"361b829c01d94f028fd511602401b630":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_b0500d4eb22e470382d692e1dc91d6b5","IPY_MODEL_58912ae770724c56a55212c37502572b","IPY_MODEL_d5ad570f7f4f4cb49b258001d4ac1b58"],"layout":"IPY_MODEL_d0ec3fa6ab724b368df4ab862c5b7b1b"}
},"b0500d4eb22e470382d692e1dc91d6b5":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_246e37be5003475a8e682e7797fa7db0","placeholder":"","style":"IPY_MODEL_ddce8b1ecabe492684b70a3fd8fad029","value":"Downloading metadata: 100%"}},"58912ae770724c56a55212c37502572b":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_a254ee7123ec411cb0076b6a15397281","max":1687,"min":0,"orientation":"horizontal","style":"IPY_MODEL_d239e3573e904b51b834cfa5d6e9e3af","value":1687}},"d5ad570f7f4f4cb49b258001d4ac1b58":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_e58081a3ec5141ae88bf49a08e3771b5","placeholder":"","style":"IPY_MODEL_ece5328c3eab49ea8148efca475f5eb8","value":" 1.69k/1.69k [00:00&lt;00:00, 
30.0kB/s]"}},"d0ec3fa6ab724b368df4ab862c5b7b1b":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"246e37be5003475a8e682e7797fa7db0":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"
overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"ddce8b1ecabe492684b70a3fd8fad029":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"a254ee7123ec411cb0076b6a15397281":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"d239e3573e904b51b834cfa5d6e9e3af":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"e58081a3ec5141ae88bf49a08e3771b5":{"model_m
odule":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"ece5328c3eab49ea8148efca475f5eb8":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"12e031e63c4b4753b19c2f262cf6550c":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_664490b6e48c4e09a37957ea2a32705c","IPY_MODEL_ed9152228e864e02b956dc345ced59ad","IPY_MODEL_130c35b0aef541409fdd1e7b6d33004a"],"layout":"IPY_MODEL_ef4757d97869447f8192346626730277"
}},"664490b6e48c4e09a37957ea2a32705c":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_932e3c5942ac450ab7245d370b410a39","placeholder":"","style":"IPY_MODEL_09ed8501e44441b0af5fa6d549abb776","value":"Downloading readme: 100%"}},"ed9152228e864e02b956dc345ced59ad":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_4e4f6641562a4741afdefebfb04c3ca3","max":4872,"min":0,"orientation":"horizontal","style":"IPY_MODEL_a48363c76a424855b178ef5ecc6be3c0","value":4872}},"130c35b0aef541409fdd1e7b6d33004a":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_904f59209b524551bd629944d870bd44","placeholder":"","style":"IPY_MODEL_721fa15e35844743880b72ab03243309","value":" 4.87k/4.87k [00:00&lt;00:00, 
234kB/s]"}},"ef4757d97869447f8192346626730277":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"932e3c5942ac450ab7245d370b410a39":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"o
verflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"09ed8501e44441b0af5fa6d549abb776":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"4e4f6641562a4741afdefebfb04c3ca3":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"a48363c76a424855b178ef5ecc6be3c0":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"904f59209b524551bd629944d870bd44":{"model_mo
dule":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"721fa15e35844743880b72ab03243309":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"6557e65a8adc45efab4ef47a50653bf0":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_0adbedaa248e4eabb6110fde0e32b75e","IPY_MODEL_42156b19be1848e7b6ea19874821fbb9","IPY_MODEL_9911649dc95b46c2a9c04be1e0fa7861"],"layout":"IPY_MODEL_0423daad31da47979f84c546d698480c"}
},"0adbedaa248e4eabb6110fde0e32b75e":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_7e452481918f485f9901108b8dc9db77","placeholder":"","style":"IPY_MODEL_9049707729a14ff1862939f7aec876ab","value":"Downloading data: 100%"}},"42156b19be1848e7b6ea19874821fbb9":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_ddc0eb506b544e85b999f11566162679","max":203415,"min":0,"orientation":"horizontal","style":"IPY_MODEL_a0cf1620ed6b4ea39d57690f7a2c273c","value":203415}},"9911649dc95b46c2a9c04be1e0fa7861":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_bf7d7c639ca942228ae14179798b5821","placeholder":"","style":"IPY_MODEL_840d8a832c8f4a25960ffed3705ce99b","value":" 203k/203k [00:00&lt;00:00, 
749kB/s]"}},"0423daad31da47979f84c546d698480c":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"7e452481918f485f9901108b8dc9db77":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"o
verflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"9049707729a14ff1862939f7aec876ab":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"ddc0eb506b544e85b999f11566162679":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"a0cf1620ed6b4ea39d57690f7a2c273c":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"bf7d7c639ca942228ae14179798b5821":{"model_mo
dule":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"840d8a832c8f4a25960ffed3705ce99b":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"4ac215662d6f40a28a7998911fb617f0":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_75d0debcd9104328b5ce905d0cf95d05","IPY_MODEL_d47951f821724274a88cd5f157e9224d","IPY_MODEL_82982684fd9341ac92223f30cbea8412"],"layout":"IPY_MODEL_c9df05e8f8f94302b1a61129a0b79ab6"}
},"75d0debcd9104328b5ce905d0cf95d05":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_df3bc60cf37d422bbe8e55a9093499e5","placeholder":"","style":"IPY_MODEL_c1e6db93577a478d9192fd4a9c03a439","value":"Generating train split: 100%"}},"d47951f821724274a88cd5f157e9224d":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"","description":"","description_tooltip":null,"layout":"IPY_MODEL_9e61eda06ddf43a8997f4ca69f58dbdb","max":5574,"min":0,"orientation":"horizontal","style":"IPY_MODEL_11e8310afe6e4d6288d1e7e285a880bb","value":5574}},"82982684fd9341ac92223f30cbea8412":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_e42e05102ce144758c58874f21c9e2f2","placeholder":"","style":"IPY_MODEL_c9b324922b424052b3d9cefadc921c27","value":" 5574/5574 [00:00&lt;00:00, 15020.97 
examples/s]"}},"c9df05e8f8f94302b1a61129a0b79ab6":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":"hidden","width":null}},"df3bc60cf37d422bbe8e55a9093499e5":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":
null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"c1e6db93577a478d9192fd4a9c03a439":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"9e61eda06ddf43a8997f4ca69f58dbdb":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"11e8310afe6e4d6288d1e7e285a880bb":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"e42e05102ce144758c58874f21c9e2f2":{"m
odel_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"c9b324922b424052b3d9cefadc921c27":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"6190bdcfdbad409698f1d0f525d4325f":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_81478adafe094101aa5444721a77013a","IPY_MODEL_423f9593f9894680bbf4dcc4dd2ef724","IPY_MODEL_25d37d0fbc3a4917b4421b3b67f9c4e5"],"layout":"IPY_MODEL_be15f6e1f9d74ac5be7457e4c6e
dccd0"}},"81478adafe094101aa5444721a77013a":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_19f31506f4d140beb5c7ac6076f83b47","placeholder":"","style":"IPY_MODEL_8858842842fe4aa3be0c11e80aa65d3a","value":"100%"}},"423f9593f9894680bbf4dcc4dd2ef724":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_78d9b1024b214602b0a8c6d15d35a89d","max":1,"min":0,"orientation":"horizontal","style":"IPY_MODEL_678aa3d231d44c0c9ffb6c38e9e095f6","value":1}},"25d37d0fbc3a4917b4421b3b67f9c4e5":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_e789a3898f8c41c2bdf8ea5748b18104","placeholder":"","style":"IPY_MODEL_eea178b6106448bca7ea2b9f2eae6527","value":" 1/1 [00:00&lt;00:00, 
31.02it/s]"}},"be15f6e1f9d74ac5be7457e4c6edccd0":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"19f31506f4d140beb5c7ac6076f83b47":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,
"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"8858842842fe4aa3be0c11e80aa65d3a":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"78d9b1024b214602b0a8c6d15d35a89d":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"678aa3d231d44c0c9ffb6c38e9e095f6":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"e789a3898f8c41c2bdf8ea5748b18104":{"model_
module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"eea178b6106448bca7ea2b9f2eae6527":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"6a27116f01b648ef942141677975405d":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_6640b97f0817419c98a633e83eb854f6","IPY_MODEL_17f50238e442461b873192ed1a7e5673","IPY_MODEL_0bc47b507ae64766958ec4062359d962"],"layout":"IPY_MODEL_c4b010d66ba4491083f26a1cd0fd0b09
"}},"6640b97f0817419c98a633e83eb854f6":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_9f6d9358f00445518e118e084bd8c192","placeholder":"","style":"IPY_MODEL_8b97c4b26c4145c58a8efc1cfd31042c","value":"Downloading (…)okenizer_config.json: 100%"}},"17f50238e442461b873192ed1a7e5673":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_565f2dc27a8c43a6b85b87efa558bdf5","max":2539,"min":0,"orientation":"horizontal","style":"IPY_MODEL_0e8794c1d221420d9a306e7d35a3d63e","value":2539}},"0bc47b507ae64766958ec4062359d962":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_8d04dd43e8024043b63e98b7caa3c97b","placeholder":"","style":"IPY_MODEL_099201033c6e461088795edc27470c09","value":" 2.54k/2.54k [00:00&lt;00:00, 
68.8kB/s]"}},"c4b010d66ba4491083f26a1cd0fd0b09":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"9f6d9358f00445518e118e084bd8c192":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"
overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"8b97c4b26c4145c58a8efc1cfd31042c":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"565f2dc27a8c43a6b85b87efa558bdf5":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"0e8794c1d221420d9a306e7d35a3d63e":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"8d04dd43e8024043b63e98b7caa3c97b":{"model_m
odule":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"099201033c6e461088795edc27470c09":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"d195065e792b496fa0674d96d80bc5e7":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_ef3744a453a74cbc907467a121cabdc7","IPY_MODEL_59c8487d5d1441c2ad888c96b62b2fc6","IPY_MODEL_c88f9cfc8c8846499bac0faace319921"],"layout":"IPY_MODEL_438c39c7c97e4172a8c4e4c29e0dde86"
}},"ef3744a453a74cbc907467a121cabdc7":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_e4244f9bd21a4f8caa038e1922cdac85","placeholder":"","style":"IPY_MODEL_53d371fdcd4c47cdbb60b68e14693c18","value":"Downloading (…)&quot;spiece.model&quot;;: 100%"}},"59c8487d5d1441c2ad888c96b62b2fc6":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_24225d17f2c24048aba70043851fc616","max":791656,"min":0,"orientation":"horizontal","style":"IPY_MODEL_7f13470e9f874a859edd3ad81dc2eef3","value":791656}},"c88f9cfc8c8846499bac0faace319921":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_65503a9084df4525a199b732b8b56478","placeholder":"","style":"IPY_MODEL_20a51f65184b41878c4938609b48ca6c","value":" 792k/792k [00:00&lt;00:00, 
6.51MB/s]"}},"438c39c7c97e4172a8c4e4c29e0dde86":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"e4244f9bd21a4f8caa038e1922cdac85":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"
overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"53d371fdcd4c47cdbb60b68e14693c18":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"24225d17f2c24048aba70043851fc616":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"7f13470e9f874a859edd3ad81dc2eef3":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"65503a9084df4525a199b732b8b56478":{"model_m
odule":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"20a51f65184b41878c4938609b48ca6c":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"2ea815fd8b3f4d0883166e93ad3c5289":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_1361a74b2aef49ea98deafe7027bd568","IPY_MODEL_d532b5fe357a401da221671ff12c8904","IPY_MODEL_a8e5ad44d09c4e2189719bef46e7a39f"],"layout":"IPY_MODEL_0e0e1632da714b19b8baef34c1210473"
}},"1361a74b2aef49ea98deafe7027bd568":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_aba6113b613d458abd74686aeae13657","placeholder":"","style":"IPY_MODEL_729afdc7fb37406ca334d8fb8a77e58a","value":"Downloading (…)/main/tokenizer.json: 100%"}},"d532b5fe357a401da221671ff12c8904":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_3b65129b567b44019e0b37c8401b8ed2","max":2424064,"min":0,"orientation":"horizontal","style":"IPY_MODEL_ed353f256ab6492891bf10d32f051e45","value":2424064}},"a8e5ad44d09c4e2189719bef46e7a39f":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_bbaf656fa94f413b959797d47353a049","placeholder":"","style":"IPY_MODEL_b659b1d8cc544a608200d5ef5076818e","value":" 2.42M/2.42M [00:00&lt;00:00, 
17.7MB/s]"}},"0e0e1632da714b19b8baef34c1210473":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"aba6113b613d458abd74686aeae13657":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"
overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"729afdc7fb37406ca334d8fb8a77e58a":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"3b65129b567b44019e0b37c8401b8ed2":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"ed353f256ab6492891bf10d32f051e45":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"bbaf656fa94f413b959797d47353a049":{"model_m
odule":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"b659b1d8cc544a608200d5ef5076818e":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"497cde8c9a81401f92afa18ba9a6ce40":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_45ad6503850542a8a2f7a3b0479e88ca","IPY_MODEL_d276f99074864c0cbcd8daa17e5f6d2f","IPY_MODEL_04cebfae2d984f07a97351116037e3cf"],"layout":"IPY_MODEL_c94595332c0c4f18afde731efbaba866"
}},"45ad6503850542a8a2f7a3b0479e88ca":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_587bdb3634a24c638696bcd9fe21368c","placeholder":"","style":"IPY_MODEL_dc450f9305da4afcbb4e6a1bf77c3590","value":"Downloading (…)cial_tokens_map.json: 100%"}},"d276f99074864c0cbcd8daa17e5f6d2f":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_884ace4175f94127b1674352d17e67f2","max":2201,"min":0,"orientation":"horizontal","style":"IPY_MODEL_3901be176ed144b986f20a7a7a72f8e2","value":2201}},"04cebfae2d984f07a97351116037e3cf":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_7259afa2646a414ebb90f486242e3661","placeholder":"","style":"IPY_MODEL_a09e4534caef4b43862c275a59617c6b","value":" 2.20k/2.20k [00:00&lt;00:00, 
115kB/s]"}},"c94595332c0c4f18afde731efbaba866":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"587bdb3634a24c638696bcd9fe21368c":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"o
verflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"dc450f9305da4afcbb4e6a1bf77c3590":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"884ace4175f94127b1674352d17e67f2":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"3901be176ed144b986f20a7a7a72f8e2":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"7259afa2646a414ebb90f486242e3661":{"model_mo
dule":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"a09e4534caef4b43862c275a59617c6b":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"8e0c9ce977054a879a1929e1c030a6a3":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_bde5c3406f0e46d8ab30a8b9f1355d5c","IPY_MODEL_91505f004c3742e68e9a70155fedcf2e","IPY_MODEL_0a7e5af5e2b64c488432b9563401c299"],"layout":"IPY_MODEL_4c8fd9d5d7364812900f4e35490948fd"}
},"bde5c3406f0e46d8ab30a8b9f1355d5c":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_64d4b67445c34a6182c2b1ec07339b22","placeholder":"","style":"IPY_MODEL_c4f9e0afdb334188abaee11b383a0142","value":"Downloading (…)lve/main/config.json: 100%"}},"91505f004c3742e68e9a70155fedcf2e":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_8ce37c30b02646148b9694a14e21fbce","max":662,"min":0,"orientation":"horizontal","style":"IPY_MODEL_6a3fff3870b34941b4713c984c3c681c","value":662}},"0a7e5af5e2b64c488432b9563401c299":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_5ba546d284b04dee96c132985a8bd38c","placeholder":"","style":"IPY_MODEL_534b173a13c544e48af4051d748b89b8","value":" 662/662 [00:00&lt;00:00, 
20.6kB/s]"}},"4c8fd9d5d7364812900f4e35490948fd":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"64d4b67445c34a6182c2b1ec07339b22":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"
overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"c4f9e0afdb334188abaee11b383a0142":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"8ce37c30b02646148b9694a14e21fbce":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"6a3fff3870b34941b4713c984c3c681c":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"5ba546d284b04dee96c132985a8bd38c":{"model_m
odule":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"534b173a13c544e48af4051d748b89b8":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"2c7e377fed4241fbab8730fd850f5905":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_1c7b9fccd53043c0a9d84ae3c6caabd4","IPY_MODEL_e0423e68cdf64c8cb0e2643c20c8f3cd","IPY_MODEL_440dbb34f66a4ea8b4138da6dcb7d269"],"layout":"IPY_MODEL_d55e16b317a348fdb8f677cc5cab99cb"
}},"1c7b9fccd53043c0a9d84ae3c6caabd4":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_f17117c9c86141e89c394b598f1c391a","placeholder":"","style":"IPY_MODEL_7635e183b25f42499d438febea66e8ea","value":"Downloading (…)&quot;pytorch_model.bin&quot;;: 100%"}},"e0423e68cdf64c8cb0e2643c20c8f3cd":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_bcc42f2b6d3847b5b9127503f09c805d","max":3132781861,"min":0,"orientation":"horizontal","style":"IPY_MODEL_95b7176944d74bed8d65239f0dd572cc","value":3132781861}},"440dbb34f66a4ea8b4138da6dcb7d269":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_a680a0a6142f4b86bd4b926320ded47c","placeholder":"","style":"IPY_MODEL_3a80de03299742baa8a05a6f6dc11e65","value":" 3.13G/3.13G [00:28&lt;00:00, 
104MB/s]"}},"d55e16b317a348fdb8f677cc5cab99cb":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"f17117c9c86141e89c394b598f1c391a":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"o
verflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"7635e183b25f42499d438febea66e8ea":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"bcc42f2b6d3847b5b9127503f09c805d":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"95b7176944d74bed8d65239f0dd572cc":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"a680a0a6142f4b86bd4b926320ded47c":{"model_mo
dule":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"3a80de03299742baa8a05a6f6dc11e65":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"c707fedbf7564e6195c9339dd850a29a":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_9de390b272414e62a761112ab5f6f2c5","IPY_MODEL_97c6386f6734441cbf30b8cd92e618fe","IPY_MODEL_70dfc5bbac0145e097ff98485435ae37"],"layout":"IPY_MODEL_d18f22d2d3274b57a622ffc8aed5b745"}
},"9de390b272414e62a761112ab5f6f2c5":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_452dc83d4775438dbd6f5d70b0a9c281","placeholder":"","style":"IPY_MODEL_24ce51b9d54f4203bd402280ad319bbd","value":"Downloading (…)neration_config.json: 100%"}},"97c6386f6734441cbf30b8cd92e618fe":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_582ac43518ca4ea7ae2a34e0cd705471","max":147,"min":0,"orientation":"horizontal","style":"IPY_MODEL_48eed9b0ef6a45b9a32e22b468a14d60","value":147}},"70dfc5bbac0145e097ff98485435ae37":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_f8372f868b054d3798eaf1e1f4c40838","placeholder":"","style":"IPY_MODEL_105d6b2a260848849b6fed4593d4a8d8","value":" 147/147 [00:00&lt;00:00, 
4.65kB/s]"}},"d18f22d2d3274b57a622ffc8aed5b745":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"452dc83d4775438dbd6f5d70b0a9c281":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"
overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"24ce51b9d54f4203bd402280ad319bbd":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"582ac43518ca4ea7ae2a34e0cd705471":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"48eed9b0ef6a45b9a32e22b468a14d60":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"f8372f868b054d3798eaf1e1f4c40838":{"model_m
odule":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"105d6b2a260848849b6fed4593d4a8d8":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}}}},"accelerator":"GPU"},"cells":[{"cell_type":"markdown","source":["# Instalacja pakietów"],"metadata":{"id":"ZXsOR6oJOJbd"}},{"cell_type":"code","execution_count":1,"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"8l0hzptKNiZS","executionInfo":{"status":"ok","timestamp":1676654821493,"user_tz":-60,"elapsed":23173,"user":{"displayName":"Mike2 Studia2","userId":"10506861792614965645"}},"outputId":"37414816-ea90-4a00-fe06-20fab2ab1b8f"},"outputs":[{"output_type":"stream","name":"stdout","text":["Looking in indexes: https://pypi.org/simple, 
https://us-python.pkg.dev/colab-wheels/public/simple/\n","Collecting transformers\n"," Downloading transformers-4.26.1-py3-none-any.whl (6.3 MB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m6.3/6.3 MB\u001b[0m \u001b[31m34.7 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hCollecting datasets\n"," Downloading datasets-2.9.0-py3-none-any.whl (462 kB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m462.8/462.8 KB\u001b[0m \u001b[31m27.9 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hRequirement already satisfied: torch in /usr/local/lib/python3.8/dist-packages (1.13.1+cu116)\n","Collecting sentencepiece\n"," Downloading sentencepiece-0.1.97-cp38-cp38-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (1.3 MB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m1.3/1.3 MB\u001b[0m \u001b[31m52.7 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hRequirement already satisfied: tqdm>=4.27 in /usr/local/lib/python3.8/dist-packages (from transformers) (4.64.1)\n","Requirement already satisfied: filelock in /usr/local/lib/python3.8/dist-packages (from transformers) (3.9.0)\n","Requirement already satisfied: regex!=2019.12.17 in /usr/local/lib/python3.8/dist-packages (from transformers) (2022.6.2)\n","Requirement already satisfied: pyyaml>=5.1 in /usr/local/lib/python3.8/dist-packages (from transformers) (6.0)\n","Collecting huggingface-hub<1.0,>=0.11.0\n"," Downloading huggingface_hub-0.12.1-py3-none-any.whl (190 kB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m190.3/190.3 KB\u001b[0m \u001b[31m15.1 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hRequirement already satisfied: numpy>=1.17 in /usr/local/lib/python3.8/dist-packages (from transformers) (1.21.6)\n","Requirement already satisfied: requests in /usr/local/lib/python3.8/dist-packages (from transformers) (2.25.1)\n","Requirement 
already satisfied: packaging>=20.0 in /usr/local/lib/python3.8/dist-packages (from transformers) (23.0)\n","Collecting tokenizers!=0.11.3,<0.14,>=0.11.1\n"," Downloading tokenizers-0.13.2-cp38-cp38-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (7.6 MB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m7.6/7.6 MB\u001b[0m \u001b[31m55.7 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hCollecting responses<0.19\n"," Downloading responses-0.18.0-py3-none-any.whl (38 kB)\n","Requirement already satisfied: dill<0.3.7 in /usr/local/lib/python3.8/dist-packages (from datasets) (0.3.6)\n","Requirement already satisfied: pandas in /usr/local/lib/python3.8/dist-packages (from datasets) (1.3.5)\n","Requirement already satisfied: fsspec[http]>=2021.11.1 in /usr/local/lib/python3.8/dist-packages (from datasets) (2023.1.0)\n","Collecting multiprocess\n"," Downloading multiprocess-0.70.14-py38-none-any.whl (132 kB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m132.0/132.0 KB\u001b[0m \u001b[31m8.6 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hRequirement already satisfied: pyarrow>=6.0.0 in /usr/local/lib/python3.8/dist-packages (from datasets) (9.0.0)\n","Requirement already satisfied: aiohttp in /usr/local/lib/python3.8/dist-packages (from datasets) (3.8.3)\n","Collecting xxhash\n"," Downloading xxhash-3.2.0-cp38-cp38-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (213 kB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m213.0/213.0 KB\u001b[0m \u001b[31m9.6 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hRequirement already satisfied: typing-extensions in /usr/local/lib/python3.8/dist-packages (from torch) (4.4.0)\n","Requirement already satisfied: charset-normalizer<3.0,>=2.0 in /usr/local/lib/python3.8/dist-packages (from aiohttp->datasets) (2.1.1)\n","Requirement already satisfied: attrs>=17.3.0 in 
/usr/local/lib/python3.8/dist-packages (from aiohttp->datasets) (22.2.0)\n","Requirement already satisfied: frozenlist>=1.1.1 in /usr/local/lib/python3.8/dist-packages (from aiohttp->datasets) (1.3.3)\n","Requirement already satisfied: aiosignal>=1.1.2 in /usr/local/lib/python3.8/dist-packages (from aiohttp->datasets) (1.3.1)\n","Requirement already satisfied: yarl<2.0,>=1.0 in /usr/local/lib/python3.8/dist-packages (from aiohttp->datasets) (1.8.2)\n","Requirement already satisfied: async-timeout<5.0,>=4.0.0a3 in /usr/local/lib/python3.8/dist-packages (from aiohttp->datasets) (4.0.2)\n","Requirement already satisfied: multidict<7.0,>=4.5 in /usr/local/lib/python3.8/dist-packages (from aiohttp->datasets) (6.0.4)\n","Requirement already satisfied: chardet<5,>=3.0.2 in /usr/local/lib/python3.8/dist-packages (from requests->transformers) (4.0.0)\n","Requirement already satisfied: urllib3<1.27,>=1.21.1 in /usr/local/lib/python3.8/dist-packages (from requests->transformers) (1.24.3)\n","Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.8/dist-packages (from requests->transformers) (2022.12.7)\n","Requirement already satisfied: idna<3,>=2.5 in /usr/local/lib/python3.8/dist-packages (from requests->transformers) (2.10)\n","Collecting urllib3<1.27,>=1.21.1\n"," Downloading urllib3-1.26.14-py2.py3-none-any.whl (140 kB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m140.6/140.6 KB\u001b[0m \u001b[31m10.4 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hRequirement already satisfied: python-dateutil>=2.7.3 in /usr/local/lib/python3.8/dist-packages (from pandas->datasets) (2.8.2)\n","Requirement already satisfied: pytz>=2017.3 in /usr/local/lib/python3.8/dist-packages (from pandas->datasets) (2022.7.1)\n","Requirement already satisfied: six>=1.5 in /usr/local/lib/python3.8/dist-packages (from python-dateutil>=2.7.3->pandas->datasets) (1.15.0)\n","Installing collected packages: tokenizers, sentencepiece, 
xxhash, urllib3, multiprocess, responses, huggingface-hub, transformers, datasets\n"," Attempting uninstall: urllib3\n"," Found existing installation: urllib3 1.24.3\n"," Uninstalling urllib3-1.24.3:\n"," Successfully uninstalled urllib3-1.24.3\n","Successfully installed datasets-2.9.0 huggingface-hub-0.12.1 multiprocess-0.70.14 responses-0.18.0 sentencepiece-0.1.97 tokenizers-0.13.2 transformers-4.26.1 urllib3-1.26.14 xxhash-3.2.0\n"]}],"source":["!pip install transformers datasets torch sentencepiece"]},{"cell_type":"markdown","source":["# Załadowanie datasetu"],"metadata":{"id":"dhN0rmb5Oi3d"}},{"cell_type":"code","source":["from datasets import load_dataset"],"metadata":{"id":"tnaDkwZ2Pbnn","executionInfo":{"status":"ok","timestamp":1676654822469,"user_tz":-60,"elapsed":980,"user":{"displayName":"Mike2 Studia2","userId":"10506861792614965645"}}},"execution_count":2,"outputs":[]},{"cell_type":"code","source":["dataset = load_dataset(\"sms_spam\")"],"metadata":{"colab":{"base_uri":"https://localhost:8080/","height":264,"referenced_widgets":["68bd37fea6b9499daec358ce41d9d678","c2be6591c7ff4d4daf26ccd12f1844af","adf02588e5184537a93169222740dd3d","622e16eeafb74e939e0c69d492aa604e","18d424bf759a4996984075b098834129","48546da0c5504023b1209c01b25d4e4c","c95964f713a8408593c599c189dc4ad7","61c14a3d13524b4aa5ed7942390fb1da","c1104de7b8db49789ec58adfc7bfe215","e3eb39ab40684052b3558938d2955d1b","5ad9640c999948cf930de2c024c7c81c","361b829c01d94f028fd511602401b630","b0500d4eb22e470382d692e1dc91d6b5","58912ae770724c56a55212c37502572b","d5ad570f7f4f4cb49b258001d4ac1b58","d0ec3fa6ab724b368df4ab862c5b7b1b","246e37be5003475a8e682e7797fa7db0","ddce8b1ecabe492684b70a3fd8fad029","a254ee7123ec411cb0076b6a15397281","d239e3573e904b51b834cfa5d6e9e3af","e58081a3ec5141ae88bf49a08e3771b5","ece5328c3eab49ea8148efca475f5eb8","12e031e63c4b4753b19c2f262cf6550c","664490b6e48c4e09a37957ea2a32705c","ed9152228e864e02b956dc345ced59ad","130c35b0aef541409fdd1e7b6d33004a","ef4757d97869447f81923466267302
77","932e3c5942ac450ab7245d370b410a39","09ed8501e44441b0af5fa6d549abb776","4e4f6641562a4741afdefebfb04c3ca3","a48363c76a424855b178ef5ecc6be3c0","904f59209b524551bd629944d870bd44","721fa15e35844743880b72ab03243309","6557e65a8adc45efab4ef47a50653bf0","0adbedaa248e4eabb6110fde0e32b75e","42156b19be1848e7b6ea19874821fbb9","9911649dc95b46c2a9c04be1e0fa7861","0423daad31da47979f84c546d698480c","7e452481918f485f9901108b8dc9db77","9049707729a14ff1862939f7aec876ab","ddc0eb506b544e85b999f11566162679","a0cf1620ed6b4ea39d57690f7a2c273c","bf7d7c639ca942228ae14179798b5821","840d8a832c8f4a25960ffed3705ce99b","4ac215662d6f40a28a7998911fb617f0","75d0debcd9104328b5ce905d0cf95d05","d47951f821724274a88cd5f157e9224d","82982684fd9341ac92223f30cbea8412","c9df05e8f8f94302b1a61129a0b79ab6","df3bc60cf37d422bbe8e55a9093499e5","c1e6db93577a478d9192fd4a9c03a439","9e61eda06ddf43a8997f4ca69f58dbdb","11e8310afe6e4d6288d1e7e285a880bb","e42e05102ce144758c58874f21c9e2f2","c9b324922b424052b3d9cefadc921c27","6190bdcfdbad409698f1d0f525d4325f","81478adafe094101aa5444721a77013a","423f9593f9894680bbf4dcc4dd2ef724","25d37d0fbc3a4917b4421b3b67f9c4e5","be15f6e1f9d74ac5be7457e4c6edccd0","19f31506f4d140beb5c7ac6076f83b47","8858842842fe4aa3be0c11e80aa65d3a","78d9b1024b214602b0a8c6d15d35a89d","678aa3d231d44c0c9ffb6c38e9e095f6","e789a3898f8c41c2bdf8ea5748b18104","eea178b6106448bca7ea2b9f2eae6527"]},"id":"cCiAuRqrOkvV","executionInfo":{"status":"ok","timestamp":1676654825207,"user_tz":-60,"elapsed":2740,"user":{"displayName":"Mike2 Studia2","userId":"10506861792614965645"}},"outputId":"d33d75f6-a30c-4fb1-c510-e9cba7cfe403"},"execution_count":3,"outputs":[{"output_type":"display_data","data":{"text/plain":["Downloading builder script: 0%| | 0.00/3.21k [00:00<?, ?B/s]"],"application/vnd.jupyter.widget-view+json":{"version_major":2,"version_minor":0,"model_id":"68bd37fea6b9499daec358ce41d9d678"}},"metadata":{}},{"output_type":"display_data","data":{"text/plain":["Downloading metadata: 0%| | 0.00/1.69k [00:00<?, 
?B/s]"],"application/vnd.jupyter.widget-view+json":{"version_major":2,"version_minor":0,"model_id":"361b829c01d94f028fd511602401b630"}},"metadata":{}},{"output_type":"display_data","data":{"text/plain":["Downloading readme: 0%| | 0.00/4.87k [00:00<?, ?B/s]"],"application/vnd.jupyter.widget-view+json":{"version_major":2,"version_minor":0,"model_id":"12e031e63c4b4753b19c2f262cf6550c"}},"metadata":{}},{"output_type":"stream","name":"stdout","text":["Downloading and preparing dataset sms_spam/plain_text to /root/.cache/huggingface/datasets/sms_spam/plain_text/1.0.0/53f051d3b5f62d99d61792c91acefe4f1577ad3e4c216fb0ad39e30b9f20019c...\n"]},{"output_type":"display_data","data":{"text/plain":["Downloading data: 0%| | 0.00/203k [00:00<?, ?B/s]"],"application/vnd.jupyter.widget-view+json":{"version_major":2,"version_minor":0,"model_id":"6557e65a8adc45efab4ef47a50653bf0"}},"metadata":{}},{"output_type":"display_data","data":{"text/plain":["Generating train split: 0%| | 0/5574 [00:00<?, ? examples/s]"],"application/vnd.jupyter.widget-view+json":{"version_major":2,"version_minor":0,"model_id":"4ac215662d6f40a28a7998911fb617f0"}},"metadata":{}},{"output_type":"stream","name":"stdout","text":["Dataset sms_spam downloaded and prepared to /root/.cache/huggingface/datasets/sms_spam/plain_text/1.0.0/53f051d3b5f62d99d61792c91acefe4f1577ad3e4c216fb0ad39e30b9f20019c. 
Subsequent calls will reuse this data.\n"]},{"output_type":"display_data","data":{"text/plain":[" 0%| | 0/1 [00:00<?, ?it/s]"],"application/vnd.jupyter.widget-view+json":{"version_major":2,"version_minor":0,"model_id":"6190bdcfdbad409698f1d0f525d4325f"}},"metadata":{}}]},{"cell_type":"code","source":["dataset['train'][0]"],"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"JKFHPko3OnAV","executionInfo":{"status":"ok","timestamp":1676654825208,"user_tz":-60,"elapsed":10,"user":{"displayName":"Mike2 Studia2","userId":"10506861792614965645"}},"outputId":"c26256d4-313b-4993-d98a-27bcde4f71a5"},"execution_count":4,"outputs":[{"output_type":"execute_result","data":{"text/plain":["{'sms': 'Go until jurong point, crazy.. Available only in bugis n great world la e buffet... Cine there got amore wat...\\n',\n"," 'label': 0}"]},"metadata":{},"execution_count":4}]},{"cell_type":"markdown","source":["# Przygotowanie datasetu"],"metadata":{"id":"l140vJrgYxPr"}},{"cell_type":"code","source":["parsed_dataset = []\n","\n","for row in dataset['train']:\n"," text = row['sms'].replace(\"\\n\", \"\")\n"," new_row = {}\n"," new_row['sms'] = text\n"," if row['label'] == 0:\n"," new_row['label'] = \"False\"\n"," else:\n"," new_row['label'] = \"True\"\n"," parsed_dataset.append(new_row)\n","\n","parsed_dataset[0]"],"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"1boUF-YiY3_y","executionInfo":{"status":"ok","timestamp":1676654825208,"user_tz":-60,"elapsed":8,"user":{"displayName":"Mike2 Studia2","userId":"10506861792614965645"}},"outputId":"fca5e196-7cb5-4c25-8fbb-e8becc020a88"},"execution_count":5,"outputs":[{"output_type":"execute_result","data":{"text/plain":["{'sms': 'Go until jurong point, crazy.. Available only in bugis n great world la e buffet... 
Cine there got amore wat...',\n"," 'label': 'False'}"]},"metadata":{},"execution_count":5}]},{"cell_type":"markdown","source":["# Tokenizer FLAN-T5"],"metadata":{"id":"O-J-jBDxPJcn"}},{"cell_type":"code","source":["from transformers import AutoTokenizer"],"metadata":{"id":"P23AYPX1PZ6g","executionInfo":{"status":"ok","timestamp":1676654827189,"user_tz":-60,"elapsed":1987,"user":{"displayName":"Mike2 Studia2","userId":"10506861792614965645"}}},"execution_count":6,"outputs":[]},{"cell_type":"code","source":["tokenizer = AutoTokenizer.from_pretrained('google/flan-t5-large')"],"metadata":{"colab":{"base_uri":"https://localhost:8080/","height":145,"referenced_widgets":["6a27116f01b648ef942141677975405d","6640b97f0817419c98a633e83eb854f6","17f50238e442461b873192ed1a7e5673","0bc47b507ae64766958ec4062359d962","c4b010d66ba4491083f26a1cd0fd0b09","9f6d9358f00445518e118e084bd8c192","8b97c4b26c4145c58a8efc1cfd31042c","565f2dc27a8c43a6b85b87efa558bdf5","0e8794c1d221420d9a306e7d35a3d63e","8d04dd43e8024043b63e98b7caa3c97b","099201033c6e461088795edc27470c09","d195065e792b496fa0674d96d80bc5e7","ef3744a453a74cbc907467a121cabdc7","59c8487d5d1441c2ad888c96b62b2fc6","c88f9cfc8c8846499bac0faace319921","438c39c7c97e4172a8c4e4c29e0dde86","e4244f9bd21a4f8caa038e1922cdac85","53d371fdcd4c47cdbb60b68e14693c18","24225d17f2c24048aba70043851fc616","7f13470e9f874a859edd3ad81dc2eef3","65503a9084df4525a199b732b8b56478","20a51f65184b41878c4938609b48ca6c","2ea815fd8b3f4d0883166e93ad3c5289","1361a74b2aef49ea98deafe7027bd568","d532b5fe357a401da221671ff12c8904","a8e5ad44d09c4e2189719bef46e7a39f","0e0e1632da714b19b8baef34c1210473","aba6113b613d458abd74686aeae13657","729afdc7fb37406ca334d8fb8a77e58a","3b65129b567b44019e0b37c8401b8ed2","ed353f256ab6492891bf10d32f051e45","bbaf656fa94f413b959797d47353a049","b659b1d8cc544a608200d5ef5076818e","497cde8c9a81401f92afa18ba9a6ce40","45ad6503850542a8a2f7a3b0479e88ca","d276f99074864c0cbcd8daa17e5f6d2f","04cebfae2d984f07a97351116037e3cf","c94595332c0c4f18afde731efbaba86
6","587bdb3634a24c638696bcd9fe21368c","dc450f9305da4afcbb4e6a1bf77c3590","884ace4175f94127b1674352d17e67f2","3901be176ed144b986f20a7a7a72f8e2","7259afa2646a414ebb90f486242e3661","a09e4534caef4b43862c275a59617c6b"]},"id":"q5Jz0E_oPMBr","executionInfo":{"status":"ok","timestamp":1676654828626,"user_tz":-60,"elapsed":1440,"user":{"displayName":"Mike2 Studia2","userId":"10506861792614965645"}},"outputId":"5f1635b6-2904-4994-9161-4a3ecafc6896"},"execution_count":7,"outputs":[{"output_type":"display_data","data":{"text/plain":["Downloading (…)okenizer_config.json: 0%| | 0.00/2.54k [00:00<?, ?B/s]"],"application/vnd.jupyter.widget-view+json":{"version_major":2,"version_minor":0,"model_id":"6a27116f01b648ef942141677975405d"}},"metadata":{}},{"output_type":"display_data","data":{"text/plain":["Downloading (…)\"spiece.model\";: 0%| | 0.00/792k [00:00<?, ?B/s]"],"application/vnd.jupyter.widget-view+json":{"version_major":2,"version_minor":0,"model_id":"d195065e792b496fa0674d96d80bc5e7"}},"metadata":{}},{"output_type":"display_data","data":{"text/plain":["Downloading (…)/main/tokenizer.json: 0%| | 0.00/2.42M [00:00<?, ?B/s]"],"application/vnd.jupyter.widget-view+json":{"version_major":2,"version_minor":0,"model_id":"2ea815fd8b3f4d0883166e93ad3c5289"}},"metadata":{}},{"output_type":"display_data","data":{"text/plain":["Downloading (…)cial_tokens_map.json: 0%| | 0.00/2.20k [00:00<?, ?B/s]"],"application/vnd.jupyter.widget-view+json":{"version_major":2,"version_minor":0,"model_id":"497cde8c9a81401f92afa18ba9a6ce40"}},"metadata":{}}]},{"cell_type":"code","source":["sms = parsed_dataset[0]['sms']\n","print('Original: ', sms)\n","print('Tokenized: ', tokenizer.tokenize(sms))\n","print('Token IDs: ', tokenizer.convert_tokens_to_ids(tokenizer.tokenize(sms)))"],"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"dfxJQpoePsvI","executionInfo":{"status":"ok","timestamp":1676654828626,"user_tz":-60,"elapsed":10,"user":{"displayName":"Mike2 
Studia2","userId":"10506861792614965645"}},"outputId":"fccd3b61-53c9-49ed-f480-f5894e926059"},"execution_count":8,"outputs":[{"output_type":"stream","name":"stdout","text":["Original: Go until jurong point, crazy.. Available only in bugis n great world la e buffet... Cine there got amore wat...\n","Tokenized: ['▁Go', '▁until', '▁jur', 'ong', '▁point', ',', '▁crazy', '.', '.', '▁Available', '▁only', '▁in', '▁bug', 'is', '▁', 'n', '▁great', '▁world', '▁la', '▁', 'e', '▁buffet', '...', '▁Cine', '▁there', '▁got', '▁', 'a', 'more', '▁wa', 't', '...']\n","Token IDs: [1263, 552, 10081, 2444, 500, 6, 6139, 5, 5, 8144, 163, 16, 8143, 159, 3, 29, 248, 296, 50, 3, 15, 15385, 233, 17270, 132, 530, 3, 9, 3706, 8036, 17, 233]\n"]}]},{"cell_type":"markdown","source":["# Few shot learning"],"metadata":{"id":"UpluhM8cU5Ir"}},{"cell_type":"code","source":["print(parsed_dataset[0]) #0\n","print(parsed_dataset[123]) #1\n","print(parsed_dataset[2000]) #0\n","print(parsed_dataset[3002]) #1"],"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"7uNUkixPU85O","executionInfo":{"status":"ok","timestamp":1676654828627,"user_tz":-60,"elapsed":9,"user":{"displayName":"Mike2 Studia2","userId":"10506861792614965645"}},"outputId":"56579b1f-a2f7-4de5-83c7-d181b2cee335"},"execution_count":9,"outputs":[{"output_type":"stream","name":"stdout","text":["{'sms': 'Go until jurong point, crazy.. Available only in bugis n great world la e buffet... Cine there got amore wat...', 'label': 'False'}\n","{'sms': 'Todays Voda numbers ending 7548 are selected to receive a $350 award. If you have a match please call 08712300220 quoting claim code 4041 standard rates app', 'label': 'True'}\n","{'sms': \"LMAO where's your fish memory when I need it?\", 'label': 'False'}\n","{'sms': 'This message is free. Welcome to the new & improved Sex & Dogging club! To unsubscribe from this service reply STOP. 
msgs@150p 18+only', 'label': 'True'}\n"]}]},{"cell_type":"code","source":["non_spam_1 = \"The text message contains the following content: \" + parsed_dataset[0]['sms'] + \"\\nIs it true that the content of a text message is spam: False\\n\\n\"\n","spam_1 = \"The text message contains the following content: \" + parsed_dataset[123]['sms'] + \"\\nIs it true that the content of a text message is spam: True\\n\\n\"\n","non_spam_2 = \"The text message contains the following content: \" + parsed_dataset[2000]['sms'] + \"\\nIs it true that the content of a text message is spam: False\\n\\n\"\n","spam_2 = \"The text message contains the following content: \" + parsed_dataset[3002]['sms'] + \"\\nIs it true that the content of a text message is spam: True\\n\\n\"\n","\n","few_shot_prefix = non_spam_1 + spam_1 + non_spam_2 + spam_2 + \"The text message contains the following content: \"\n","print(few_shot_prefix)"],"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"lj0issBznZfK","executionInfo":{"status":"ok","timestamp":1676654828627,"user_tz":-60,"elapsed":7,"user":{"displayName":"Mike2 Studia2","userId":"10506861792614965645"}},"outputId":"4e55029a-d838-45fa-c08c-98b957ceb642"},"execution_count":10,"outputs":[{"output_type":"stream","name":"stdout","text":["The text message contains the following content: Go until jurong point, crazy.. Available only in bugis n great world la e buffet... Cine there got amore wat...\n","Is it true that the content of a text message is spam: False\n","\n","The text message contains the following content: Todays Voda numbers ending 7548 are selected to receive a $350 award. 
If you have a match please call 08712300220 quoting claim code 4041 standard rates app\n","Is it true that the content of a text message is spam: True\n","\n","The text message contains the following content: LMAO where's your fish memory when I need it?\n","Is it true that the content of a text message is spam: False\n","\n","The text message contains the following content: This message is free. Welcome to the new & improved Sex & Dogging club! To unsubscribe from this service reply STOP. msgs@150p 18+only\n","Is it true that the content of a text message is spam: True\n","\n","The text message contains the following content: \n"]}]},{"cell_type":"markdown","source":["# Load FLAN-T5 model"],"metadata":{"id":"okTx_ynMV0rH"}},{"cell_type":"code","source":["from transformers import AutoModelForSeq2SeqLM"],"metadata":{"id":"Eu-7Eed8WgN0","executionInfo":{"status":"ok","timestamp":1676654828628,"user_tz":-60,"elapsed":6,"user":{"displayName":"Mike2 Studia2","userId":"10506861792614965645"}}},"execution_count":11,"outputs":[]},{"cell_type":"code","source":["model = 
AutoModelForSeq2SeqLM.from_pretrained('google/flan-t5-large')\n","\n","model.cuda()"],"metadata":{"colab":{"base_uri":"https://localhost:8080/","height":1000,"referenced_widgets":["8e0c9ce977054a879a1929e1c030a6a3","bde5c3406f0e46d8ab30a8b9f1355d5c","91505f004c3742e68e9a70155fedcf2e","0a7e5af5e2b64c488432b9563401c299","4c8fd9d5d7364812900f4e35490948fd","64d4b67445c34a6182c2b1ec07339b22","c4f9e0afdb334188abaee11b383a0142","8ce37c30b02646148b9694a14e21fbce","6a3fff3870b34941b4713c984c3c681c","5ba546d284b04dee96c132985a8bd38c","534b173a13c544e48af4051d748b89b8","2c7e377fed4241fbab8730fd850f5905","1c7b9fccd53043c0a9d84ae3c6caabd4","e0423e68cdf64c8cb0e2643c20c8f3cd","440dbb34f66a4ea8b4138da6dcb7d269","d55e16b317a348fdb8f677cc5cab99cb","f17117c9c86141e89c394b598f1c391a","7635e183b25f42499d438febea66e8ea","bcc42f2b6d3847b5b9127503f09c805d","95b7176944d74bed8d65239f0dd572cc","a680a0a6142f4b86bd4b926320ded47c","3a80de03299742baa8a05a6f6dc11e65","c707fedbf7564e6195c9339dd850a29a","9de390b272414e62a761112ab5f6f2c5","97c6386f6734441cbf30b8cd92e618fe","70dfc5bbac0145e097ff98485435ae37","d18f22d2d3274b57a622ffc8aed5b745","452dc83d4775438dbd6f5d70b0a9c281","24ce51b9d54f4203bd402280ad319bbd","582ac43518ca4ea7ae2a34e0cd705471","48eed9b0ef6a45b9a32e22b468a14d60","f8372f868b054d3798eaf1e1f4c40838","105d6b2a260848849b6fed4593d4a8d8"]},"id":"JKv9O8kfV2zZ","executionInfo":{"status":"ok","timestamp":1676654878825,"user_tz":-60,"elapsed":50202,"user":{"displayName":"Mike2 Studia2","userId":"10506861792614965645"}},"outputId":"802742eb-cd94-4500-f299-13dc8cd41887"},"execution_count":12,"outputs":[{"output_type":"display_data","data":{"text/plain":["Downloading (…)lve/main/config.json: 0%| | 0.00/662 [00:00<?, ?B/s]"],"application/vnd.jupyter.widget-view+json":{"version_major":2,"version_minor":0,"model_id":"8e0c9ce977054a879a1929e1c030a6a3"}},"metadata":{}},{"output_type":"display_data","data":{"text/plain":["Downloading (…)\"pytorch_model.bin\";: 0%| | 0.00/3.13G [00:00<?, 
?B/s]"],"application/vnd.jupyter.widget-view+json":{"version_major":2,"version_minor":0,"model_id":"2c7e377fed4241fbab8730fd850f5905"}},"metadata":{}},{"output_type":"display_data","data":{"text/plain":["Downloading (…)neration_config.json: 0%| | 0.00/147 [00:00<?, ?B/s]"],"application/vnd.jupyter.widget-view+json":{"version_major":2,"version_minor":0,"model_id":"c707fedbf7564e6195c9339dd850a29a"}},"metadata":{}},{"output_type":"execute_result","data":{"text/plain":["T5ForConditionalGeneration(\n"," (shared): Embedding(32128, 1024)\n"," (encoder): T5Stack(\n"," (embed_tokens): Embedding(32128, 1024)\n"," (block): ModuleList(\n"," (0): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," (relative_attention_bias): Embedding(32, 16)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (1): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," 
(layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (2): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (3): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerFF(\n"," (DenseReluDense): 
T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (4): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (5): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, 
bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (6): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (7): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): 
NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (8): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (9): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (10): 
T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (11): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (12): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, 
out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (13): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (14): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, 
out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (15): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (16): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," 
(dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (17): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (18): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): 
Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (19): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (20): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): 
Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (21): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (22): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," 
(layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (23): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," )\n"," (final_layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (decoder): T5Stack(\n"," (embed_tokens): Embedding(32128, 1024)\n"," (block): ModuleList(\n"," (0): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," (relative_attention_bias): Embedding(32, 16)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerCrossAttention(\n"," (EncDecAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, 
bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (2): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (1): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerCrossAttention(\n"," (EncDecAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (2): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (2): 
T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerCrossAttention(\n"," (EncDecAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (2): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (3): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerCrossAttention(\n"," (EncDecAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, 
out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (2): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (4): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerCrossAttention(\n"," (EncDecAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (2): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): 
T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (5): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerCrossAttention(\n"," (EncDecAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (2): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (6): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerCrossAttention(\n"," (EncDecAttention): T5Attention(\n"," (q): 
Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (2): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (7): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerCrossAttention(\n"," (EncDecAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (2): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): 
Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (8): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerCrossAttention(\n"," (EncDecAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (2): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (9): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): 
T5LayerCrossAttention(\n"," (EncDecAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (2): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (10): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerCrossAttention(\n"," (EncDecAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (2): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): 
Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (11): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerCrossAttention(\n"," (EncDecAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (2): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (12): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): 
T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerCrossAttention(\n"," (EncDecAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (2): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (13): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerCrossAttention(\n"," (EncDecAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (2): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): 
Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (14): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerCrossAttention(\n"," (EncDecAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (2): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (15): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): 
Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerCrossAttention(\n"," (EncDecAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (2): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (16): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerCrossAttention(\n"," (EncDecAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (2): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," 
(wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (17): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerCrossAttention(\n"," (EncDecAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (2): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (18): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): 
Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerCrossAttention(\n"," (EncDecAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (2): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (19): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerCrossAttention(\n"," (EncDecAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," 
(2): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (20): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerCrossAttention(\n"," (EncDecAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (2): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (21): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): 
Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerCrossAttention(\n"," (EncDecAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (2): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (22): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerCrossAttention(\n"," (EncDecAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): 
T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (2): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (23): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerCrossAttention(\n"," (EncDecAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (2): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," )\n"," (final_layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (lm_head): 
Linear(in_features=1024, out_features=32128, bias=False)\n",")"]},"metadata":{},"execution_count":12}]},{"cell_type":"markdown","source":["# Helper functions"],"metadata":{"id":"F_SDAwxoawDy"}},{"cell_type":"code","source":["import torch"],"metadata":{"id":"rdWMg_KJZEZH","executionInfo":{"status":"ok","timestamp":1676654878826,"user_tz":-60,"elapsed":16,"user":{"displayName":"Mike2 Studia2","userId":"10506861792614965645"}}},"execution_count":13,"outputs":[]},{"cell_type":"code","source":["def calculate_accuracy(preds, target):\n","    \"\"\"Return the fraction of predictions equal to the target at the same index.\n","\n","    Args:\n","        preds: iterable of predicted labels.\n","        target: indexable sequence of expected labels, at least as long as preds.\n","\n","    Returns:\n","        Accuracy as a float in [0.0, 1.0]; 0.0 when preds is empty.\n","\n","    Raises:\n","        IndexError: if target has fewer items than preds.\n","    \"\"\"\n","    preds = list(preds)\n","    if not preds:\n","        # Nothing to score: return 0.0 instead of raising ZeroDivisionError.\n","        return 0.0\n","\n","    results_ok = sum(1.0 for idx, pred in enumerate(preds) if pred == target[idx])\n","    return results_ok / len(preds)"],"metadata":{"id":"FzUi8908ax61","executionInfo":{"status":"ok","timestamp":1676654878826,"user_tz":-60,"elapsed":15,"user":{"displayName":"Mike2 Studia2","userId":"10506861792614965645"}}},"execution_count":14,"outputs":[]},{"cell_type":"code","source":["if torch.cuda.is_available(): \n"," device = torch.device(\"cuda\")\n","\n"," print('There are %d GPU(s) available.' 
% torch.cuda.device_count())\n"," print('We will use the GPU:', torch.cuda.get_device_name(0))\n","\n","else:\n"," print('No GPU available, using the CPU instead.')\n"," device = torch.device(\"cpu\")"],"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"86i7iRmtW-6L","executionInfo":{"status":"ok","timestamp":1676654878826,"user_tz":-60,"elapsed":15,"user":{"displayName":"Mike2 Studia2","userId":"10506861792614965645"}},"outputId":"66e7c490-7cc0-4665-b342-284b55329d16"},"execution_count":15,"outputs":[{"output_type":"stream","name":"stdout","text":["There are 1 GPU(s) available.\n","We will use the GPU: Tesla T4\n"]}]},{"cell_type":"markdown","source":["# Predykcja"],"metadata":{"id":"H_YI3bS3VHQE"}},{"cell_type":"code","source":["# Rows 0, 123, 2000 and 3002 are left out of the evaluation set\n","# (presumably the examples behind few_shot_prefix -- TODO confirm).\n","# The slice is stored under a new name: reassigning parsed_dataset made this\n","# cell drop a different set of rows every time it was re-run.\n","eval_dataset = parsed_dataset[1:123] + parsed_dataset[124:2000] + parsed_dataset[2001:3002] + parsed_dataset[3003:]\n","predictions = []\n","expected = []\n","\n","# generate() samples below (do_sample=True), so seed torch first to make the\n","# reported accuracy and MCC reproducible across runs.\n","torch.manual_seed(42)\n","\n","for row in eval_dataset:\n","    input_text = few_shot_prefix + row['sms'] + \"\\nIs it true that the content of a text message is spam: \"\n","    input_ids = tokenizer(input_text, return_tensors=\"pt\").input_ids.to(device)\n","\n","    generated_ids = model.generate(input_ids, do_sample=True, temperature=0.9, max_length=250)\n","    generated_text = tokenizer.decode(generated_ids[0], skip_special_tokens=True, clean_up_tokenization_spaces=True)\n","\n","    # The decoded text is compared verbatim with row['label'] by calculate_accuracy.\n","    predictions.append(generated_text)\n","    expected.append(row['label'])\n","\n","acc = calculate_accuracy(predictions, expected)\n","print(acc)"],"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"vunLGuBGVGmh","executionInfo":{"status":"ok","timestamp":1676656236490,"user_tz":-60,"elapsed":905220,"user":{"displayName":"Mike2 Studia2","userId":"10506861792614965645"}},"outputId":"9cf4e39e-ebbc-4f36-9a07-17a392ddb8d2"},"execution_count":17,"outputs":[{"output_type":"stream","name":"stdout","text":["0.1433704635285663\n"]}]},{"cell_type":"code","source":["print(\"Sample prediction: {}, expected: 
{}\".format(predictions[101], expected[101]))"],"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"20WbYZmLaDl7","executionInfo":{"status":"ok","timestamp":1676656236491,"user_tz":-60,"elapsed":8,"user":{"displayName":"Mike2 Studia2","userId":"10506861792614965645"}},"outputId":"b1109d93-fbaa-42d4-9b36-c302e9e9f1ff"},"execution_count":18,"outputs":[{"output_type":"stream","name":"stdout","text":["Sample prediction: False, expected: False\n"]}]},{"cell_type":"markdown","source":["# MCC Score"],"metadata":{"id":"dLYc9WXz_B1o"}},{"cell_type":"code","source":["from sklearn.metrics import matthews_corrcoef\n","\n","# One MCC value is computed over all predictions at once; no batching happens in this cell.\n","print('Calculating Matthews Corr. Coef. over all predictions...')\n","matthews = matthews_corrcoef(expected, predictions)\n","print('Total MCC: %.3f' % matthews)"],"metadata":{"id":"hPEPpXXX_DXR","executionInfo":{"status":"ok","timestamp":1676656237402,"user_tz":-60,"elapsed":915,"user":{"displayName":"Mike2 Studia2","userId":"10506861792614965645"}},"colab":{"base_uri":"https://localhost:8080/"},"outputId":"d3862278-19af-4c01-85ef-51cfc63bbf9f"},"execution_count":19,"outputs":[{"output_type":"stream","name":"stdout","text":["Calculating Matthews Corr. Coef. 
for each batch...\n","Total MCC: 0.055\n"]}]},{"cell_type":"markdown","source":["# Save model"],"metadata":{"id":"GPhCp068_Iwq"}},{"cell_type":"code","source":["from google.colab import drive\n","\n","# Mount Google Drive; output_dir below lives under this mount point.\n","drive.mount('/content/gdrive/', force_remount=True)\n","\n","output_dir = '/content/gdrive/My Drive/UAM/Przetwarzanie-tekstu/Ver_4_FLAN-T5_Model'\n","print(\"Saving model to %s\" % output_dir)\n","\n","# Save the object behind model.module when that attribute exists, otherwise the model itself.\n","model_to_save = getattr(model, 'module', model)\n","model_to_save.save_pretrained(output_dir)\n","tokenizer.save_pretrained(output_dir)"],"metadata":{"id":"avafCMoS_KDF","colab":{"base_uri":"https://localhost:8080/"},"executionInfo":{"status":"ok","timestamp":1676656370608,"user_tz":-60,"elapsed":133210,"user":{"displayName":"Mike2 Studia2","userId":"10506861792614965645"}},"outputId":"11a9bbd2-c5aa-4147-bc0d-633cda86b955"},"execution_count":20,"outputs":[{"output_type":"stream","name":"stdout","text":["Mounted at /content/gdrive/\n","Saving model to /content/gdrive/My Drive/UAM/Przetwarzanie-tekstu/Ver_4_FLAN-T5_Model\n"]},{"output_type":"execute_result","data":{"text/plain":["('/content/gdrive/My Drive/UAM/Przetwarzanie-tekstu/Ver_4_FLAN-T5_Model/tokenizer_config.json',\n"," '/content/gdrive/My Drive/UAM/Przetwarzanie-tekstu/Ver_4_FLAN-T5_Model/special_tokens_map.json',\n"," '/content/gdrive/My Drive/UAM/Przetwarzanie-tekstu/Ver_4_FLAN-T5_Model/spiece.model',\n"," '/content/gdrive/My Drive/UAM/Przetwarzanie-tekstu/Ver_4_FLAN-T5_Model/added_tokens.json',\n"," '/content/gdrive/My Drive/UAM/Przetwarzanie-tekstu/Ver_4_FLAN-T5_Model/tokenizer.json')"]},"metadata":{},"execution_count":20}]},{"cell_type":"markdown","source":["# Bibliografia\n","- https://huggingface.co/docs/transformers/main/en/model_doc/flan-t5\n","- https://mccormickml.com/2019/07/22/BERT-fine-tuning/#a1-saving--loading-fine-tuned-model\n","- https://huggingface.co/docs/transformers/model_doc/t5#training"],"metadata":{"id":"wHzm2_nDA6i-"}}]}