Przetwarzanie_tekstu/projekt/Ver_6_FLAN-T5_sms_spam.ipynb
2023-02-17 19:21:51 +01:00

1 line
199 KiB
Plaintext
Raw Blame History

This file contains invisible Unicode characters

This file contains invisible Unicode characters that are indistinguishable to humans but may be processed differently by a computer. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

{"nbformat":4,"nbformat_minor":0,"metadata":{"colab":{"provenance":[]},"kernelspec":{"name":"python3","display_name":"Python 3"},"language_info":{"name":"python"},"gpuClass":"standard","widgets":{"application/vnd.jupyter.widget-state+json":{"c9c5041c2d734e449a3f480d27c6930f":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_93c307f83f8345569c6d5eb992facb8f","IPY_MODEL_0b1c4594b3394af9bf6bdb1f5c21efde","IPY_MODEL_8acffba7f8d841bca237676946643b85"],"layout":"IPY_MODEL_6cd1d313107b458fa45e5872c9ce66f0"}},"93c307f83f8345569c6d5eb992facb8f":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_d6a531cb1e5442398ad46a7555af15ff","placeholder":"","style":"IPY_MODEL_a682581443054d6ab11c4445b59ebaf8","value":"Downloading builder script: 100%"}},"0b1c4594b3394af9bf6bdb1f5c21efde":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_7eca2a8a527c417794f7902354dff4fa","max":3208,"min":0,"orientation":"horizontal","style":"IPY_MODEL_44c053a9f38d42ff8b1a37e7892a87d2","value":3208}},"8acffba7f8d841bca237676946643b85":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_086a54cdf54a4631b1d8aa8c835f74a5","placeholder":"","style":"IPY_MODEL_5334c04227694b0dbfca313b8b3c1b73","value":" 3.21k/3.21k [00:00&lt;00:00, 148kB/s]"}},"6cd1d313107b458fa45e5872c9ce66f0":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"d6a531cb1e5442398ad46a7555af15ff":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"a682581443054d6ab11c4445b59ebaf8":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"7eca2a8a527c417794f7902354dff4fa":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"44c053a9f38d42ff8b1a37e7892a87d2":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"086a54cdf54a4631b1d8aa8c835f74a5":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"5334c04227694b0dbfca313b8b3c1b73":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"ed0315a7a3734a9096b646d6087113d5":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_63e57336638c43269033927fea082b5e","IPY_MODEL_5c74805203c149a28b39b8a6673b3226","IPY_MODEL_bb1356f3522c48779c6ef331fd0cb258"],"layout":"IPY_MODEL_a9764585f1304fac85a4647205a07248"}},"63e57336638c43269033927fea082b5e":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_fe9a18c0f645464687a47a598c29856c","placeholder":"","style":"IPY_MODEL_4cac33b53d5c47bf9e2559a19d786ba7","value":"Downloading metadata: 100%"}},"5c74805203c149a28b39b8a6673b3226":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_c9c783ba8f2c47d2a63f6008c6c7ebf6","max":1687,"min":0,"orientation":"horizontal","style":"IPY_MODEL_97a86f253eed42059461528ac274ff5f","value":1687}},"bb1356f3522c48779c6ef331fd0cb258":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_db85eaf5afc64c258db557856084caa7","placeholder":"","style":"IPY_MODEL_08e5985a87ce49469632b644a0be1e4a","value":" 1.69k/1.69k [00:00&lt;00:00, 113kB/s]"}},"a9764585f1304fac85a4647205a07248":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"fe9a18c0f645464687a47a598c29856c":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"4cac33b53d5c47bf9e2559a19d786ba7":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"c9c783ba8f2c47d2a63f6008c6c7ebf6":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"97a86f253eed42059461528ac274ff5f":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"db85eaf5afc64c258db557856084caa7":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"08e5985a87ce49469632b644a0be1e4a":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"6705f6b0f9754c0ebc4cb0dc1a37ac94":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_3843c8652968472fb3bfb4ce97b7c45b","IPY_MODEL_a248a43d17ab4633b88a1621942d4757","IPY_MODEL_37c5cf19bd0646aa9ce53218326424f7"],"layout":"IPY_MODEL_f55517fb17e0463e8c8b01f358534914"}},"3843c8652968472fb3bfb4ce97b7c45b":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_fddbdaedf5654097942c38002a299e3f","placeholder":"","style":"IPY_MODEL_10ed5de382e244d8a56c47c76d90748f","value":"Downloading readme: 100%"}},"a248a43d17ab4633b88a1621942d4757":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_e559dfd597ad454b8d8c2ee005901a35","max":4872,"min":0,"orientation":"horizontal","style":"IPY_MODEL_f48f84cd18ab43b39bf2ca69599ad8c7","value":4872}},"37c5cf19bd0646aa9ce53218326424f7":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_1c40bc5715ea448697ac53773d86237a","placeholder":"","style":"IPY_MODEL_fc419546e84144349e9c533a8176d4e4","value":" 4.87k/4.87k [00:00&lt;00:00, 87.7kB/s]"}},"f55517fb17e0463e8c8b01f358534914":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"fddbdaedf5654097942c38002a299e3f":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"10ed5de382e244d8a56c47c76d90748f":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"e559dfd597ad454b8d8c2ee005901a35":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"f48f84cd18ab43b39bf2ca69599ad8c7":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"1c40bc5715ea448697ac53773d86237a":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"fc419546e84144349e9c533a8176d4e4":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"9b3a088c8a7a49b496c6b2e5d2d474dd":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_a803fe9e84344cdfac171dc6343121e5","IPY_MODEL_12f4b7d3045340d99001a098e0600c64","IPY_MODEL_a92495c6264a4256b9d1c4dd207d9041"],"layout":"IPY_MODEL_c0f1d46ebbdc4bfe8d31985f71875962"}},"a803fe9e84344cdfac171dc6343121e5":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_e2a740892ddf477ba0b404b1e7e2cd88","placeholder":"","style":"IPY_MODEL_b4eb68bbd452409f8faf6f77093f84da","value":"Downloading data: 100%"}},"12f4b7d3045340d99001a098e0600c64":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_9f8452af363d4a0daf38a7edf7d0a540","max":203415,"min":0,"orientation":"horizontal","style":"IPY_MODEL_ec09103848594bc38e167a16a407cc04","value":203415}},"a92495c6264a4256b9d1c4dd207d9041":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_5b8f226314054f1f893d922347c31055","placeholder":"","style":"IPY_MODEL_9e4f882e90234dbca0702be76099be77","value":" 203k/203k [00:00&lt;00:00, 231kB/s]"}},"c0f1d46ebbdc4bfe8d31985f71875962":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"e2a740892ddf477ba0b404b1e7e2cd88":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"b4eb68bbd452409f8faf6f77093f84da":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"9f8452af363d4a0daf38a7edf7d0a540":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"ec09103848594bc38e167a16a407cc04":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"5b8f226314054f1f893d922347c31055":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"9e4f882e90234dbca0702be76099be77":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"ef20074dae184d8cb1ead4ce74c2df0b":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_b4721cb7a4f1486384078edb29a219f5","IPY_MODEL_b8194c781462455ab6b975689d934be3","IPY_MODEL_4cafb17414cf4413b70b04381b3783ca"],"layout":"IPY_MODEL_70819e011c9a4e759758ec8b1e6116f4"}},"b4721cb7a4f1486384078edb29a219f5":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_bfd5db4a4c9f4a0a9165e3b3a34f6e32","placeholder":"","style":"IPY_MODEL_50586a5a007f438d94dad66ad03ca1ba","value":"Generating train split: 96%"}},"b8194c781462455ab6b975689d934be3":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"","description":"","description_tooltip":null,"layout":"IPY_MODEL_7295282fb11d4c95aac18ce9047f4da2","max":5574,"min":0,"orientation":"horizontal","style":"IPY_MODEL_1354813182d7427b87f56a8aafc06c34","value":5574}},"4cafb17414cf4413b70b04381b3783ca":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_eaadb5abf84d455994f5378aac2a293c","placeholder":"","style":"IPY_MODEL_dc7f94f8535a4734a3cd9fc9cef5fc2e","value":" 5332/5574 [00:00&lt;00:00, 6106.61 examples/s]"}},"70819e011c9a4e759758ec8b1e6116f4":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":"hidden","width":null}},"bfd5db4a4c9f4a0a9165e3b3a34f6e32":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"50586a5a007f438d94dad66ad03ca1ba":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"7295282fb11d4c95aac18ce9047f4da2":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"1354813182d7427b87f56a8aafc06c34":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"eaadb5abf84d455994f5378aac2a293c":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"dc7f94f8535a4734a3cd9fc9cef5fc2e":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"e5985e951e854e4fbdc8983b57830209":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_14ecc67173cd4eb2a20d51f817a01a29","IPY_MODEL_bd66d5b4736647a89ec35d65d55f7556","IPY_MODEL_eece11a05e874005ae2532f8139490d0"],"layout":"IPY_MODEL_7ba99dc8284d436f83a341d914e3b226"}},"14ecc67173cd4eb2a20d51f817a01a29":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_91b51e4d897843648bc69a4dc684f4bf","placeholder":"","style":"IPY_MODEL_def43747b4624cd693383277e8520e1a","value":"100%"}},"bd66d5b4736647a89ec35d65d55f7556":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_438240aff4aa4c30ab5dc8a1159f32be","max":1,"min":0,"orientation":"horizontal","style":"IPY_MODEL_12772e6a0d1d40e9934ba6c663896c17","value":1}},"eece11a05e874005ae2532f8139490d0":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_68911a228fc343bbb84fd7f6b53f5fb4","placeholder":"","style":"IPY_MODEL_9de6fd732fbb4ff5b917f8250710d342","value":" 1/1 [00:00&lt;00:00, 10.37it/s]"}},"7ba99dc8284d436f83a341d914e3b226":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"91b51e4d897843648bc69a4dc684f4bf":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"def43747b4624cd693383277e8520e1a":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"438240aff4aa4c30ab5dc8a1159f32be":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"12772e6a0d1d40e9934ba6c663896c17":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"68911a228fc343bbb84fd7f6b53f5fb4":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"9de6fd732fbb4ff5b917f8250710d342":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"ac64c83f91604136a8605a458cfdb558":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_a51333fd9ed341119a8517ead52bed95","IPY_MODEL_b975f63617a6419d826d5999c33dadcd","IPY_MODEL_71f6deb181d04ac495d8be7405a9daea"],"layout":"IPY_MODEL_d5d18a69055b496fb29c737c940c6a3d"}},"a51333fd9ed341119a8517ead52bed95":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_2225a24fcae94178a948e2f05d7499db","placeholder":"","style":"IPY_MODEL_d57673cadfd245e49e339f780362d602","value":"Downloading (…)okenizer_config.json: 100%"}},"b975f63617a6419d826d5999c33dadcd":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_b084661df41c4fa4a69c546ddcaf519c","max":2539,"min":0,"orientation":"horizontal","style":"IPY_MODEL_da2ba9bcf72b44348065ec345f554008","value":2539}},"71f6deb181d04ac495d8be7405a9daea":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_3db12e0df160443c8da290f79d903457","placeholder":"","style":"IPY_MODEL_2db89d52056c47c2b006c44fe89bce32","value":" 2.54k/2.54k [00:00&lt;00:00, 94.1kB/s]"}},"d5d18a69055b496fb29c737c940c6a3d":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"2225a24fcae94178a948e2f05d7499db":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"d57673cadfd245e49e339f780362d602":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"b084661df41c4fa4a69c546ddcaf519c":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"da2ba9bcf72b44348065ec345f554008":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"3db12e0df160443c8da290f79d903457":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"2db89d52056c47c2b006c44fe89bce32":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"b9a1683bd7c44127a700a62df09c2740":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_82755a88b96941869f355139ff33a34c","IPY_MODEL_17dd1a7fa4e84a1481d312dd1e28923a","IPY_MODEL_46a6f706851e4560b89141611e15622a"],"layout":"IPY_MODEL_17e7ff1b5cb7470fac1f0f38121249e3"}},"82755a88b96941869f355139ff33a34c":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_220022b208354cee812400428d506b0e","placeholder":"","style":"IPY_MODEL_cc04a0bcdec04b87a50de06e9608e0a8","value":"Downloading (…)&quot;spiece.model&quot;;: 100%"}},"17dd1a7fa4e84a1481d312dd1e28923a":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_7f4c9a22e5a248dcbe6c4ab8914f2b88","max":791656,"min":0,"orientation":"horizontal","style":"IPY_MODEL_2aca6bfbf4a042bd9cdabac6faea656a","value":791656}},"46a6f706851e4560b89141611e15622a":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_82fa70ea09ad4c4eb2093f98be68e8bd","placeholder":"","style":"IPY_MODEL_f4f79c7b555743f781455e50e7ad5195","value":" 792k/792k [00:00&lt;00:00, 12.9MB/s]"}},"17e7ff1b5cb7470fac1f0f38121249e3":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"220022b208354cee812400428d506b0e":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"cc04a0bcdec04b87a50de06e9608e0a8":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"7f4c9a22e5a248dcbe6c4ab8914f2b88":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"2aca6bfbf4a042bd9cdabac6faea656a":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"82fa70ea09ad4c4eb2093f98be68e8bd":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"f4f79c7b555743f781455e50e7ad5195":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"65666ee0fa8a4deba2622e36080ecd97":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_dfc256fdbbde41d383cfd17a816a03af","IPY_MODEL_f0943adb3d7e49acae2884996ef84e55","IPY_MODEL_a10e0d0a45354a8cab4a35b4a386002d"],"layout":"IPY_MODEL_60ad900c6fd34543991b0cc8f0d79a4b"}},"dfc256fdbbde41d383cfd17a816a03af":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_11ff41869104483a931cd5a43fd74c4e","placeholder":"","style":"IPY_MODEL_a9cfc053290c4a08b22e53c05c42e87b","value":"Downloading (…)/main/tokenizer.json: 100%"}},"f0943adb3d7e49acae2884996ef84e55":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_ed3e08f7e12c42559538eadc46f14809","max":2424064,"min":0,"orientation":"horizontal","style":"IPY_MODEL_6848b004ea514c2c9ae116238dba366a","value":2424064}},"a10e0d0a45354a8cab4a35b4a386002d":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_3e4929d3364347d78c15da39b2551946","placeholder":"","style":"IPY_MODEL_83dd446c6cca41d5b223b1aceb2b3a81","value":" 2.42M/2.42M [00:01&lt;00:00, 1.55MB/s]"}},"60ad900c6fd34543991b0cc8f0d79a4b":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"11ff41869104483a931cd5a43fd74c4e":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"a9cfc053290c4a08b22e53c05c42e87b":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"ed3e08f7e12c42559538eadc46f14809":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"6848b004ea514c2c9ae116238dba366a":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"3e4929d3364347d78c15da39b2551946":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"83dd446c6cca41d5b223b1aceb2b3a81":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"ad2b545f2d664bfcb1741a22db968a2c":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_57c9b5f2ac4445678ca22097a0222a03","IPY_MODEL_eb514ffa1ffa4d749f7fbdbb63733f8f","IPY_MODEL_3832a5693a3b40de8b27994db2538349"],"layout":"IPY_MODEL_565869b254044fa38b7df55e68bab5fd"}},"57c9b5f2ac4445678ca22097a0222a03":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_38c015739d2e4c99a3834959c0563950","placeholder":"","style":"IPY_MODEL_051a111f2e2d4e389cb34475b7d9d5d9","value":"Downloading (…)cial_tokens_map.json: 100%"}},"eb514ffa1ffa4d749f7fbdbb63733f8f":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_56bf48cbe4aa48c3aea421cb37812259","max":2201,"min":0,"orientation":"horizontal","style":"IPY_MODEL_c7990b0e47894b84af6b799ac005e994","value":2201}},"3832a5693a3b40de8b27994db2538349":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_5a31c0906b7d4fc38689030779748823","placeholder":"","style":"IPY_MODEL_9adaf24ddb6b4ac0a8cda15269e5106f","value":" 2.20k/2.20k [00:00&lt;00:00, 58.4kB/s]"}},"565869b254044fa38b7df55e68bab5fd":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"38c015739d2e4c99a3834959c0563950":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"051a111f2e2d4e389cb34475b7d9d5d9":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"56bf48cbe4aa48c3aea421cb37812259":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"c7990b0e47894b84af6b799ac005e994":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"5a31c0906b7d4fc38689030779748823":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"9adaf24ddb6b4ac0a8cda15269e5106f":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"902d51de5d15490b8e40d51cb9d2a6d7":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_f745f516f9814e7293f677e50eaded2f","IPY_MODEL_7761bcc878504db19a4b2662cfdf61a9","IPY_MODEL_ab1cfad8dc994780b6b980b751531e0e"],"layout":"IPY_MODEL_356fa367dabf4efb9c0f858bcd582db5"}},"f745f516f9814e7293f677e50eaded2f":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_a76f15514a734a2ca57c95d6e5d28c1a","placeholder":"","style":"IPY_MODEL_2895697d2a7b4a4988cb782b45744af0","value":"Downloading (…)lve/main/config.json: 100%"}},"7761bcc878504db19a4b2662cfdf61a9":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_c5ff7a768dc6432cab747b037bc99480","max":662,"min":0,"orientation":"horizontal","style":"IPY_MODEL_233a81cabbbe404e87d98de3eb641fc0","value":662}},"ab1cfad8dc994780b6b980b751531e0e":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_d7950561457141e98485648c507beae4","placeholder":"","style":"IPY_MODEL_e2a49b71a2be4b818d34549552158f21","value":" 662/662 [00:00&lt;00:00, 16.4kB/s]"}},"356fa367dabf4efb9c0f858bcd582db5":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"a76f15514a734a2ca57c95d6e5d28c1a":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"2895697d2a7b4a4988cb782b45744af0":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"c5ff7a768dc6432cab747b037bc99480":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"233a81cabbbe404e87d98de3eb641fc0":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"d7950561457141e98485648c507beae4":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"e2a49b71a2be4b818d34549552158f21":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"8b43cd40eb594e3d974fb47a63013eba":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_ca360690cbc348fcb0b594cc56434017","IPY_MODEL_b95287e1033b4645a21029cb4ffab619","IPY_MODEL_81ea2572afde4cb09ac364307785d38d"],"layout":"IPY_MODEL_23bbfb2b32044784a49e7b08b90e1302"}},"ca360690cbc348fcb0b594cc56434017":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_33ca6db178b84da19661fc3d62e09abb","placeholder":"","style":"IPY_MODEL_2da3ecb995514cb7a2fac91f49165f24","value":"Downloading (…)&quot;pytorch_model.bin&quot;;: 100%"}},"b95287e1033b4645a21029cb4ffab619":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_994a0a3fb8de4798bc5c3e34b27d2aa0","max":3132781861,"min":0,"orientation":"horizontal","style":"IPY_MODEL_15896f0b77164af7bdeb365755b3d478","value":3132781861}},"81ea2572afde4cb09ac364307785d38d":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_f1566112e762430397c9116cca9aa39b","placeholder":"","style":"IPY_MODEL_d33d0c19f0b542c5ac07ac1f2858e3a7","value":" 3.13G/3.13G [00:12&lt;00:00, 250MB/s]"}},"23bbfb2b32044784a49e7b08b90e1302":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"33ca6db178b84da19661fc3d62e09abb":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"2da3ecb995514cb7a2fac91f49165f24":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"994a0a3fb8de4798bc5c3e34b27d2aa0":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"15896f0b77164af7bdeb365755b3d478":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"f1566112e762430397c9116cca9aa39b":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"d33d0c19f0b542c5ac07ac1f2858e3a7":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"b135be3639114a6ab0c587f08a889c82":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_9d8979ec18384dc2a297ce9a68d9bd9c","IPY_MODEL_3cce22420ff046d9872b08ce23e725a1","IPY_MODEL_f057f834fc8c45e4b46809f2ee1abad9"],"layout":"IPY_MODEL_2b0d399693ec4f8b9065e477fb573e1a"}},"9d8979ec18384dc2a297ce9a68d9bd9c":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_d53e8179d299450083ddf7e2cb1e473e","placeholder":"","style":"IPY_MODEL_7b38475b1275447cae202d0b60e6a207","value":"Downloading (…)neration_config.json: 100%"}},"3cce22420ff046d9872b08ce23e725a1":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_c27eec62191a46b7b37dbb72d3e7e864","max":147,"min":0,"orientation":"horizontal","style":"IPY_MODEL_5d250db552db494a815fa3ea51592e68","value":147}},"f057f834fc8c45e4b46809f2ee1abad9":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_fd3fec011f284d05b5d7d5e906174582","placeholder":"","style":"IPY_MODEL_a40e99f09452422b9460d9ec7a5f127e","value":" 147/147 [00:00&lt;00:00, 5.18kB/s]"}},"2b0d399693ec4f8b9065e477fb573e1a":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"d53e8179d299450083ddf7e2cb1e473e":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"7b38475b1275447cae202d0b60e6a207":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"c27eec62191a46b7b37dbb72d3e7e864":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"5d250db552db494a815fa3ea51592e68":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"fd3fec011f284d05b5d7d5e906174582":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"a40e99f09452422b9460d9ec7a5f127e":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}}}},"accelerator":"GPU"},"cells":[{"cell_type":"markdown","source":["# Instalacja pakietów"],"metadata":{"id":"ZXsOR6oJOJbd"}},{"cell_type":"code","execution_count":1,"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"8l0hzptKNiZS","executionInfo":{"status":"ok","timestamp":1676655752895,"user_tz":-60,"elapsed":22903,"user":{"displayName":"Mike4 Studia4","userId":"02075505067789671500"}},"outputId":"e2ee6c4b-82e8-40b0-8c81-9c0b63be98f1"},"outputs":[{"output_type":"stream","name":"stdout","text":["Looking in indexes: https://pypi.org/simple, https://us-python.pkg.dev/colab-wheels/public/simple/\n","Collecting transformers\n"," Downloading transformers-4.26.1-py3-none-any.whl (6.3 MB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m6.3/6.3 MB\u001b[0m \u001b[31m40.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hCollecting datasets\n"," Downloading datasets-2.9.0-py3-none-any.whl (462 kB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m462.8/462.8 KB\u001b[0m \u001b[31m24.0 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hRequirement already satisfied: torch in /usr/local/lib/python3.8/dist-packages (1.13.1+cu116)\n","Collecting sentencepiece\n"," Downloading sentencepiece-0.1.97-cp38-cp38-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (1.3 MB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m1.3/1.3 MB\u001b[0m \u001b[31m29.1 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hRequirement already satisfied: filelock in /usr/local/lib/python3.8/dist-packages (from transformers) (3.9.0)\n","Collecting tokenizers!=0.11.3,<0.14,>=0.11.1\n"," Downloading tokenizers-0.13.2-cp38-cp38-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (7.6 MB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m7.6/7.6 MB\u001b[0m \u001b[31m59.9 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hRequirement already satisfied: requests in /usr/local/lib/python3.8/dist-packages (from transformers) (2.25.1)\n","Requirement already satisfied: regex!=2019.12.17 in /usr/local/lib/python3.8/dist-packages (from transformers) (2022.6.2)\n","Requirement already satisfied: packaging>=20.0 in /usr/local/lib/python3.8/dist-packages (from transformers) (23.0)\n","Requirement already satisfied: pyyaml>=5.1 in /usr/local/lib/python3.8/dist-packages (from transformers) (6.0)\n","Requirement already satisfied: tqdm>=4.27 in /usr/local/lib/python3.8/dist-packages (from transformers) (4.64.1)\n","Requirement already satisfied: numpy>=1.17 in /usr/local/lib/python3.8/dist-packages (from transformers) (1.21.6)\n","Collecting huggingface-hub<1.0,>=0.11.0\n"," Downloading huggingface_hub-0.12.1-py3-none-any.whl (190 kB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m190.3/190.3 KB\u001b[0m \u001b[31m7.3 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hRequirement already satisfied: pandas in /usr/local/lib/python3.8/dist-packages (from datasets) (1.3.5)\n","Requirement already satisfied: aiohttp in /usr/local/lib/python3.8/dist-packages (from datasets) (3.8.4)\n","Requirement already satisfied: dill<0.3.7 in /usr/local/lib/python3.8/dist-packages (from datasets) (0.3.6)\n","Collecting multiprocess\n"," Downloading multiprocess-0.70.14-py38-none-any.whl (132 kB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m132.0/132.0 KB\u001b[0m \u001b[31m9.9 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hRequirement already satisfied: fsspec[http]>=2021.11.1 in /usr/local/lib/python3.8/dist-packages (from datasets) (2023.1.0)\n","Requirement already satisfied: pyarrow>=6.0.0 in /usr/local/lib/python3.8/dist-packages (from datasets) (9.0.0)\n","Collecting xxhash\n"," Downloading xxhash-3.2.0-cp38-cp38-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (213 kB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m213.0/213.0 KB\u001b[0m \u001b[31m4.6 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hCollecting responses<0.19\n"," Downloading responses-0.18.0-py3-none-any.whl (38 kB)\n","Requirement already satisfied: typing-extensions in /usr/local/lib/python3.8/dist-packages (from torch) (4.5.0)\n","Requirement already satisfied: frozenlist>=1.1.1 in /usr/local/lib/python3.8/dist-packages (from aiohttp->datasets) (1.3.3)\n","Requirement already satisfied: charset-normalizer<4.0,>=2.0 in /usr/local/lib/python3.8/dist-packages (from aiohttp->datasets) (3.0.1)\n","Requirement already satisfied: aiosignal>=1.1.2 in /usr/local/lib/python3.8/dist-packages (from aiohttp->datasets) (1.3.1)\n","Requirement already satisfied: multidict<7.0,>=4.5 in /usr/local/lib/python3.8/dist-packages (from aiohttp->datasets) (6.0.4)\n","Requirement already satisfied: async-timeout<5.0,>=4.0.0a3 in /usr/local/lib/python3.8/dist-packages (from aiohttp->datasets) (4.0.2)\n","Requirement already satisfied: yarl<2.0,>=1.0 in /usr/local/lib/python3.8/dist-packages (from aiohttp->datasets) (1.8.2)\n","Requirement already satisfied: attrs>=17.3.0 in /usr/local/lib/python3.8/dist-packages (from aiohttp->datasets) (22.2.0)\n","Requirement already satisfied: idna<3,>=2.5 in /usr/local/lib/python3.8/dist-packages (from requests->transformers) (2.10)\n","Requirement already satisfied: chardet<5,>=3.0.2 in /usr/local/lib/python3.8/dist-packages (from requests->transformers) (4.0.0)\n","Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.8/dist-packages (from requests->transformers) (2022.12.7)\n","Requirement already satisfied: urllib3<1.27,>=1.21.1 in /usr/local/lib/python3.8/dist-packages (from requests->transformers) (1.24.3)\n","Collecting urllib3<1.27,>=1.21.1\n"," Downloading urllib3-1.26.14-py2.py3-none-any.whl (140 kB)\n","\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m140.6/140.6 KB\u001b[0m \u001b[31m9.4 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n","\u001b[?25hRequirement already satisfied: python-dateutil>=2.7.3 in /usr/local/lib/python3.8/dist-packages (from pandas->datasets) (2.8.2)\n","Requirement already satisfied: pytz>=2017.3 in /usr/local/lib/python3.8/dist-packages (from pandas->datasets) (2022.7.1)\n","Requirement already satisfied: six>=1.5 in /usr/local/lib/python3.8/dist-packages (from python-dateutil>=2.7.3->pandas->datasets) (1.15.0)\n","Installing collected packages: tokenizers, sentencepiece, xxhash, urllib3, multiprocess, responses, huggingface-hub, transformers, datasets\n"," Attempting uninstall: urllib3\n"," Found existing installation: urllib3 1.24.3\n"," Uninstalling urllib3-1.24.3:\n"," Successfully uninstalled urllib3-1.24.3\n","Successfully installed datasets-2.9.0 huggingface-hub-0.12.1 multiprocess-0.70.14 responses-0.18.0 sentencepiece-0.1.97 tokenizers-0.13.2 transformers-4.26.1 urllib3-1.26.14 xxhash-3.2.0\n"]}],"source":["!pip install transformers datasets torch sentencepiece"]},{"cell_type":"markdown","source":["# Załadowanie datasetu"],"metadata":{"id":"dhN0rmb5Oi3d"}},{"cell_type":"code","source":["from datasets import load_dataset"],"metadata":{"id":"tnaDkwZ2Pbnn","executionInfo":{"status":"ok","timestamp":1676655754295,"user_tz":-60,"elapsed":1405,"user":{"displayName":"Mike4 Studia4","userId":"02075505067789671500"}}},"execution_count":2,"outputs":[]},{"cell_type":"code","source":["dataset = load_dataset(\"sms_spam\")"],"metadata":{"colab":{"base_uri":"https://localhost:8080/","height":232,"referenced_widgets":["c9c5041c2d734e449a3f480d27c6930f","93c307f83f8345569c6d5eb992facb8f","0b1c4594b3394af9bf6bdb1f5c21efde","8acffba7f8d841bca237676946643b85","6cd1d313107b458fa45e5872c9ce66f0","d6a531cb1e5442398ad46a7555af15ff","a682581443054d6ab11c4445b59ebaf8","7eca2a8a527c417794f7902354dff4fa","44c053a9f38d42ff8b1a37e7892a87d2","086a54cdf54a4631b1d8aa8c835f74a5","5334c04227694b0dbfca313b8b3c1b73","ed0315a7a3734a9096b646d6087113d5","63e57336638c43269033927fea082b5e","5c74805203c149a28b39b8a6673b3226","bb1356f3522c48779c6ef331fd0cb258","a9764585f1304fac85a4647205a07248","fe9a18c0f645464687a47a598c29856c","4cac33b53d5c47bf9e2559a19d786ba7","c9c783ba8f2c47d2a63f6008c6c7ebf6","97a86f253eed42059461528ac274ff5f","db85eaf5afc64c258db557856084caa7","08e5985a87ce49469632b644a0be1e4a","6705f6b0f9754c0ebc4cb0dc1a37ac94","3843c8652968472fb3bfb4ce97b7c45b","a248a43d17ab4633b88a1621942d4757","37c5cf19bd0646aa9ce53218326424f7","f55517fb17e0463e8c8b01f358534914","fddbdaedf5654097942c38002a299e3f","10ed5de382e244d8a56c47c76d90748f","e559dfd597ad454b8d8c2ee005901a35","f48f84cd18ab43b39bf2ca69599ad8c7","1c40bc5715ea448697ac53773d86237a","fc419546e84144349e9c533a8176d4e4","9b3a088c8a7a49b496c6b2e5d2d474dd","a803fe9e84344cdfac171dc6343121e5","12f4b7d3045340d99001a098e0600c64","a92495c6264a4256b9d1c4dd207d9041","c0f1d46ebbdc4bfe8d31985f71875962","e2a740892ddf477ba0b404b1e7e2cd88","b4eb68bbd452409f8faf6f77093f84da","9f8452af363d4a0daf38a7edf7d0a540","ec09103848594bc38e167a16a407cc04","5b8f226314054f1f893d922347c31055","9e4f882e90234dbca0702be76099be77","ef20074dae184d8cb1ead4ce74c2df0b","b4721cb7a4f1486384078edb29a219f5","b8194c781462455ab6b975689d934be3","4cafb17414cf4413b70b04381b3783ca","70819e011c9a4e759758ec8b1e6116f4","bfd5db4a4c9f4a0a9165e3b3a34f6e32","50586a5a007f438d94dad66ad03ca1ba","7295282fb11d4c95aac18ce9047f4da2","1354813182d7427b87f56a8aafc06c34","eaadb5abf84d455994f5378aac2a293c","dc7f94f8535a4734a3cd9fc9cef5fc2e","e5985e951e854e4fbdc8983b57830209","14ecc67173cd4eb2a20d51f817a01a29","bd66d5b4736647a89ec35d65d55f7556","eece11a05e874005ae2532f8139490d0","7ba99dc8284d436f83a341d914e3b226","91b51e4d897843648bc69a4dc684f4bf","def43747b4624cd693383277e8520e1a","438240aff4aa4c30ab5dc8a1159f32be","12772e6a0d1d40e9934ba6c663896c17","68911a228fc343bbb84fd7f6b53f5fb4","9de6fd732fbb4ff5b917f8250710d342"]},"id":"cCiAuRqrOkvV","executionInfo":{"status":"ok","timestamp":1676655766016,"user_tz":-60,"elapsed":11725,"user":{"displayName":"Mike4 Studia4","userId":"02075505067789671500"}},"outputId":"71c3bce0-d144-4064-c952-e39350da5879"},"execution_count":3,"outputs":[{"output_type":"display_data","data":{"text/plain":["Downloading builder script: 0%| | 0.00/3.21k [00:00<?, ?B/s]"],"application/vnd.jupyter.widget-view+json":{"version_major":2,"version_minor":0,"model_id":"c9c5041c2d734e449a3f480d27c6930f"}},"metadata":{}},{"output_type":"display_data","data":{"text/plain":["Downloading metadata: 0%| | 0.00/1.69k [00:00<?, ?B/s]"],"application/vnd.jupyter.widget-view+json":{"version_major":2,"version_minor":0,"model_id":"ed0315a7a3734a9096b646d6087113d5"}},"metadata":{}},{"output_type":"display_data","data":{"text/plain":["Downloading readme: 0%| | 0.00/4.87k [00:00<?, ?B/s]"],"application/vnd.jupyter.widget-view+json":{"version_major":2,"version_minor":0,"model_id":"6705f6b0f9754c0ebc4cb0dc1a37ac94"}},"metadata":{}},{"output_type":"stream","name":"stdout","text":["Downloading and preparing dataset sms_spam/plain_text to /root/.cache/huggingface/datasets/sms_spam/plain_text/1.0.0/53f051d3b5f62d99d61792c91acefe4f1577ad3e4c216fb0ad39e30b9f20019c...\n"]},{"output_type":"display_data","data":{"text/plain":["Downloading data: 0%| | 0.00/203k [00:00<?, ?B/s]"],"application/vnd.jupyter.widget-view+json":{"version_major":2,"version_minor":0,"model_id":"9b3a088c8a7a49b496c6b2e5d2d474dd"}},"metadata":{}},{"output_type":"display_data","data":{"text/plain":["Generating train split: 0%| | 0/5574 [00:00<?, ? examples/s]"],"application/vnd.jupyter.widget-view+json":{"version_major":2,"version_minor":0,"model_id":"ef20074dae184d8cb1ead4ce74c2df0b"}},"metadata":{}},{"output_type":"stream","name":"stdout","text":["Dataset sms_spam downloaded and prepared to /root/.cache/huggingface/datasets/sms_spam/plain_text/1.0.0/53f051d3b5f62d99d61792c91acefe4f1577ad3e4c216fb0ad39e30b9f20019c. Subsequent calls will reuse this data.\n"]},{"output_type":"display_data","data":{"text/plain":[" 0%| | 0/1 [00:00<?, ?it/s]"],"application/vnd.jupyter.widget-view+json":{"version_major":2,"version_minor":0,"model_id":"e5985e951e854e4fbdc8983b57830209"}},"metadata":{}}]},{"cell_type":"code","source":["dataset['train'][0]"],"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"JKFHPko3OnAV","executionInfo":{"status":"ok","timestamp":1676655766016,"user_tz":-60,"elapsed":19,"user":{"displayName":"Mike4 Studia4","userId":"02075505067789671500"}},"outputId":"568dc1d5-85a9-444a-e75a-4632ec63707d"},"execution_count":4,"outputs":[{"output_type":"execute_result","data":{"text/plain":["{'sms': 'Go until jurong point, crazy.. Available only in bugis n great world la e buffet... Cine there got amore wat...\\n',\n"," 'label': 0}"]},"metadata":{},"execution_count":4}]},{"cell_type":"markdown","source":["# Przygotowanie datasetu"],"metadata":{"id":"l140vJrgYxPr"}},{"cell_type":"code","source":["parsed_dataset = []\n","\n","for row in dataset['train']:\n"," text = row['sms'].replace(\"\\n\", \"\")\n"," new_row = {}\n"," new_row['sms'] = text\n"," if row['label'] == 0:\n"," new_row['label'] = \"False\"\n"," else:\n"," new_row['label'] = \"True\"\n"," parsed_dataset.append(new_row)\n","\n","parsed_dataset[0]"],"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"1boUF-YiY3_y","executionInfo":{"status":"ok","timestamp":1676655766703,"user_tz":-60,"elapsed":703,"user":{"displayName":"Mike4 Studia4","userId":"02075505067789671500"}},"outputId":"1855e54f-cca7-46d4-b456-b7ef96820992"},"execution_count":5,"outputs":[{"output_type":"execute_result","data":{"text/plain":["{'sms': 'Go until jurong point, crazy.. Available only in bugis n great world la e buffet... Cine there got amore wat...',\n"," 'label': 'False'}"]},"metadata":{},"execution_count":5}]},{"cell_type":"markdown","source":["# Tokenizer FLAN-T5"],"metadata":{"id":"O-J-jBDxPJcn"}},{"cell_type":"code","source":["from transformers import AutoTokenizer"],"metadata":{"id":"P23AYPX1PZ6g","executionInfo":{"status":"ok","timestamp":1676655769374,"user_tz":-60,"elapsed":2673,"user":{"displayName":"Mike4 Studia4","userId":"02075505067789671500"}}},"execution_count":6,"outputs":[]},{"cell_type":"code","source":["tokenizer = AutoTokenizer.from_pretrained('google/flan-t5-large')"],"metadata":{"colab":{"base_uri":"https://localhost:8080/","height":145,"referenced_widgets":["ac64c83f91604136a8605a458cfdb558","a51333fd9ed341119a8517ead52bed95","b975f63617a6419d826d5999c33dadcd","71f6deb181d04ac495d8be7405a9daea","d5d18a69055b496fb29c737c940c6a3d","2225a24fcae94178a948e2f05d7499db","d57673cadfd245e49e339f780362d602","b084661df41c4fa4a69c546ddcaf519c","da2ba9bcf72b44348065ec345f554008","3db12e0df160443c8da290f79d903457","2db89d52056c47c2b006c44fe89bce32","b9a1683bd7c44127a700a62df09c2740","82755a88b96941869f355139ff33a34c","17dd1a7fa4e84a1481d312dd1e28923a","46a6f706851e4560b89141611e15622a","17e7ff1b5cb7470fac1f0f38121249e3","220022b208354cee812400428d506b0e","cc04a0bcdec04b87a50de06e9608e0a8","7f4c9a22e5a248dcbe6c4ab8914f2b88","2aca6bfbf4a042bd9cdabac6faea656a","82fa70ea09ad4c4eb2093f98be68e8bd","f4f79c7b555743f781455e50e7ad5195","65666ee0fa8a4deba2622e36080ecd97","dfc256fdbbde41d383cfd17a816a03af","f0943adb3d7e49acae2884996ef84e55","a10e0d0a45354a8cab4a35b4a386002d","60ad900c6fd34543991b0cc8f0d79a4b","11ff41869104483a931cd5a43fd74c4e","a9cfc053290c4a08b22e53c05c42e87b","ed3e08f7e12c42559538eadc46f14809","6848b004ea514c2c9ae116238dba366a","3e4929d3364347d78c15da39b2551946","83dd446c6cca41d5b223b1aceb2b3a81","ad2b545f2d664bfcb1741a22db968a2c","57c9b5f2ac4445678ca22097a0222a03","eb514ffa1ffa4d749f7fbdbb63733f8f","3832a5693a3b40de8b27994db2538349","565869b254044fa38b7df55e68bab5fd","38c015739d2e4c99a3834959c0563950","051a111f2e2d4e389cb34475b7d9d5d9","56bf48cbe4aa48c3aea421cb37812259","c7990b0e47894b84af6b799ac005e994","5a31c0906b7d4fc38689030779748823","9adaf24ddb6b4ac0a8cda15269e5106f"]},"id":"q5Jz0E_oPMBr","executionInfo":{"status":"ok","timestamp":1676655779499,"user_tz":-60,"elapsed":10128,"user":{"displayName":"Mike4 Studia4","userId":"02075505067789671500"}},"outputId":"ad9b827a-3914-4125-8689-7c002d6cbdda"},"execution_count":7,"outputs":[{"output_type":"display_data","data":{"text/plain":["Downloading (…)okenizer_config.json: 0%| | 0.00/2.54k [00:00<?, ?B/s]"],"application/vnd.jupyter.widget-view+json":{"version_major":2,"version_minor":0,"model_id":"ac64c83f91604136a8605a458cfdb558"}},"metadata":{}},{"output_type":"display_data","data":{"text/plain":["Downloading (…)\"spiece.model\";: 0%| | 0.00/792k [00:00<?, ?B/s]"],"application/vnd.jupyter.widget-view+json":{"version_major":2,"version_minor":0,"model_id":"b9a1683bd7c44127a700a62df09c2740"}},"metadata":{}},{"output_type":"display_data","data":{"text/plain":["Downloading (…)/main/tokenizer.json: 0%| | 0.00/2.42M [00:00<?, ?B/s]"],"application/vnd.jupyter.widget-view+json":{"version_major":2,"version_minor":0,"model_id":"65666ee0fa8a4deba2622e36080ecd97"}},"metadata":{}},{"output_type":"display_data","data":{"text/plain":["Downloading (…)cial_tokens_map.json: 0%| | 0.00/2.20k [00:00<?, ?B/s]"],"application/vnd.jupyter.widget-view+json":{"version_major":2,"version_minor":0,"model_id":"ad2b545f2d664bfcb1741a22db968a2c"}},"metadata":{}}]},{"cell_type":"code","source":["sms = parsed_dataset[0]['sms']\n","print('Original: ', sms)\n","print('Tokenized: ', tokenizer.tokenize(sms))\n","print('Token IDs: ', tokenizer.convert_tokens_to_ids(tokenizer.tokenize(sms)))"],"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"dfxJQpoePsvI","executionInfo":{"status":"ok","timestamp":1676655779500,"user_tz":-60,"elapsed":23,"user":{"displayName":"Mike4 Studia4","userId":"02075505067789671500"}},"outputId":"cb35d66e-ee83-47b0-8ae0-80f82f4efd1d"},"execution_count":8,"outputs":[{"output_type":"stream","name":"stdout","text":["Original: Go until jurong point, crazy.. Available only in bugis n great world la e buffet... Cine there got amore wat...\n","Tokenized: ['▁Go', '▁until', '▁jur', 'ong', '▁point', ',', '▁crazy', '.', '.', '▁Available', '▁only', '▁in', '▁bug', 'is', '▁', 'n', '▁great', '▁world', '▁la', '▁', 'e', '▁buffet', '...', '▁Cine', '▁there', '▁got', '▁', 'a', 'more', '▁wa', 't', '...']\n","Token IDs: [1263, 552, 10081, 2444, 500, 6, 6139, 5, 5, 8144, 163, 16, 8143, 159, 3, 29, 248, 296, 50, 3, 15, 15385, 233, 17270, 132, 530, 3, 9, 3706, 8036, 17, 233]\n"]}]},{"cell_type":"markdown","source":["# Few shot learning"],"metadata":{"id":"UpluhM8cU5Ir"}},{"cell_type":"code","source":["print(parsed_dataset[0]) #0\n","print(parsed_dataset[123]) #1\n","print(parsed_dataset[2000]) #0\n","print(parsed_dataset[3002]) #1"],"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"7uNUkixPU85O","executionInfo":{"status":"ok","timestamp":1676655779500,"user_tz":-60,"elapsed":19,"user":{"displayName":"Mike4 Studia4","userId":"02075505067789671500"}},"outputId":"29ccefa4-8bf2-4753-cb89-7b25260dd24d"},"execution_count":9,"outputs":[{"output_type":"stream","name":"stdout","text":["{'sms': 'Go until jurong point, crazy.. Available only in bugis n great world la e buffet... Cine there got amore wat...', 'label': 'False'}\n","{'sms': 'Todays Voda numbers ending 7548 are selected to receive a $350 award. If you have a match please call 08712300220 quoting claim code 4041 standard rates app', 'label': 'True'}\n","{'sms': \"LMAO where's your fish memory when I need it?\", 'label': 'False'}\n","{'sms': 'This message is free. Welcome to the new & improved Sex & Dogging club! To unsubscribe from this service reply STOP. msgs@150p 18+only', 'label': 'True'}\n"]}]},{"cell_type":"code","source":["non_spam_1 = \"The text message: \" + parsed_dataset[0]['sms'] + \"\\nIs this sms spam? Ans: False\\n\\n\"\n","spam_1 = \"The text message: \" + parsed_dataset[123]['sms'] + \"\\nIs this sms spam? Ans: True\\n\\n\"\n","non_spam_2 = \"The text message: \" + parsed_dataset[2000]['sms'] + \"\\nIs this sms spam? Ans: False\\n\\n\"\n","spam_2 = \"The text message: \" + parsed_dataset[3002]['sms'] + \"\\nIs this sms spam? Ans: True\\n\\n\"\n","\n","few_shot_prefix = non_spam_1 + spam_1 + non_spam_2 + spam_2 + \"The text message: \"\n","print(few_shot_prefix)"],"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"lj0issBznZfK","executionInfo":{"status":"ok","timestamp":1676655779500,"user_tz":-60,"elapsed":17,"user":{"displayName":"Mike4 Studia4","userId":"02075505067789671500"}},"outputId":"c4d190c1-49fa-4a55-f019-a342c165e517"},"execution_count":10,"outputs":[{"output_type":"stream","name":"stdout","text":["The text message: Go until jurong point, crazy.. Available only in bugis n great world la e buffet... Cine there got amore wat...\n","Is this sms spam? Ans: False\n","\n","The text message: Todays Voda numbers ending 7548 are selected to receive a $350 award. If you have a match please call 08712300220 quoting claim code 4041 standard rates app\n","Is this sms spam? Ans: True\n","\n","The text message: LMAO where's your fish memory when I need it?\n","Is this sms spam? Ans: False\n","\n","The text message: This message is free. Welcome to the new & improved Sex & Dogging club! To unsubscribe from this service reply STOP. msgs@150p 18+only\n","Is this sms spam? Ans: True\n","\n","The text message: \n"]}]},{"cell_type":"markdown","source":["# Load FLAN-T5 model"],"metadata":{"id":"okTx_ynMV0rH"}},{"cell_type":"code","source":["from transformers import AutoModelForSeq2SeqLM"],"metadata":{"id":"Eu-7Eed8WgN0","executionInfo":{"status":"ok","timestamp":1676655779501,"user_tz":-60,"elapsed":16,"user":{"displayName":"Mike4 Studia4","userId":"02075505067789671500"}}},"execution_count":11,"outputs":[]},{"cell_type":"code","source":["model = AutoModelForSeq2SeqLM.from_pretrained('google/flan-t5-large')\n","\n","model.cuda()"],"metadata":{"colab":{"base_uri":"https://localhost:8080/","height":1000,"referenced_widgets":["902d51de5d15490b8e40d51cb9d2a6d7","f745f516f9814e7293f677e50eaded2f","7761bcc878504db19a4b2662cfdf61a9","ab1cfad8dc994780b6b980b751531e0e","356fa367dabf4efb9c0f858bcd582db5","a76f15514a734a2ca57c95d6e5d28c1a","2895697d2a7b4a4988cb782b45744af0","c5ff7a768dc6432cab747b037bc99480","233a81cabbbe404e87d98de3eb641fc0","d7950561457141e98485648c507beae4","e2a49b71a2be4b818d34549552158f21","8b43cd40eb594e3d974fb47a63013eba","ca360690cbc348fcb0b594cc56434017","b95287e1033b4645a21029cb4ffab619","81ea2572afde4cb09ac364307785d38d","23bbfb2b32044784a49e7b08b90e1302","33ca6db178b84da19661fc3d62e09abb","2da3ecb995514cb7a2fac91f49165f24","994a0a3fb8de4798bc5c3e34b27d2aa0","15896f0b77164af7bdeb365755b3d478","f1566112e762430397c9116cca9aa39b","d33d0c19f0b542c5ac07ac1f2858e3a7","b135be3639114a6ab0c587f08a889c82","9d8979ec18384dc2a297ce9a68d9bd9c","3cce22420ff046d9872b08ce23e725a1","f057f834fc8c45e4b46809f2ee1abad9","2b0d399693ec4f8b9065e477fb573e1a","d53e8179d299450083ddf7e2cb1e473e","7b38475b1275447cae202d0b60e6a207","c27eec62191a46b7b37dbb72d3e7e864","5d250db552db494a815fa3ea51592e68","fd3fec011f284d05b5d7d5e906174582","a40e99f09452422b9460d9ec7a5f127e"]},"id":"JKv9O8kfV2zZ","executionInfo":{"status":"ok","timestamp":1676655814395,"user_tz":-60,"elapsed":34910,"user":{"displayName":"Mike4 Studia4","userId":"02075505067789671500"}},"outputId":"2f44a817-5096-4dfb-920e-2b92c3cc95d6"},"execution_count":12,"outputs":[{"output_type":"display_data","data":{"text/plain":["Downloading (…)lve/main/config.json: 0%| | 0.00/662 [00:00<?, ?B/s]"],"application/vnd.jupyter.widget-view+json":{"version_major":2,"version_minor":0,"model_id":"902d51de5d15490b8e40d51cb9d2a6d7"}},"metadata":{}},{"output_type":"display_data","data":{"text/plain":["Downloading (…)\"pytorch_model.bin\";: 0%| | 0.00/3.13G [00:00<?, ?B/s]"],"application/vnd.jupyter.widget-view+json":{"version_major":2,"version_minor":0,"model_id":"8b43cd40eb594e3d974fb47a63013eba"}},"metadata":{}},{"output_type":"display_data","data":{"text/plain":["Downloading (…)neration_config.json: 0%| | 0.00/147 [00:00<?, ?B/s]"],"application/vnd.jupyter.widget-view+json":{"version_major":2,"version_minor":0,"model_id":"b135be3639114a6ab0c587f08a889c82"}},"metadata":{}},{"output_type":"execute_result","data":{"text/plain":["T5ForConditionalGeneration(\n"," (shared): Embedding(32128, 1024)\n"," (encoder): T5Stack(\n"," (embed_tokens): Embedding(32128, 1024)\n"," (block): ModuleList(\n"," (0): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," (relative_attention_bias): Embedding(32, 16)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (1): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (2): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (3): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (4): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (5): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (6): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (7): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (8): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (9): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (10): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (11): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (12): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (13): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (14): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (15): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (16): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (17): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (18): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (19): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (20): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (21): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (22): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (23): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," )\n"," (final_layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (decoder): T5Stack(\n"," (embed_tokens): Embedding(32128, 1024)\n"," (block): ModuleList(\n"," (0): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," (relative_attention_bias): Embedding(32, 16)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerCrossAttention(\n"," (EncDecAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (2): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (1): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerCrossAttention(\n"," (EncDecAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (2): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (2): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerCrossAttention(\n"," (EncDecAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (2): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (3): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerCrossAttention(\n"," (EncDecAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (2): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (4): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerCrossAttention(\n"," (EncDecAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (2): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (5): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerCrossAttention(\n"," (EncDecAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (2): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (6): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerCrossAttention(\n"," (EncDecAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (2): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (7): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerCrossAttention(\n"," (EncDecAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (2): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (8): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerCrossAttention(\n"," (EncDecAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (2): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (9): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerCrossAttention(\n"," (EncDecAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (2): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (10): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerCrossAttention(\n"," (EncDecAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (2): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (11): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerCrossAttention(\n"," (EncDecAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (2): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (12): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerCrossAttention(\n"," (EncDecAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (2): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (13): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerCrossAttention(\n"," (EncDecAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (2): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (14): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerCrossAttention(\n"," (EncDecAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (2): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (15): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerCrossAttention(\n"," (EncDecAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (2): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (16): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerCrossAttention(\n"," (EncDecAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (2): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (17): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerCrossAttention(\n"," (EncDecAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (2): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (18): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerCrossAttention(\n"," (EncDecAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (2): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (19): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerCrossAttention(\n"," (EncDecAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (2): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (20): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerCrossAttention(\n"," (EncDecAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (2): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (21): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerCrossAttention(\n"," (EncDecAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (2): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (22): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerCrossAttention(\n"," (EncDecAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (2): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," (23): T5Block(\n"," (layer): ModuleList(\n"," (0): T5LayerSelfAttention(\n"," (SelfAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (1): T5LayerCrossAttention(\n"," (EncDecAttention): T5Attention(\n"," (q): Linear(in_features=1024, out_features=1024, bias=False)\n"," (k): Linear(in_features=1024, out_features=1024, bias=False)\n"," (v): Linear(in_features=1024, out_features=1024, bias=False)\n"," (o): Linear(in_features=1024, out_features=1024, bias=False)\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (2): T5LayerFF(\n"," (DenseReluDense): T5DenseGatedActDense(\n"," (wi_0): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wi_1): Linear(in_features=1024, out_features=2816, bias=False)\n"," (wo): Linear(in_features=2816, out_features=1024, bias=False)\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," (act): NewGELUActivation()\n"," )\n"," (layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," )\n"," )\n"," )\n"," (final_layer_norm): T5LayerNorm()\n"," (dropout): Dropout(p=0.1, inplace=False)\n"," )\n"," (lm_head): Linear(in_features=1024, out_features=32128, bias=False)\n",")"]},"metadata":{},"execution_count":12}]},{"cell_type":"markdown","source":["# Helper functions"],"metadata":{"id":"F_SDAwxoawDy"}},{"cell_type":"code","source":["import torch"],"metadata":{"id":"rdWMg_KJZEZH","executionInfo":{"status":"ok","timestamp":1676655814396,"user_tz":-60,"elapsed":17,"user":{"displayName":"Mike4 Studia4","userId":"02075505067789671500"}}},"execution_count":13,"outputs":[]},{"cell_type":"code","source":["def calculate_accuracy(preds, target):\n"," results_ok = 0.0\n"," results_false = 0.0\n","\n"," for idx, pred in enumerate(preds):\n"," if pred == target[idx]:\n"," results_ok += 1.0\n"," else:\n"," results_false += 1.0\n","\n"," return results_ok / (results_ok + results_false)"],"metadata":{"id":"FzUi8908ax61","executionInfo":{"status":"ok","timestamp":1676655814396,"user_tz":-60,"elapsed":16,"user":{"displayName":"Mike4 Studia4","userId":"02075505067789671500"}}},"execution_count":14,"outputs":[]},{"cell_type":"code","source":["if torch.cuda.is_available(): \n"," device = torch.device(\"cuda\")\n","\n"," print('There are %d GPU(s) available.' % torch.cuda.device_count())\n"," print('We will use the GPU:', torch.cuda.get_device_name(0))\n","\n","else:\n"," print('No GPU available, using the CPU instead.')\n"," device = torch.device(\"cpu\")"],"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"86i7iRmtW-6L","executionInfo":{"status":"ok","timestamp":1676655814397,"user_tz":-60,"elapsed":17,"user":{"displayName":"Mike4 Studia4","userId":"02075505067789671500"}},"outputId":"65d2b65e-db13-4e50-eb08-809dc9abe70a"},"execution_count":15,"outputs":[{"output_type":"stream","name":"stdout","text":["There are 1 GPU(s) available.\n","We will use the GPU: Tesla T4\n"]}]},{"cell_type":"markdown","source":["# Predykcja"],"metadata":{"id":"H_YI3bS3VHQE"}},{"cell_type":"code","source":["parsed_dataset = parsed_dataset[1:123] + parsed_dataset[124:2000] + parsed_dataset[2001:3002] + parsed_dataset[3003:]\n","predictions = []\n","expected = []\n","\n","for row in parsed_dataset:\n"," input_text = few_shot_prefix + row['sms'] + \"\\nIs this sms spam? Ans: \"\n"," input_ids = tokenizer(input_text, return_tensors=\"pt\").input_ids.to(device)\n","\n"," generated_ids = model.generate(input_ids, do_sample=True, temperature=0.9, max_length=200)\n"," generated_text = tokenizer.decode(generated_ids[0], skip_special_tokens=True, clean_up_tokenization_spaces=True)\n"," \n"," predictions.append(generated_text)\n"," expected.append(row['label'])\n","\n","acc = calculate_accuracy(predictions, expected)\n","print(acc)"],"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"vunLGuBGVGmh","executionInfo":{"status":"ok","timestamp":1676656989630,"user_tz":-60,"elapsed":783918,"user":{"displayName":"Mike4 Studia4","userId":"02075505067789671500"}},"outputId":"965f7398-80d9-4bb9-98fb-6ea563a9be38"},"execution_count":17,"outputs":[{"output_type":"stream","name":"stdout","text":["0.20786920589292132\n"]}]},{"cell_type":"code","source":["print(\"Sample prediction: {}, expected: {}\".format(predictions[101], expected[101]))"],"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"20WbYZmLaDl7","executionInfo":{"status":"ok","timestamp":1676657092260,"user_tz":-60,"elapsed":499,"user":{"displayName":"Mike4 Studia4","userId":"02075505067789671500"}},"outputId":"1895e96b-c8a4-431f-961b-39debb09b217"},"execution_count":18,"outputs":[{"output_type":"stream","name":"stdout","text":["Sample prediction: Yes, expected: False\n"]}]},{"cell_type":"markdown","source":["# MCC Score"],"metadata":{"id":"dLYc9WXz_B1o"}},{"cell_type":"code","source":["from sklearn.metrics import matthews_corrcoef\n","\n","print('Calculating Matthews Corr. Coef. for each batch...')\n","matthews = matthews_corrcoef(expected, predictions) \n","print('Total MCC: %.3f' % matthews)"],"metadata":{"id":"hPEPpXXX_DXR","executionInfo":{"status":"ok","timestamp":1676657097378,"user_tz":-60,"elapsed":1384,"user":{"displayName":"Mike4 Studia4","userId":"02075505067789671500"}},"colab":{"base_uri":"https://localhost:8080/"},"outputId":"d2545d4a-002f-4e52-e421-1e094fcb6592"},"execution_count":19,"outputs":[{"output_type":"stream","name":"stdout","text":["Calculating Matthews Corr. Coef. for each batch...\n","Total MCC: 0.050\n"]}]},{"cell_type":"markdown","source":["# Save model"],"metadata":{"id":"GPhCp068_Iwq"}},{"cell_type":"code","source":["from google.colab import drive\n","\n","drive.mount('/content/gdrive/', force_remount=True)\n","\n","output_dir = '/content/gdrive/My Drive/UAM/Przetwarzanie-tekstu/Ver_6_FLAN-T5_Model'\n","print(\"Saving model to %s\" % output_dir)\n","\n","model_to_save = model.module if hasattr(model, 'module') else model\n","model_to_save.save_pretrained(output_dir)\n","tokenizer.save_pretrained(output_dir)"],"metadata":{"id":"avafCMoS_KDF","colab":{"base_uri":"https://localhost:8080/"},"executionInfo":{"status":"ok","timestamp":1676657142469,"user_tz":-60,"elapsed":41097,"user":{"displayName":"Mike4 Studia4","userId":"02075505067789671500"}},"outputId":"9de1a74c-d045-4213-d20c-867328fae84c"},"execution_count":20,"outputs":[{"output_type":"stream","name":"stdout","text":["Mounted at /content/gdrive/\n","Saving model to /content/gdrive/My Drive/UAM/Przetwarzanie-tekstu/Ver_6_FLAN-T5_Model\n"]},{"output_type":"execute_result","data":{"text/plain":["('/content/gdrive/My Drive/UAM/Przetwarzanie-tekstu/Ver_6_FLAN-T5_Model/tokenizer_config.json',\n"," '/content/gdrive/My Drive/UAM/Przetwarzanie-tekstu/Ver_6_FLAN-T5_Model/special_tokens_map.json',\n"," '/content/gdrive/My Drive/UAM/Przetwarzanie-tekstu/Ver_6_FLAN-T5_Model/spiece.model',\n"," '/content/gdrive/My Drive/UAM/Przetwarzanie-tekstu/Ver_6_FLAN-T5_Model/added_tokens.json',\n"," '/content/gdrive/My Drive/UAM/Przetwarzanie-tekstu/Ver_6_FLAN-T5_Model/tokenizer.json')"]},"metadata":{},"execution_count":20}]},{"cell_type":"markdown","source":["# Bibliografia\n","- https://huggingface.co/docs/transformers/main/en/model_doc/flan-t5\n","- https://mccormickml.com/2019/07/22/BERT-fine-tuning/#a1-saving--loading-fine-tuned-model\n","- https://huggingface.co/docs/transformers/model_doc/t5#training"],"metadata":{"id":"wHzm2_nDA6i-"}}]}