{"nbformat":4,"nbformat_minor":0,"metadata":{"colab":{"provenance":[],"gpuType":"T4"},"kernelspec":{"name":"python3","display_name":"Python 3"},"language_info":{"name":"python"},"accelerator":"GPU","widgets":{"application/vnd.jupyter.widget-state+json":{"d5c5ea1d714841ebaa50471b18921583":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_49ee874706834cd79b573c8dea02dda0","IPY_MODEL_1945020199f943bfaeb8f3c66d7f7abf","IPY_MODEL_318b3cae62bd40c8a869d1ca685c6e7d"],"layout":"IPY_MODEL_29de997088204f5480c99fc2ce70686d"}},"49ee874706834cd79b573c8dea02dda0":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_45a3dcf6739945dfb991f61d98e01a5b","placeholder":"​","style":"IPY_MODEL_2eb60cbf0e10400bae1b7c0197aa5571","value":"Generating train split: 
"}},"1945020199f943bfaeb8f3c66d7f7abf":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_83da63b76d104538bcce2580070be257","max":1,"min":0,"orientation":"horizontal","style":"IPY_MODEL_2dd818177e634030b2a8e6692ed9f0b7","value":1}},"318b3cae62bd40c8a869d1ca685c6e7d":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_54f40e972b9c47b09c03d743dce8d723","placeholder":"​","style":"IPY_MODEL_5432f505af174bf7b93d23829735585f","value":" 907/0 [00:00<00:00, 10251.29 
examples/s]"}},"29de997088204f5480c99fc2ce70686d":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"45a3dcf6739945dfb991f61d98e01a5b":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null
,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"2eb60cbf0e10400bae1b7c0197aa5571":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"83da63b76d104538bcce2580070be257":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":"20px"}},"2dd818177e634030b2a8e6692ed9f0b7":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"54f40e972b9c47b09c03d743dce8d723":{"mod
el_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"5432f505af174bf7b93d23829735585f":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"f47e40310eb74543bdd794c1a7bba21a":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_ae5a642c07d74b6abd2fd4bdce17b99a","IPY_MODEL_bb68eaad5e7547ecb0f11954fed9cd13","IPY_MODEL_51bceeb2159649dabba7c75353e6b884"],"layout":"IPY_MODEL_2b6334a76ee14c5b8075d3c94bce9
ba3"}},"ae5a642c07d74b6abd2fd4bdce17b99a":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_c68a58962b484dde8d97fb29bae77f7a","placeholder":"​","style":"IPY_MODEL_9b4bc4d8ab0f4e84a7bc9904abb1e4df","value":"Generating train split: "}},"bb68eaad5e7547ecb0f11954fed9cd13":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_51a44c129f45401b992804b835f8d892","max":1,"min":0,"orientation":"horizontal","style":"IPY_MODEL_342a072b44474941b5740fcfb3b30a84","value":1}},"51bceeb2159649dabba7c75353e6b884":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_ce392d2df29d433d842d76b065f294df","placeholder":"​","style":"IPY_MODEL_9c6cb03133174858b34d8155da9edd34","value":" 101/0 [00:00<00:00, 2518.46 
examples/s]"}},"2b6334a76ee14c5b8075d3c94bce9ba3":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"c68a58962b484dde8d97fb29bae77f7a":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null
,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"9b4bc4d8ab0f4e84a7bc9904abb1e4df":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"51a44c129f45401b992804b835f8d892":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":"20px"}},"342a072b44474941b5740fcfb3b30a84":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"ce392d2df29d433d842d76b065f294df":{"mod
el_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"9c6cb03133174858b34d8155da9edd34":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"6fe73e0cf3904745b9248c334f880c28":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_c25cbd8181d44a2e8fbdc3b2eb16dc8e","IPY_MODEL_e3187f7f601e4629860aae118c71a632","IPY_MODEL_ab3616254eab47da982534d1c6b39a20"],"layout":"IPY_MODEL_b27bdb7cb1834645bef01185e472b
a96"}},"c25cbd8181d44a2e8fbdc3b2eb16dc8e":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_2759c474436f4dbcaac4052f920ca2d9","placeholder":"​","style":"IPY_MODEL_78ce8a6e9b8b46d0b0b7e1fb79aa634b","value":"Map: 100%"}},"e3187f7f601e4629860aae118c71a632":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_72111bbd48fa4d0fab5b504820a99147","max":907,"min":0,"orientation":"horizontal","style":"IPY_MODEL_4096fa6746f84a7880fd39e63688586a","value":907}},"ab3616254eab47da982534d1c6b39a20":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_017ed39c30094ef3afc2ecff578f1ada","placeholder":"​","style":"IPY_MODEL_f30d048c00e144d59fa646f89daa1f44","value":" 907/907 [00:00<00:00, 17333.34 
examples/s]"}},"b27bdb7cb1834645bef01185e472ba96":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"2759c474436f4dbcaac4052f920ca2d9":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null
,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"78ce8a6e9b8b46d0b0b7e1fb79aa634b":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"72111bbd48fa4d0fab5b504820a99147":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"4096fa6746f84a7880fd39e63688586a":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"017ed39c30094ef3afc2ecff578f1ada":{"model
_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"f30d048c00e144d59fa646f89daa1f44":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"ce736d0a74f14af7a6294316ce461d8c":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_a62fbbad7f364704915f77994a035e7b","IPY_MODEL_c1cef37ac9ad41129c4b7238083f3be6","IPY_MODEL_1f035af160ee418090955908a916680d"],"layout":"IPY_MODEL_f24118bf6102414bafd8536829ef6c7
2"}},"a62fbbad7f364704915f77994a035e7b":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_5cb0ed2cf6f8450ba18124eac9d50c65","placeholder":"​","style":"IPY_MODEL_d43477b97e244b7c8e0db1804bb66f64","value":"Map: 100%"}},"c1cef37ac9ad41129c4b7238083f3be6":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_e3107883fe45458c80f04b8d97d590ef","max":101,"min":0,"orientation":"horizontal","style":"IPY_MODEL_3a345aee1b84453c81ab43c46c9f19e0","value":101}},"1f035af160ee418090955908a916680d":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_a6c6abe3e03e4b159f12ba238cdb9f5b","placeholder":"​","style":"IPY_MODEL_e51299eb1fe44ab49765533c1ba07213","value":" 101/101 [00:00<00:00, 3191.89 
examples/s]"}},"f24118bf6102414bafd8536829ef6c72":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"5cb0ed2cf6f8450ba18124eac9d50c65":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null
,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"d43477b97e244b7c8e0db1804bb66f64":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"e3107883fe45458c80f04b8d97d590ef":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"3a345aee1b84453c81ab43c46c9f19e0":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"a6c6abe3e03e4b159f12ba238cdb9f5b":{"model
_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"e51299eb1fe44ab49765533c1ba07213":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"d629b70853fa487993faea1ee0cf4726":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_b4b7a50dfd4948f080d6154a2320ce39","IPY_MODEL_ccad49aabf244912a2cd31fdf0539346","IPY_MODEL_2aa452b945f147bfa3d526268306dbc9"],"layout":"IPY_MODEL_0661356c6f244550a77e4905797ddb8
c"}},"b4b7a50dfd4948f080d6154a2320ce39":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_25e654668f21430c9ddd442e3a8296ab","placeholder":"​","style":"IPY_MODEL_14ea45e8dc3f4e639250c7529a067cd6","value":"config.json: 100%"}},"ccad49aabf244912a2cd31fdf0539346":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_c32cec29c8ab43b4a0e75529788be458","max":608,"min":0,"orientation":"horizontal","style":"IPY_MODEL_9be4b3daa9854cdfb417a491034bd685","value":608}},"2aa452b945f147bfa3d526268306dbc9":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_0cfe6a5c6b1b46d6af9eca957fcb1aad","placeholder":"​","style":"IPY_MODEL_7c29dd58a55d460fb75be73ded0fc4d4","value":" 608/608 [00:00<00:00, 
42.9kB/s]"}},"0661356c6f244550a77e4905797ddb8c":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"25e654668f21430c9ddd442e3a8296ab":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"
overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"14ea45e8dc3f4e639250c7529a067cd6":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"c32cec29c8ab43b4a0e75529788be458":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"9be4b3daa9854cdfb417a491034bd685":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"0cfe6a5c6b1b46d6af9eca957fcb1aad":{"model_m
odule":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"7c29dd58a55d460fb75be73ded0fc4d4":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"295a0f6f36fd43b295a95468bb39d243":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_2aa484cb82d34c9a9e577bacc3738eb9","IPY_MODEL_5ef1d52e49704331b691badd4846f27f","IPY_MODEL_922131fa258c45afbd016364e7925db3"],"layout":"IPY_MODEL_6698a1acffd746138a5faddb83d67443"
}},"2aa484cb82d34c9a9e577bacc3738eb9":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_40ff95bbc3a5416c9fa5ff050908542d","placeholder":"​","style":"IPY_MODEL_198f9be1b3834529afa679d58168996b","value":"model.safetensors: 100%"}},"5ef1d52e49704331b691badd4846f27f":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_72949b1855e64ae7adbf36e7e96ff2d4","max":2200119864,"min":0,"orientation":"horizontal","style":"IPY_MODEL_984290bd8a8447e39d53179ce09e919e","value":2200119864}},"922131fa258c45afbd016364e7925db3":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_2a183bc6e12a4b6e994af4ddf2e9ea96","placeholder":"​","style":"IPY_MODEL_1c1f1b8dbf6b4f329e97363bdf5296f1","value":" 2.20G/2.20G [00:18<00:00, 
187MB/s]"}},"6698a1acffd746138a5faddb83d67443":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"40ff95bbc3a5416c9fa5ff050908542d":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"o
verflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"198f9be1b3834529afa679d58168996b":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"72949b1855e64ae7adbf36e7e96ff2d4":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"984290bd8a8447e39d53179ce09e919e":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"2a183bc6e12a4b6e994af4ddf2e9ea96":{"model_mo
dule":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"1c1f1b8dbf6b4f329e97363bdf5296f1":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"2bb6cd8c97c04bfdbb1ff5cb1df0c695":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_c295ab38792f4e07a9259ebaa5ef0e80","IPY_MODEL_41dec290aa9e40e184be78f56a61d1e3","IPY_MODEL_dc56f926dc804233a692263c18f74451"],"layout":"IPY_MODEL_16c0c840aa644bb6897a9f878b3b3d8e"}
},"c295ab38792f4e07a9259ebaa5ef0e80":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_3ec08f71a216435199db9d7bd94dd549","placeholder":"​","style":"IPY_MODEL_66d57732c7784b2099fa25e1cee34edc","value":"generation_config.json: 100%"}},"41dec290aa9e40e184be78f56a61d1e3":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_59f57fccb6594fa296ff2922b056757f","max":124,"min":0,"orientation":"horizontal","style":"IPY_MODEL_81e89c63eb9043c380b453d538e9f863","value":124}},"dc56f926dc804233a692263c18f74451":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_e7735a0ac9f445bb8dfac633fa4a55a6","placeholder":"​","style":"IPY_MODEL_60b80a001bcb4cbe89609f664b3a13cd","value":" 124/124 [00:00<00:00, 
2.65kB/s]"}},"16c0c840aa644bb6897a9f878b3b3d8e":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"3ec08f71a216435199db9d7bd94dd549":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"
overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"66d57732c7784b2099fa25e1cee34edc":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"59f57fccb6594fa296ff2922b056757f":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"81e89c63eb9043c380b453d538e9f863":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"e7735a0ac9f445bb8dfac633fa4a55a6":{"model_m
odule":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"60b80a001bcb4cbe89609f664b3a13cd":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"b10e3e347ca9482ab7c6ddc19771f390":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_b6a3fc218dbd4c148269d4d126f562c5","IPY_MODEL_2be746a7384f4e548748f41ae15f04bc","IPY_MODEL_79cd509f4d4442feb07648293091494e"],"layout":"IPY_MODEL_075a480797f3451e895dcb8320f8585c"
}},"b6a3fc218dbd4c148269d4d126f562c5":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_766ad188034445089ff07df1083b358b","placeholder":"​","style":"IPY_MODEL_15d76ae631d84f6ebaf30894b3f87208","value":"tokenizer_config.json: 100%"}},"2be746a7384f4e548748f41ae15f04bc":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_bff31cea15ce424aabfaa462aeffd0eb","max":1289,"min":0,"orientation":"horizontal","style":"IPY_MODEL_5e5dfc4000a14d438fb8e7977a0fdd4f","value":1289}},"79cd509f4d4442feb07648293091494e":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_d2dfe13824614a97b0d51fcc33104df7","placeholder":"​","style":"IPY_MODEL_8b4a8eafdf5c4aef9fb1af9e1c9fcc89","value":" 1.29k/1.29k [00:00<00:00, 
25.8kB/s]"}},"075a480797f3451e895dcb8320f8585c":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"766ad188034445089ff07df1083b358b":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"
overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"15d76ae631d84f6ebaf30894b3f87208":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"bff31cea15ce424aabfaa462aeffd0eb":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"5e5dfc4000a14d438fb8e7977a0fdd4f":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"d2dfe13824614a97b0d51fcc33104df7":{"model_m
odule":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"8b4a8eafdf5c4aef9fb1af9e1c9fcc89":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"7eaf88d0d8cd4d1bb9560f390c8cb9f7":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_fa22d5e9f45249d7b5c968d0c44bacd6","IPY_MODEL_5359f42614d3407cae29c3ef6a0307e3","IPY_MODEL_368b0ffdc8ff4c43a53ae7f6fb634625"],"layout":"IPY_MODEL_4891ab22ae8b485a87191749f43c92a4"
}},"fa22d5e9f45249d7b5c968d0c44bacd6":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_dc767d3a60a645a5a2ad567d3ab99c6c","placeholder":"​","style":"IPY_MODEL_633491710aec459c8bf90d17b5aceec5","value":"tokenizer.model: 100%"}},"5359f42614d3407cae29c3ef6a0307e3":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_533fdbc97b994ba98b32a8cd9d931704","max":499723,"min":0,"orientation":"horizontal","style":"IPY_MODEL_d315689fcca14cc6842135c5a50ea869","value":499723}},"368b0ffdc8ff4c43a53ae7f6fb634625":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_cc021d0b2a8c45a09f1adef31ef2ea20","placeholder":"​","style":"IPY_MODEL_6d2b8939dbeb41499ce6f522100d48ac","value":" 500k/500k [00:00<00:00, 
11.0MB/s]"}},"4891ab22ae8b485a87191749f43c92a4":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"dc767d3a60a645a5a2ad567d3ab99c6c":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"
overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"633491710aec459c8bf90d17b5aceec5":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"533fdbc97b994ba98b32a8cd9d931704":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"d315689fcca14cc6842135c5a50ea869":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"cc021d0b2a8c45a09f1adef31ef2ea20":{"model_m
odule":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"6d2b8939dbeb41499ce6f522100d48ac":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"52a8901770774d8c9e44f53f6e91da76":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_530de79692d844ccbe1d08e7918e48c1","IPY_MODEL_05bfc8bef5e5478cbc3a0c3751b44183","IPY_MODEL_e308536476d24581b3720c17797d12fe"],"layout":"IPY_MODEL_ee820716ebdf4690ac37c691602c251c"
}},"530de79692d844ccbe1d08e7918e48c1":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_0cf5639c60df4325af48237ba978b033","placeholder":"​","style":"IPY_MODEL_982fbbe7a6ab47199bf0a165cdcc5a1e","value":"tokenizer.json: 100%"}},"05bfc8bef5e5478cbc3a0c3751b44183":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_b4e8632c52f1437d8b08f0054ef5d616","max":1842767,"min":0,"orientation":"horizontal","style":"IPY_MODEL_103f3b13e3d04df599052ad74e2b3b44","value":1842767}},"e308536476d24581b3720c17797d12fe":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_82759aad7e68475fbca07d8b62cce1f4","placeholder":"​","style":"IPY_MODEL_9587e07d43934de1b335e28f22e0a6ee","value":" 1.84M/1.84M [00:00<00:00, 
7.33MB/s]"}},"ee820716ebdf4690ac37c691602c251c":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"0cf5639c60df4325af48237ba978b033":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"
overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"982fbbe7a6ab47199bf0a165cdcc5a1e":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"b4e8632c52f1437d8b08f0054ef5d616":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"103f3b13e3d04df599052ad74e2b3b44":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"82759aad7e68475fbca07d8b62cce1f4":{"model_m
odule":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"9587e07d43934de1b335e28f22e0a6ee":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"9d70f571292949858abbbe7a16a7f796":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_ef84883204c54b46b8a45e1abb2c1cbf","IPY_MODEL_8612805ad8db47a785a10e23a7e7cda6","IPY_MODEL_e5055fb332a74b4589a687e24a53b80d"],"layout":"IPY_MODEL_f9bb0b0e91bd4e058d7be35115ffe2ae"
}},"ef84883204c54b46b8a45e1abb2c1cbf":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_310938d0886e406d84831980d7aefc33","placeholder":"​","style":"IPY_MODEL_d9376fad2b904e9dbee26d8618dea869","value":"special_tokens_map.json: 100%"}},"8612805ad8db47a785a10e23a7e7cda6":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_11dc1c32eb4f4b2f8d1f7040a26a8bcc","max":551,"min":0,"orientation":"horizontal","style":"IPY_MODEL_be25eaa051da444183082fb2213b987c","value":551}},"e5055fb332a74b4589a687e24a53b80d":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_f7e403f42ba84d49b73435be127ef4f1","placeholder":"​","style":"IPY_MODEL_5c9550a85ba94d72b6ddeed9719bf2c1","value":" 551/551 [00:00<00:00, 
15.7kB/s]"}},"f9bb0b0e91bd4e058d7be35115ffe2ae":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"310938d0886e406d84831980d7aefc33":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"
overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"d9376fad2b904e9dbee26d8618dea869":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"11dc1c32eb4f4b2f8d1f7040a26a8bcc":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"be25eaa051da444183082fb2213b987c":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"f7e403f42ba84d49b73435be127ef4f1":{"model_m
odule":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"5c9550a85ba94d72b6ddeed9719bf2c1":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"db60994a46574e8882e76aec5b935414":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_a6a2a2ca9247490389ace681ebbb8dfc","IPY_MODEL_f29baf8e03ff46cc9ddbe9f0ed8cb3ec","IPY_MODEL_d67b0a36d0e24d17b6bba783f7aba28f"],"layout":"IPY_MODEL_fc00219559854805800912d554083ec2"
}},"a6a2a2ca9247490389ace681ebbb8dfc":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_ebb90429a0874ce29deddc2a0dc65728","placeholder":"​","style":"IPY_MODEL_2818a278711948cb83c09b97debc1e59","value":"Map: 100%"}},"f29baf8e03ff46cc9ddbe9f0ed8cb3ec":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_b0d77284ea6741948c2a4cac4cd33728","max":907,"min":0,"orientation":"horizontal","style":"IPY_MODEL_fbbef0b2819c4f6e9bb672650a707c3a","value":907}},"d67b0a36d0e24d17b6bba783f7aba28f":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_13adfde84c244c40bbe73651893eff38","placeholder":"​","style":"IPY_MODEL_fd9d2367784d49b69a82e657e1f3d3cd","value":" 907/907 [00:00<00:00, 2796.34 
examples/s]"}},"fc00219559854805800912d554083ec2":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"ebb90429a0874ce29deddc2a0dc65728":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null
,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"2818a278711948cb83c09b97debc1e59":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"b0d77284ea6741948c2a4cac4cd33728":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"fbbef0b2819c4f6e9bb672650a707c3a":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"13adfde84c244c40bbe73651893eff38":{"model
_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"fd9d2367784d49b69a82e657e1f3d3cd":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"8ae0dab917f948ae916f830a8f334551":{"model_module":"@jupyter-widgets/controls","model_name":"HBoxModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HBoxModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HBoxView","box_style":"","children":["IPY_MODEL_1835720fe19a4263b8b9b2d9f2bf5d63","IPY_MODEL_d2e71a1404f543eb99108bb601117866","IPY_MODEL_d66128c70c674ff7be447f44b9822b1e"],"layout":"IPY_MODEL_e2a2edd8d1074faa95e5cf490977783
1"}},"1835720fe19a4263b8b9b2d9f2bf5d63":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_50db724e0085406baf99e4eb6147c52f","placeholder":"​","style":"IPY_MODEL_736b49399e7041709287fab4ea4d4763","value":"Map: 100%"}},"d2e71a1404f543eb99108bb601117866":{"model_module":"@jupyter-widgets/controls","model_name":"FloatProgressModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"FloatProgressModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"ProgressView","bar_style":"success","description":"","description_tooltip":null,"layout":"IPY_MODEL_2b0da50a5aba444b82d86a04c5b4d730","max":101,"min":0,"orientation":"horizontal","style":"IPY_MODEL_53862fdf58eb49929f337c6e2b6b284f","value":101}},"d66128c70c674ff7be447f44b9822b1e":{"model_module":"@jupyter-widgets/controls","model_name":"HTMLModel","model_module_version":"1.5.0","state":{"_dom_classes":[],"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"HTMLModel","_view_count":null,"_view_module":"@jupyter-widgets/controls","_view_module_version":"1.5.0","_view_name":"HTMLView","description":"","description_tooltip":null,"layout":"IPY_MODEL_a0e4da779e4a4139b66340fd955587ed","placeholder":"​","style":"IPY_MODEL_c712ecf37b34487f9a0f109191f44681","value":" 101/101 [00:00<00:00, 1041.19 
examples/s]"}},"e2a2edd8d1074faa95e5cf4909777831":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"50db724e0085406baf99e4eb6147c52f":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null
,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"736b49399e7041709287fab4ea4d4763":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}},"2b0da50a5aba444b82d86a04c5b4d730":{"model_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"53862fdf58eb49929f337c6e2b6b284f":{"model_module":"@jupyter-widgets/controls","model_name":"ProgressStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"ProgressStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","bar_color":null,"description_width":""}},"a0e4da779e4a4139b66340fd955587ed":{"model
_module":"@jupyter-widgets/base","model_name":"LayoutModel","model_module_version":"1.2.0","state":{"_model_module":"@jupyter-widgets/base","_model_module_version":"1.2.0","_model_name":"LayoutModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"LayoutView","align_content":null,"align_items":null,"align_self":null,"border":null,"bottom":null,"display":null,"flex":null,"flex_flow":null,"grid_area":null,"grid_auto_columns":null,"grid_auto_flow":null,"grid_auto_rows":null,"grid_column":null,"grid_gap":null,"grid_row":null,"grid_template_areas":null,"grid_template_columns":null,"grid_template_rows":null,"height":null,"justify_content":null,"justify_items":null,"left":null,"margin":null,"max_height":null,"max_width":null,"min_height":null,"min_width":null,"object_fit":null,"object_position":null,"order":null,"overflow":null,"overflow_x":null,"overflow_y":null,"padding":null,"right":null,"top":null,"visibility":null,"width":null}},"c712ecf37b34487f9a0f109191f44681":{"model_module":"@jupyter-widgets/controls","model_name":"DescriptionStyleModel","model_module_version":"1.5.0","state":{"_model_module":"@jupyter-widgets/controls","_model_module_version":"1.5.0","_model_name":"DescriptionStyleModel","_view_count":null,"_view_module":"@jupyter-widgets/base","_view_module_version":"1.2.0","_view_name":"StyleView","description_width":""}}}}},"cells":[{"cell_type":"markdown","source":["## **Trabalho Prático Final de NLP**\n","### **Etapa 3: Treinamento do Modelo com o LORA**\n","**Professores:** André Carvalho e Altigran da Silva\n","\n","**Alunos:**\n","\n","\n","Bianka Vasconcelos\n","\n","Girlana Souza\n","\n","Ricardo Bonfim\n","\n","\n","**Descrição do Trabalho:** Este trabalho consiste em desenvolver uma LLM que responda perguntas sobre a legislação acadêmica da UFAM. 
O trabalho envolve o download e pré-processamento dos documentos da legislação, a criação de uma base de dados sintética de instruções, o treinamento do modelo usando técnicas de LoRA/QLoRA, e a implementação de um sistema de RAG (Retrieval-Augmented Generation) para fornecer respostas precisas baseadas nos documentos da legislação."],"metadata":{"id":"LscUkoXKkFDF"}},{"cell_type":"markdown","source":["### **Objetivo:** Neste notebook, iremos fazer o treinamento do modelo de linguagem Tiny Llama usando LORA. Para isso, usaremos a base de dados sintética de instruções que foi criada na etapa 2."],"metadata":{"id":"KHnqF5jXhogA"}},{"cell_type":"markdown","source":["### **Configurando o ambiente**\n","\n","Vamos começar com algumas instalações e importações básicas para configurar o ambiente."],"metadata":{"id":"EUE_b1yPh3MX"}},{"cell_type":"code","source":["!pip install datasets\n","!pip install peft\n","!pip install trl\n","# !pip install -i https://pypi.org/simple/ bitsandbytes\n","!pip install accelerate\n","!pip install -U bitsandbytes\n","!pip install pyarrow==6.0.1\n","!pip install sentence_transformers # para a similaridade do cosseno"],"metadata":{"id":"s68XR2rSmjwH"},"execution_count":null,"outputs":[]},{"cell_type":"code","source":["import os\n","import random\n","import torch\n","import logging\n","from datasets import load_dataset\n","from transformers import (\n"," AutoModelForCausalLM,\n"," AutoTokenizer,\n"," BitsAndBytesConfig,\n"," HfArgumentParser,\n"," TrainingArguments,\n"," pipeline,\n"," logging,\n",")\n","from peft import LoraConfig, PeftModel\n","from trl import SFTTrainer\n","from transformers import pipeline\n","import pandas as pd\n","from huggingface_hub import notebook_login\n","from sentence_transformers import SentenceTransformer, util"],"metadata":{"id":"15RULuK0klsy"},"execution_count":null,"outputs":[]},{"cell_type":"markdown","source":["### **Carregando a base de dados**\n","\n","Agora, vamos carregar a base de dados sintética de 
instruções. Ela será carregada do nosso repositório no google drive e armazenada em um dataframe."],"metadata":{"id":"aWG7dyXpibaU"}},{"cell_type":"code","source":["# carregando base de dados\n","from google.colab import drive\n","import pandas as pd\n","import numpy as np\n","\n","# montar google drive\n","drive.mount('/content/drive')"],"metadata":{"id":"4pu5n9Cem6he","colab":{"base_uri":"https://localhost:8080/"},"outputId":"cf99b6a1-ad71-4639-abd4-d9031daeb832"},"execution_count":null,"outputs":[{"output_type":"stream","name":"stdout","text":["Mounted at /content/drive\n"]}]},{"cell_type":"code","source":["df = pd.read_csv(\"/content/drive/My Drive/TP3 (Final)/Trabalho Final de NLP/instrucoes.csv\")\n","df"],"metadata":{"id":"UhWYZj8WnGdW","colab":{"base_uri":"https://localhost:8080/","height":424},"outputId":"516d691d-9f2c-4dcd-e14b-22026c7f07d9"},"execution_count":null,"outputs":[{"output_type":"execute_result","data":{"text/plain":[" Q \\\n","0 What does article 4 say regarding students who... \n","1 How many days after publication would it take ... \n","2 In which year did President Luiz Inacio Lula D... \n","3 Is there an exception allowing someone current... \n","4 Can you enroll in only a single vacancy even i... \n","... ... \n","1032 Is there flexibility allowed in terms of proje... \n","1033 Are qualifications required for teaching staff... \n","1034 Does infrastructure play a role in determining... \n","1035 Will financial resources impact an institute's... \n","1036 Do students who complete recognized degree pro... \n","\n"," A \n","0 Article 4 states that such students will still... \n","1 This law becomes effective thirty days from it... \n","2 Law 12.089 was signed by him in November of 2009 \n","3 Yes \n","4 No \n","... ... \n","1032 No specific details were mentioned explicitly ... \n","1033 Academic qualification is among factors evalua... \n","1034 Infrastructure facilities form part of the par... 
\n","1035 Financial capacity forms part of consideration... \n","1036 This aspect has been left unclear, but presuma... \n","\n","[1037 rows x 2 columns]"],"text/html":["\n","
\n","
\n","\n","\n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n","
QA
0What does article 4 say regarding students who...Article 4 states that such students will still...
1How many days after publication would it take ...This law becomes effective thirty days from it...
2In which year did President Luiz Inacio Lula D...Law 12.089 was signed by him in November of 2009
3Is there an exception allowing someone current...Yes
4Can you enroll in only a single vacancy even i...No
.........
1032Is there flexibility allowed in terms of proje...No specific details were mentioned explicitly ...
1033Are qualifications required for teaching staff...Academic qualification is among factors evalua...
1034Does infrastructure play a role in determining...Infrastructure facilities form part of the par...
1035Will financial resources impact an institute's...Financial capacity forms part of consideration...
1036Do students who complete recognized degree pro...This aspect has been left unclear, but presuma...
\n","

1037 rows × 2 columns

\n","
\n","
\n","\n","
\n"," \n","\n"," \n","\n"," \n","
\n","\n","\n","
\n"," \n","\n","\n","\n"," \n","
\n","\n","
\n"," \n"," \n"," \n","
\n","\n","
\n","
\n"],"application/vnd.google.colaboratory.intrinsic+json":{"type":"dataframe","variable_name":"df","summary":"{\n \"name\": \"df\",\n \"rows\": 1037,\n \"fields\": [\n {\n \"column\": \"Q\",\n \"properties\": {\n \"dtype\": \"string\",\n \"num_unique_values\": 1004,\n \"samples\": [\n \"Under which article of LDB are distance education programs developed?\",\n \"For what purpose is the PACC prepared according to Article 22?\",\n \"For what purpose was Resolution Number 064/2011 passed?\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"A\",\n \"properties\": {\n \"dtype\": \"string\",\n \"num_unique_values\": 998,\n \"samples\": [\n \"Like other non-student affiliated members of the institution, yes, employees also need periodic registry renewal.\",\n \"After preparing the report, it shall be forwarded to the Pro-Rectorate of Undergraduate Studies\",\n \"Eligibility relies on official reports issued by authorized healthcare officials working within the system\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n }\n ]\n}"}},"metadata":{},"execution_count":3}]},{"cell_type":"markdown","source":["Abaixo, criamos um novo dataframe com o `Q` (question) representado pelo `prompt` e o `A` (answer) representado pelo `response`."],"metadata":{"id":"EseZWa7TkOxu"}},{"cell_type":"code","source":["# Lists that will become the columns of the new DataFrame\n","prompts = []\n","responses = []\n","\n","# Iterate over every row of the DataFrame\n","for index, row in df.iterrows():\n","    question = row['Q']\n","    answer = row['A']\n","    # Skip rows where either field is not text (e.g. NaN from an empty CSV cell).\n","    # Both fields are checked before appending so the two lists always keep the\n","    # same length; a missing column now raises instead of being silently ignored.\n","    if not (isinstance(question, str) and isinstance(answer, str)):\n","        continue\n","    prompts.append(question.strip())\n","    responses.append(answer.strip())\n","\n","# Create the DataFrame\n","processed_df = pd.DataFrame({\n","    'prompt': prompts,\n","    'response': responses\n","})\n","\n","# Remove duplicated rows\n","processed_df = 
processed_df.drop_duplicates()\n","processed_df"],"metadata":{"id":"imlDKJZXnLM6","colab":{"base_uri":"https://localhost:8080/","height":424},"outputId":"6c6fd061-ad16-4363-c93e-8e91216cd684"},"execution_count":null,"outputs":[{"output_type":"execute_result","data":{"text/plain":[" prompt \\\n","0 What does article 4 say regarding students who... \n","1 How many days after publication would it take ... \n","2 In which year did President Luiz Inacio Lula D... \n","3 Is there an exception allowing someone current... \n","4 Can you enroll in only a single vacancy even i... \n","... ... \n","1032 Is there flexibility allowed in terms of proje... \n","1033 Are qualifications required for teaching staff... \n","1034 Does infrastructure play a role in determining... \n","1035 Will financial resources impact an institute's... \n","1036 Do students who complete recognized degree pro... \n","\n"," response \n","0 Article 4 states that such students will still... \n","1 This law becomes effective thirty days from it... \n","2 Law 12.089 was signed by him in November of 2009 \n","3 Yes \n","4 No \n","... ... \n","1032 No specific details were mentioned explicitly ... \n","1033 Academic qualification is among factors evalua... \n","1034 Infrastructure facilities form part of the par... \n","1035 Financial capacity forms part of consideration... \n","1036 This aspect has been left unclear, but presuma... \n","\n","[1008 rows x 2 columns]"],"text/html":["\n","
\n","
\n","\n","\n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n","
promptresponse
0What does article 4 say regarding students who...Article 4 states that such students will still...
1How many days after publication would it take ...This law becomes effective thirty days from it...
2In which year did President Luiz Inacio Lula D...Law 12.089 was signed by him in November of 2009
3Is there an exception allowing someone current...Yes
4Can you enroll in only a single vacancy even i...No
.........
1032Is there flexibility allowed in terms of proje...No specific details were mentioned explicitly ...
1033Are qualifications required for teaching staff...Academic qualification is among factors evalua...
1034Does infrastructure play a role in determining...Infrastructure facilities form part of the par...
1035Will financial resources impact an institute's...Financial capacity forms part of consideration...
1036Do students who complete recognized degree pro...This aspect has been left unclear, but presuma...
\n","

1008 rows × 2 columns

\n","
\n","
\n","\n","
\n"," \n","\n"," \n","\n"," \n","
\n","\n","\n","
\n"," \n","\n","\n","\n"," \n","
\n","\n","
\n"," \n"," \n"," \n","
\n","\n","
\n","
\n"],"application/vnd.google.colaboratory.intrinsic+json":{"type":"dataframe","variable_name":"processed_df","summary":"{\n \"name\": \"processed_df\",\n \"rows\": 1008,\n \"fields\": [\n {\n \"column\": \"prompt\",\n \"properties\": {\n \"dtype\": \"string\",\n \"num_unique_values\": 1004,\n \"samples\": [\n \"Under which article of LDB are distance education programs developed?\",\n \"For what purpose is the PACC prepared according to Article 22?\",\n \"For what purpose was Resolution Number 064/2011 passed?\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"response\",\n \"properties\": {\n \"dtype\": \"string\",\n \"num_unique_values\": 998,\n \"samples\": [\n \"Like other non-student affiliated members of the institution, yes, employees also need periodic registry renewal.\",\n \"After preparing the report, it shall be forwarded to the Pro-Rectorate of Undergraduate Studies\",\n \"Eligibility relies on official reports issued by authorized healthcare officials working within the system\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n }\n ]\n}"}},"metadata":{},"execution_count":4}]},{"cell_type":"markdown","source":["### **Separação dos Dados**\n","\n","Agora, vamos dividir o conjunto de dados em treino e teste, para ser possível avaliar o modelo."],"metadata":{"id":"WtrHTMASkjNl"}},{"cell_type":"code","source":["# Separando os dados em treino e teste com 90% dos dados no treinamento\n","train_df = processed_df.sample(frac=0.9, random_state=42)\n","test_df = processed_df.drop(train_df.index)\n","\n","# Convertendo os dados para o formato .jsonl\n","train_df.to_json('train.jsonl', orient='records', lines=True)\n","test_df.to_json('test.jsonl', orient='records', lines=True)"],"metadata":{"id":"mRfu-r2RnN8K"},"execution_count":null,"outputs":[]},{"cell_type":"markdown","source":["### **Configurações do LORA**\n","Na célula abaixo, definimos as configurações do LORA para fazer o fine-tuning do modelo TinyLlama. 
Optamos por escolher um modelo mais simples devido às limitações do Google Colab."],"metadata":{"id":"9eCsGV_kkxoe"}},{"cell_type":"code","source":["model_name = \"TinyLlama/TinyLlama-1.1B-Chat-v1.0\"\n","dataset_name = 'train.jsonl'\n","new_model = \"TinyLlama-1.1B-Chat-v1.0\"\n","\n","lora_r = 64 # rank\n","lora_alpha = 16\n","lora_dropout = 0.1\n","use_4bit = True\n","bnb_4bit_compute_dtype = \"float16\"\n","bnb_4bit_quant_type = \"nf4\"\n","use_nested_quant = False\n","output_dir = \"results\" # diretório em que será salvo\n","num_train_epochs = 3 # épocas do treinamento\n","fp16 = False\n","bf16 = False\n","per_device_train_batch_size = 4\n","per_device_eval_batch_size = 4\n","gradient_accumulation_steps = 1\n","gradient_checkpointing = True\n","max_grad_norm = 0.3\n","learning_rate = 2e-4 # taxa de aprendizado\n","weight_decay = 0.001\n","optim = \"paged_adamw_32bit\"\n","lr_scheduler_type = \"cosine\"\n","max_steps = -1\n","warmup_ratio = 0.03\n","group_by_length = True\n","save_steps = 0\n","logging_steps = 25\n","max_seq_length = None\n","packing = False\n","device_map = {\"\": 0}"],"metadata":{"id":"vFC1a7bUpRH4"},"execution_count":null,"outputs":[]},{"cell_type":"markdown","source":["### **Preparação da base de dados**\n","\n","Agora, preparamos a nossa base de dados para o treino e para a validação. 
Essa é uma etapa fundamental para que consigamos validar o modelo e não ocorrer o overfitting."],"metadata":{"id":"q5eAn7cKmPLb"}},{"cell_type":"code","source":["train_dataset = load_dataset('json', data_files=f'train.jsonl', split=\"train\")\n","valid_dataset = load_dataset('json', data_files=f'test.jsonl', split=\"train\")"],"metadata":{"id":"JyjJnRzzpmBA","colab":{"base_uri":"https://localhost:8080/","height":81,"referenced_widgets":["d5c5ea1d714841ebaa50471b18921583","49ee874706834cd79b573c8dea02dda0","1945020199f943bfaeb8f3c66d7f7abf","318b3cae62bd40c8a869d1ca685c6e7d","29de997088204f5480c99fc2ce70686d","45a3dcf6739945dfb991f61d98e01a5b","2eb60cbf0e10400bae1b7c0197aa5571","83da63b76d104538bcce2580070be257","2dd818177e634030b2a8e6692ed9f0b7","54f40e972b9c47b09c03d743dce8d723","5432f505af174bf7b93d23829735585f","f47e40310eb74543bdd794c1a7bba21a","ae5a642c07d74b6abd2fd4bdce17b99a","bb68eaad5e7547ecb0f11954fed9cd13","51bceeb2159649dabba7c75353e6b884","2b6334a76ee14c5b8075d3c94bce9ba3","c68a58962b484dde8d97fb29bae77f7a","9b4bc4d8ab0f4e84a7bc9904abb1e4df","51a44c129f45401b992804b835f8d892","342a072b44474941b5740fcfb3b30a84","ce392d2df29d433d842d76b065f294df","9c6cb03133174858b34d8155da9edd34"]},"outputId":"1137f70f-fa2e-4d1e-8d27-d056efeb363d"},"execution_count":null,"outputs":[{"output_type":"display_data","data":{"text/plain":["Generating train split: 0 examples [00:00, ? examples/s]"],"application/vnd.jupyter.widget-view+json":{"version_major":2,"version_minor":0,"model_id":"d5c5ea1d714841ebaa50471b18921583"}},"metadata":{}},{"output_type":"display_data","data":{"text/plain":["Generating train split: 0 examples [00:00, ? 
examples/s]"],"application/vnd.jupyter.widget-view+json":{"version_major":2,"version_minor":0,"model_id":"f47e40310eb74543bdd794c1a7bba21a"}},"metadata":{}}]},{"cell_type":"markdown","source":["Abaixo processamos os dois conjuntos de dados, `train_dataset` e `valid_dataset`, mapeando suas entradas para o novo formato de texto, adequado para o Tiny Llama que utiliza prompts e respostas encapsulados no formato de instrução."],"metadata":{"id":"E25EO5MUnZFq"}},{"cell_type":"code","source":["train_dataset_mapped = train_dataset.map(lambda examples: {'text': [f'[INST] <>\\n\\n<>\\n\\n' + prompt + ' [/INST] ' + response for prompt, response in zip(examples['prompt'], examples['response'])]}, batched=True)\n","valid_dataset_mapped = valid_dataset.map(lambda examples: {'text': [f'[INST] <>\\n\\n<>\\n\\n' + prompt + ' [/INST] ' + response for prompt, response in zip(examples['prompt'], examples['response'])]}, batched=True)"],"metadata":{"id":"tGXfdfp8pqRD","colab":{"base_uri":"https://localhost:8080/","height":81,"referenced_widgets":["6fe73e0cf3904745b9248c334f880c28","c25cbd8181d44a2e8fbdc3b2eb16dc8e","e3187f7f601e4629860aae118c71a632","ab3616254eab47da982534d1c6b39a20","b27bdb7cb1834645bef01185e472ba96","2759c474436f4dbcaac4052f920ca2d9","78ce8a6e9b8b46d0b0b7e1fb79aa634b","72111bbd48fa4d0fab5b504820a99147","4096fa6746f84a7880fd39e63688586a","017ed39c30094ef3afc2ecff578f1ada","f30d048c00e144d59fa646f89daa1f44","ce736d0a74f14af7a6294316ce461d8c","a62fbbad7f364704915f77994a035e7b","c1cef37ac9ad41129c4b7238083f3be6","1f035af160ee418090955908a916680d","f24118bf6102414bafd8536829ef6c72","5cb0ed2cf6f8450ba18124eac9d50c65","d43477b97e244b7c8e0db1804bb66f64","e3107883fe45458c80f04b8d97d590ef","3a345aee1b84453c81ab43c46c9f19e0","a6c6abe3e03e4b159f12ba238cdb9f5b","e51299eb1fe44ab49765533c1ba07213"]},"outputId":"20bb8b54-d464-4c39-c35c-c509f0decb8d"},"execution_count":null,"outputs":[{"output_type":"display_data","data":{"text/plain":["Map: 0%| | 0/907 [00:00"],"text/html":["\n","
\n"," \n"," \n"," [681/681 05:12, Epoch 3/3]\n","
\n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n"," \n","
StepTraining Loss
253.306000
502.150400
751.889600
1001.566900
1251.763500
1501.533900
1751.708100
2001.494000
2251.658700
2501.696700
2751.471800
3001.568200
3251.449200
3501.629500
3751.411000
4001.632000
4251.473900
4501.563500
4751.596500
5001.383300
5251.538500
5501.382700
5751.524500
6001.422500
6251.499200
6501.473400
6751.467500

"]},"metadata":{}},{"output_type":"execute_result","data":{"text/plain":["('TinyLlama-1.1B-Chat-v1.0/tokenizer_config.json',\n"," 'TinyLlama-1.1B-Chat-v1.0/special_tokens_map.json',\n"," 'TinyLlama-1.1B-Chat-v1.0/tokenizer.model',\n"," 'TinyLlama-1.1B-Chat-v1.0/added_tokens.json',\n"," 'TinyLlama-1.1B-Chat-v1.0/tokenizer.json')"]},"metadata":{},"execution_count":14}]},{"cell_type":"code","source":["torch.save(trainer.model.state_dict(), 'model.pt') # salva o modelo em pytorch"],"metadata":{"id":"fbVGW--ayojA"},"execution_count":null,"outputs":[]},{"cell_type":"markdown","source":["### **Teste e Avaliação do modelo**\n","\n","Agora, vamos realizar os testes para conseguir avaliar o quão bem o modelo está conseguindo responder as questões para dados de teste (do dataframe `test_df`).\n","\n","Primeiro, configuramos a **verbosidade** do log para nível crítico, garantindo que apenas mensagens críticas sejam exibidas, o que ajuda a manter a saída do log limpa durante a execução dos testes. Em seguida, configuramos o **pipeline** para geração de texto, definindo os seguintes parâmetros:\n","- Tarefa: geração de texto\n","- Modelo: TinyLlama-1.1B-Chat-v1.0\n","- Tokenizador: AutoTokenizer\n","- Número máximo de novos tokens a serem gerados: 100 tokens"],"metadata":{"id":"YMFg-qgBrjkA"}},{"cell_type":"code","source":["logging.basicConfig(level=logging.CRITICAL)\n","\n","pipe = pipeline(task=\"text-generation\", model=model, tokenizer=tokenizer, max_new_tokens=100)"],"metadata":{"id":"FLc1p2qHpBGW"},"execution_count":null,"outputs":[]},{"cell_type":"markdown","source":["Abaixo definimos uma função chamada `obtem_resposta`, que gera uma resposta para uma pergunta fornecida, utilizando o Tiny Llama, e depois trunca a resposta na primeira quebra de linha. A razão desse truncamento é que o modelo estava gerando múltiplos pares de perguntas e respostas, o que deve ser em virtude a simplicidade do modelo. 
Por isso, truncamos para obter somente a primeira resposta, referente à pergunta passada para o modelo."],"metadata":{"id":"zOBjzp87r9TQ"}},{"cell_type":"code","source":["def obtem_resposta(question, cont):\n","    \"\"\"Generate the model's answer to `question` and keep only its first line.\n","\n","    Args:\n","        question: Question text, appended after the fixed system message.\n","        cont: Counter shown in the progress message printed after generation.\n","\n","    Returns:\n","        The first line of the generated continuation, stripped of surrounding whitespace.\n","    \"\"\"\n","    system_message = \"You are an assistant specialized in providing clear and precise answers on legal and administrative matters. Answer in a technical and detailed manner. Answer in English.\"\n","    prompt = f\"{system_message}\\n\\n{question}\"\n","    # NOTE(review): the training cell wraps each example in '[INST] ... [/INST]' markers while\n","    # this prompt has none -- confirm whether inference should reuse the training template.\n","\n","    # return_full_text=False makes the pipeline return only the newly generated text, so the\n","    # prompt no longer has to be cut out by searching for the question (that search raised\n","    # ValueError for an empty question and cut at the wrong place when the question text\n","    # also occurred inside the system message).\n","    result = pipe(prompt, return_full_text=False)\n","    print(f\"Gerei a resposta {cont} do Tiny..\")\n","\n","    generated_text = result[0]['generated_text'].strip()\n","\n","    # The model tends to go on generating further question/answer pairs, so only the\n","    # first line of the continuation is kept.\n","    truncated_response = generated_text.split('\\n')[0].strip()\n","\n","    return truncated_response\n","# usage example\n","# question = \"Quantos dias após a publicação, uma lei levaria para entrar em vigor de acordo com o Artigo 5?\"\n","# answer = obtem_resposta(question, 1)\n","# print(answer)"],"metadata":{"id":"-_MyzXbepFXX"},"execution_count":null,"outputs":[]},{"cell_type":"markdown","source":["A função `avaliar_modelo` abaixo é responsável por avaliar o modelo no conjunto de teste aplicando a função acima, que obtém a resposta do modelo para a pergunta do teste. Ela itera sobre cada linha do dataframe de teste, gerando respostas para as perguntas fornecidas e comparando-as com as respostas esperadas. Os resultados são armazenados em uma lista, que é convertida em um DataFrame e salva em um arquivo CSV. 
Por fim, o DataFrame de resultados é impresso."],"metadata":{"id":"ymFmYbH6t4do"}},{"cell_type":"code","source":["def avaliar_modelo(test_df):\n","    \"\"\"Generate an answer for every row of `test_df` and collect the results.\n","\n","    Args:\n","        test_df: DataFrame with a 'prompt' column (question) and a 'response'\n","            column (expected answer).\n","\n","    Returns:\n","        DataFrame with one record per test row and the keys 'prompt',\n","        'resposta_real' and 'resposta_prevista'. The same frame is written to\n","        'results.csv' (tab-separated, without the index) and printed.\n","    \"\"\"\n","    results = []\n","\n","    # `cont` is a 1-based counter, used only in the progress message printed by obtem_resposta\n","    for cont, (_, row) in enumerate(test_df.iterrows(), start=1):\n","        question = row['prompt']\n","        expected_answer = row['response']\n","        generated_answer = obtem_resposta(question, cont)\n","\n","        results.append({'prompt': question,\n","                        'resposta_real': expected_answer,\n","                        'resposta_prevista': generated_answer})\n","\n","    results_df = pd.DataFrame(results)\n","\n","    results_df.to_csv('results.csv', index=False, sep='\\t')\n","\n","    print(results_df)\n","    return results_df"],"metadata":{"id":"jGXDvLHAuQXD"},"execution_count":null,"outputs":[]},{"cell_type":"code","source":["results_df = avaliar_modelo(test_df)"],"metadata":{"id":"L2jVp3PBBeDB","colab":{"base_uri":"https://localhost:8080/"},"outputId":"ef542de0-6f48-4690-b26b-7a0fe125ea56"},"execution_count":null,"outputs":[{"output_type":"stream","name":"stdout","text":["Gerei a resposta 1 do Tiny..\n","Gerei a resposta 2 do Tiny..\n","Gerei a resposta 3 do Tiny..\n","Gerei a resposta 4 do Tiny..\n","Gerei a resposta 5 do Tiny..\n","Gerei a resposta 6 do Tiny..\n","Gerei a resposta 7 do Tiny..\n","Gerei a resposta 8 do Tiny..\n","Gerei a resposta 9 do Tiny..\n"]},{"output_type":"stream","name":"stderr","text":["You seem to be using the pipelines sequentially on GPU. 
In order to maximize efficiency please use a dataset\n"]},{"output_type":"stream","name":"stdout","text":["Gerei a resposta 10 do Tiny..\n","Gerei a resposta 11 do Tiny..\n","Gerei a resposta 12 do Tiny..\n","Gerei a resposta 13 do Tiny..\n","Gerei a resposta 14 do Tiny..\n","Gerei a resposta 15 do Tiny..\n","Gerei a resposta 16 do Tiny..\n","Gerei a resposta 17 do Tiny..\n","Gerei a resposta 18 do Tiny..\n","Gerei a resposta 19 do Tiny..\n","Gerei a resposta 20 do Tiny..\n","Gerei a resposta 21 do Tiny..\n","Gerei a resposta 22 do Tiny..\n","Gerei a resposta 23 do Tiny..\n","Gerei a resposta 24 do Tiny..\n","Gerei a resposta 25 do Tiny..\n","Gerei a resposta 26 do Tiny..\n","Gerei a resposta 27 do Tiny..\n","Gerei a resposta 28 do Tiny..\n","Gerei a resposta 29 do Tiny..\n","Gerei a resposta 30 do Tiny..\n","Gerei a resposta 31 do Tiny..\n","Gerei a resposta 32 do Tiny..\n","Gerei a resposta 33 do Tiny..\n","Gerei a resposta 34 do Tiny..\n","Gerei a resposta 35 do Tiny..\n","Gerei a resposta 36 do Tiny..\n","Gerei a resposta 37 do Tiny..\n","Gerei a resposta 38 do Tiny..\n","Gerei a resposta 39 do Tiny..\n","Gerei a resposta 40 do Tiny..\n","Gerei a resposta 41 do Tiny..\n","Gerei a resposta 42 do Tiny..\n","Gerei a resposta 43 do Tiny..\n","Gerei a resposta 44 do Tiny..\n","Gerei a resposta 45 do Tiny..\n","Gerei a resposta 46 do Tiny..\n","Gerei a resposta 47 do Tiny..\n","Gerei a resposta 48 do Tiny..\n","Gerei a resposta 49 do Tiny..\n","Gerei a resposta 50 do Tiny..\n","Gerei a resposta 51 do Tiny..\n","Gerei a resposta 52 do Tiny..\n","Gerei a resposta 53 do Tiny..\n","Gerei a resposta 54 do Tiny..\n","Gerei a resposta 55 do Tiny..\n","Gerei a resposta 56 do Tiny..\n","Gerei a resposta 57 do Tiny..\n","Gerei a resposta 58 do Tiny..\n","Gerei a resposta 59 do Tiny..\n","Gerei a resposta 60 do Tiny..\n","Gerei a resposta 61 do Tiny..\n","Gerei a resposta 62 do Tiny..\n","Gerei a resposta 63 do Tiny..\n","Gerei a resposta 64 do Tiny..\n","Gerei a resposta 65 do 
Tiny..\n","Gerei a resposta 66 do Tiny..\n","Gerei a resposta 67 do Tiny..\n","Gerei a resposta 68 do Tiny..\n","Gerei a resposta 69 do Tiny..\n","Gerei a resposta 70 do Tiny..\n","Gerei a resposta 71 do Tiny..\n","Gerei a resposta 72 do Tiny..\n","Gerei a resposta 73 do Tiny..\n","Gerei a resposta 74 do Tiny..\n","Gerei a resposta 75 do Tiny..\n","Gerei a resposta 76 do Tiny..\n","Gerei a resposta 77 do Tiny..\n","Gerei a resposta 78 do Tiny..\n","Gerei a resposta 79 do Tiny..\n","Gerei a resposta 80 do Tiny..\n","Gerei a resposta 81 do Tiny..\n","Gerei a resposta 82 do Tiny..\n","Gerei a resposta 83 do Tiny..\n","Gerei a resposta 84 do Tiny..\n","Gerei a resposta 85 do Tiny..\n","Gerei a resposta 86 do Tiny..\n","Gerei a resposta 87 do Tiny..\n","Gerei a resposta 88 do Tiny..\n","Gerei a resposta 89 do Tiny..\n","Gerei a resposta 90 do Tiny..\n","Gerei a resposta 91 do Tiny..\n","Gerei a resposta 92 do Tiny..\n","Gerei a resposta 93 do Tiny..\n","Gerei a resposta 94 do Tiny..\n","Gerei a resposta 95 do Tiny..\n","Gerei a resposta 96 do Tiny..\n","Gerei a resposta 97 do Tiny..\n","Gerei a resposta 98 do Tiny..\n","Gerei a resposta 99 do Tiny..\n","Gerei a resposta 100 do Tiny..\n","Gerei a resposta 101 do Tiny..\n"," prompt \\\n","0 How many days after publication would it take ... \n","1 May i know whom publicly issued interpertation... \n","2 Does the act specify who has authority over gr... \n","3 Are field assignments subject to application f... \n","4 Can a university issue a degree with specific ... \n",".. ... \n","96 When did Resolution Nº 027/2010-CEG come into ... \n","97 In what circumstances would a student receive ... \n","98 Are only Brazilian institutions considered eli... \n","99 Will students automatically receive full credi... \n","100 Where will requests for accreditation from ins... \n","\n"," resposta_real \\\n","0 This law becomes effective thirty days from it... \n","1 The listed government officials authored rule ... 
\n","2 Granting falls upon coordinators' duties with ... \n","3 Field works aren't explicitly mentioned being ... \n","4 No, they cannot. According to the response fro... \n",".. ... \n","96 Resolution Nº 027/2010-CEG came into effect on... \n","97 A student who registered but wasn't selected b... \n","98 Foreign higher education institutions may also... \n","99 Meeting the minimal percentage thresholds alon... \n","100 Requests for accreditation from institutions w... \n","\n"," resposta_prevista \n","0 Answer according to: Article 5: This law shall... \n","1 Sure, the publicly issued interpertation guida... \n","2 Answer according to… The act specifies that th... \n","3 Yes, field assignments are subject to applicat... \n","4 Yes, a university can issue a degree with spec... \n",".. ... \n","96 Resolution Nº 027/2010-CEG came into effect on... \n","97 A student receives a mention of 'dispensed' in... \n","98 No, any institution recognized by the Brazilia... \n","99 No, credit will only be awarded if the student... \n","100 In the Ministry of Education's office in the c... \n","\n","[101 rows x 3 columns]\n"]}]},{"cell_type":"code","source":["test_question = \"Whats is UFAM?\"\n","answer = obtem_resposta(test_question, 1)\n","print(answer)"],"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"jZ-0I6qmiaPW","outputId":"5c840ac3-9271-49e2-ddcc-9ab2e0a9a753"},"execution_count":null,"outputs":[{"output_type":"stream","name":"stdout","text":["Gerei a resposta 1 do Tiny..\n","What is its mission? 
Provide a brief overview of its activities and objectives.\n"]}]},{"cell_type":"code","source":["# salvando no csv\n","results_df.to_csv('results_LORA.csv', index=False, sep='\\t')\n","\n","print(results_df)"],"metadata":{"id":"_VdzTF6lL0Fa","colab":{"base_uri":"https://localhost:8080/"},"outputId":"7ea890b5-ef92-4513-dfcf-78a065b69557"},"execution_count":null,"outputs":[{"output_type":"stream","name":"stdout","text":[" prompt \\\n","0 How many days after publication would it take ... \n","1 May i know whom publicly issued interpertation... \n","2 Does the act specify who has authority over gr... \n","3 Are field assignments subject to application f... \n","4 Can a university issue a degree with specific ... \n",".. ... \n","96 When did Resolution Nº 027/2010-CEG come into ... \n","97 In what circumstances would a student receive ... \n","98 Are only Brazilian institutions considered eli... \n","99 Will students automatically receive full credi... \n","100 Where will requests for accreditation from ins... \n","\n"," resposta_real \\\n","0 This law becomes effective thirty days from it... \n","1 The listed government officials authored rule ... \n","2 Granting falls upon coordinators' duties with ... \n","3 Field works aren't explicitly mentioned being ... \n","4 No, they cannot. According to the response fro... \n",".. ... \n","96 Resolution Nº 027/2010-CEG came into effect on... \n","97 A student who registered but wasn't selected b... \n","98 Foreign higher education institutions may also... \n","99 Meeting the minimal percentage thresholds alon... \n","100 Requests for accreditation from institutions w... \n","\n"," resposta_prevista \n","0 Answer according to: Article 5: This law shall... \n","1 Sure, the publicly issued interpertation guida... \n","2 Answer according to… The act specifies that th... \n","3 Yes, field assignments are subject to applicat... \n","4 Yes, a university can issue a degree with spec... \n",".. ... 
\n","96 Resolution Nº 027/2010-CEG came into effect on... \n","97 A student receives a mention of 'dispensed' in... \n","98 No, any institution recognized by the Brazilia... \n","99 No, credit will only be awarded if the student... \n","100 In the Ministry of Education's office in the c... \n","\n","[101 rows x 3 columns]\n"]}]},{"cell_type":"code","source":["results_df['resposta_prevista']"],"metadata":{"id":"UL9zyqoiSk8h","colab":{"base_uri":"https://localhost:8080/"},"outputId":"61c00ee7-d541-4f2d-80b7-35805614ce76"},"execution_count":null,"outputs":[{"output_type":"execute_result","data":{"text/plain":["0 Answer according to: Article 5: This law shall...\n","1 Sure, the publicly issued interpertation guida...\n","2 Answer according to… The act specifies that th...\n","3 Yes, field assignments are subject to applicat...\n","4 Yes, a university can issue a degree with spec...\n"," ... \n","96 Resolution Nº 027/2010-CEG came into effect on...\n","97 A student receives a mention of 'dispensed' in...\n","98 No, any institution recognized by the Brazilia...\n","99 No, credit will only be awarded if the student...\n","100 In the Ministry of Education's office in the c...\n","Name: resposta_prevista, Length: 101, dtype: object"]},"metadata":{},"execution_count":29}]},{"cell_type":"markdown","source":["### **Similaridade do Cosseno**\n","\n","Para avaliar o quão próximas estão as respostas do modelo Tiny Llama com LORA em relação às respostas reais da base de dados sintética, vamos usar a similaridade do cosseno. Para fazer isso, vamos usar o **modelo de linguagem SentenceTransformer com o modelo all-mpnet-base-v2**, que permite **criar embeddings** das palavras para calcular a similaridade do cosseno. Essa métrica é fundamental para **medir a similaridade entre duas sequências de texto**, transformando-as em vetores e calculando o cosseno do ângulo entre eles. 
A similaridade do cosseno varia de -1 a 1, onde 1 indica uma correspondência perfeita, 0 indica que não há relação e -1 indica que são completamente opostas.\n","\n","No contexto do nosso modelo Tiny Llama com LORA, a similaridade do cosseno vai nos ajudar a quantificar a precisão e relevância das respostas geradas, oferecendo uma medida de desempenho que vai nos guiar a possíveis melhorias que podem ser feitas no modelo.\n","\n","Para realizar essa avaliação, seguimos os seguintes passos:\n","\n","- **Carregar o modelo de embeddings**: Utilizamos o SentenceTransformer para transformar frases em vetores numéricos.\n","- **Processar os dados**: Carregamos o arquivo csv com as respostas reais e previstas que criamos anteriormente.\n","- **Calcular a similaridade**: Para cada par de respostas (real e prevista), calculamos a similaridade do cosseno e adicionamos essa informação ao dataframe.\n","- **Analisar os resultados**: Calculamos a média das similaridades para obter uma visão geral do desempenho do modelo."],"metadata":{"id":"9ijJaTl4vAFL"}},{"cell_type":"markdown","source":["Vamos ver abaixo alguns exemplos do cálculo da similaridade do cosseno para algumas respostas reais e previstas do dataframe que acabamos de criar."],"metadata":{"id":"5zQybIfp2EyU"}},{"cell_type":"code","source":["# carregando o modelo\n","model = SentenceTransformer('all-mpnet-base-v2')"],"metadata":{"id":"q41gNixh4Iot"},"execution_count":null,"outputs":[]},{"cell_type":"code","source":["# exemplo 1\n","real = \"Yes, Deaf individuals receive priority admission into courses related to Libras instruction and formation\"\n","prevista = \"Yes, Deaf individuals have priority access to certain courses offered by the university\"\n","\n","# criação dos embeddings\n","embedding1 = model.encode(real, convert_to_tensor=True)\n","embedding2 = model.encode(prevista, convert_to_tensor=True)\n","\n","# cálculo da similaridade do cosseno\n","cosine_similarity = util.pytorch_cos_sim(embedding1, 
embedding2)\n","\n","print(\"Similaridade de Cosseno:\", cosine_similarity.item())"],"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"6vLAmO4b0dkR","executionInfo":{"status":"ok","timestamp":1722949998576,"user_tz":180,"elapsed":621,"user":{"displayName":"Bianka Vasconcelos","userId":"00512411367206176161"}},"outputId":"d9f4e572-5d53-4a2f-d61c-d8bebc14b5c9"},"execution_count":null,"outputs":[{"output_type":"stream","name":"stdout","text":["Similaridade de Cosseno: 0.8298245668411255\n"]}]},{"cell_type":"code","source":["# exemplo 2\n","real = \"Yes, being an author or co-author of a chapter in a book is recognized as a complementary activity according to Art. 4 Item IV.\"\n","prevista = \"Yes, authors or co-authors of published book chapters are eligible for recognition as complementary activities.\"\n","\n","# criação dos embeddings\n","embedding1 = model.encode(real, convert_to_tensor=True)\n","embedding2 = model.encode(prevista, convert_to_tensor=True)\n","\n","# cálculo da similaridade do cosseno\n","cosine_similarity = util.pytorch_cos_sim(embedding1, embedding2)\n","\n","print(\"Similaridade de Cosseno:\", cosine_similarity.item())"],"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"ozXzJTHW1fEW","executionInfo":{"status":"ok","timestamp":1722950249109,"user_tz":180,"elapsed":523,"user":{"displayName":"Bianka Vasconcelos","userId":"00512411367206176161"}},"outputId":"a0e026f6-527f-4c96-d543-70a775005311"},"execution_count":null,"outputs":[{"output_type":"stream","name":"stdout","text":["Similaridade de Cosseno: 0.832678496837616\n"]}]},{"cell_type":"code","source":["# exemplo 3\n","real = \"To ensure consistency in integrating undergraduate courses taken by students across different departments.\"\n","prevista = \"Because it is necessary to ensure the proper functioning of the system of higher education in the country.\"\n","\n","# criação dos embeddings\n","embedding1 = model.encode(real, convert_to_tensor=True)\n","embedding2 
= model.encode(prevista, convert_to_tensor=True)\n","\n","# cálculo da similaridade do cosseno\n","cosine_similarity = util.pytorch_cos_sim(embedding1, embedding2)\n","\n","print(\"Similaridade de Cosseno:\", cosine_similarity.item())"],"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"c199_Tg22MtU","executionInfo":{"status":"ok","timestamp":1722950556771,"user_tz":180,"elapsed":514,"user":{"displayName":"Bianka Vasconcelos","userId":"00512411367206176161"}},"outputId":"83ad0458-8b89-4e46-aa96-e42c6f51c814"},"execution_count":null,"outputs":[{"output_type":"stream","name":"stdout","text":["Similaridade de Cosseno: 0.5239999294281006\n"]}]},{"cell_type":"markdown","source":["Agora, vamos aplicar a similaridade do cosseno para todas as respostas reais e previstas do dataframe."],"metadata":{"id":"OIMrRUq92y8R"}},{"cell_type":"code","source":["# carregando o csv\n","df = pd.read_csv('results.csv', sep='\\t')\n","\n","# alguns valores o modelo não conseguiu prever, então filtramos as colunas vazias\n","df['resposta_real'] = df['resposta_real'].fillna('')\n","df['resposta_prevista'] = df['resposta_prevista'].fillna('')\n","\n","# Função para calcular a similaridade do cosseno\n","def calcular_similaridade(row):\n"," frase1 = str(row['resposta_real'])\n"," frase2 = str(row['resposta_prevista'])\n","\n"," # Obter embeddings das frases\n"," embedding1 = model.encode(frase1, convert_to_tensor=True)\n"," embedding2 = model.encode(frase2, convert_to_tensor=True)\n","\n"," # Calcular similaridade do cosseno\n"," similaridade = util.pytorch_cos_sim(embedding1, embedding2).item()\n"," return similaridade"],"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"ZDjvP8PDsv32","executionInfo":{"status":"ok","timestamp":1722948256291,"user_tz":180,"elapsed":5291,"user":{"displayName":"Bianka 
Vasconcelos","userId":"00512411367206176161"}},"outputId":"f4a8edae-b40d-4f92-aa6b-887d3d7953ff"},"execution_count":null,"outputs":[{"output_type":"stream","name":"stderr","text":["/usr/local/lib/python3.10/dist-packages/huggingface_hub/utils/_token.py:89: UserWarning: \n","The secret `HF_TOKEN` does not exist in your Colab secrets.\n","To authenticate with the Hugging Face Hub, create a token in your settings tab (https://huggingface.co/settings/tokens), set it as secret in your Google Colab and restart your session.\n","You will be able to reuse this secret in all of your notebooks.\n","Please note that authentication is recommended but still optional to access public models or datasets.\n"," warnings.warn(\n"]}]},{"cell_type":"code","source":["# aplicar em cada linha do df\n","df['similaridade_cosseno'] = df.apply(calcular_similaridade, axis=1)\n","\n","# média da similaridade do cosseno\n","media_similaridade = df['similaridade_cosseno'].mean()\n","\n","# salva no df\n","df.to_csv('resultados_com_similaridade.csv', sep='\\t', index=False)\n","\n","# mostra o df\n","print(df[['resposta_real', 'resposta_prevista', 'similaridade_cosseno']])"],"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"IYXpr6APpK7X","executionInfo":{"status":"ok","timestamp":1722948309931,"user_tz":180,"elapsed":8734,"user":{"displayName":"Bianka Vasconcelos","userId":"00512411367206176161"}},"outputId":"b49e0c8d-39cb-45ae-c98f-be2793dd6486"},"execution_count":null,"outputs":[{"output_type":"stream","name":"stdout","text":[" resposta_real \\\n","0 This law becomes effective thirty days from it... \n","1 The listed government officials authored rule ... \n","2 Granting falls upon coordinators' duties with ... \n","3 Field works aren't explicitly mentioned being ... \n","4 No, they cannot. According to the response fro... \n",".. ... \n","96 Resolution Nº 027/2010-CEG came into effect on... \n","97 A student who registered but wasn't selected b... 
\n","98 Foreign higher education institutions may also... \n","99 Meeting the minimal percentage thresholds alon... \n","100 Requests for accreditation from institutions w... \n","\n"," resposta_prevista similaridade_cosseno \n","0 Answer according to: Article 5: This law shall... 0.754316 \n","1 Sure, the publicly issued interpertation guida... 0.540074 \n","2 Answer according to… The act specifies that th... 0.422281 \n","3 Yes, field assignments are subject to applicat... 0.456716 \n","4 Yes, a university can issue a degree with spec... 0.553797 \n",".. ... ... \n","96 Resolution Nº 027/2010-CEG came into effect on... 0.943615 \n","97 A student receives a mention of 'dispensed' in... 0.751552 \n","98 No, any institution recognized by the Brazilia... 0.455082 \n","99 No, credit will only be awarded if the student... 0.250302 \n","100 In the Ministry of Education's office in the c... 0.451453 \n","\n","[101 rows x 3 columns]\n"]}]},{"cell_type":"code","source":["print(f'Média da similaridade do cosseno: {media_similaridade}')"],"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"QaHu_H-3tZ3b","executionInfo":{"status":"ok","timestamp":1722948321410,"user_tz":180,"elapsed":501,"user":{"displayName":"Bianka Vasconcelos","userId":"00512411367206176161"}},"outputId":"ae59dafc-43e4-4c56-f7fa-a5a31f35378a"},"execution_count":null,"outputs":[{"output_type":"stream","name":"stdout","text":["Média da similaridade do cosseno: 0.4656926949720572\n"]}]},{"cell_type":"markdown","source":["Como podemos observar, o valor médio da similaridade do cosseno foi, de 0.46, o que sugere que há um grau de similaridade entre as frases reais e previstas, mas elas **não são totalmente semelhantes**. 
Isso significa que, apesar de o modelo gerar respostas diferentes das reais, ele consegue capturar parte da essência contextual da pergunta.\n","\n","Uma possível melhoria para aumentar a similaridade do cosseno seria realizar o Fine Tuning com LORA em um modelo melhor, o que exigiria mais recursos computacionais do ambiente de execução. Outra solução é aumentar a quantidade de exemplos da base de dados sintética de instruções, visando dar mais contexto para que o modelo consiga generalizar com mais facilidade."],"metadata":{"id":"JFnCNV-2tVAk"}}]}