diff --git "a/colab_training_code.ipynb" "b/colab_training_code.ipynb" new file mode 100644--- /dev/null +++ "b/colab_training_code.ipynb" @@ -0,0 +1,2634 @@ +{ + "nbformat": 4, + "nbformat_minor": 0, + "metadata": { + "colab": { + "provenance": [], + "gpuType": "T4" + }, + "kernelspec": { + "name": "python3", + "display_name": "Python 3" + }, + "language_info": { + "name": "python" + }, + "accelerator": "GPU", + "widgets": { + "application/vnd.jupyter.widget-state+json": { + "749ba51491c044ca889995dfc29aefbe": { + "model_module": "@jupyter-widgets/controls", + "model_name": "HBoxModel", + "model_module_version": "1.5.0", + "state": { + "_dom_classes": [], + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "HBoxModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/controls", + "_view_module_version": "1.5.0", + "_view_name": "HBoxView", + "box_style": "", + "children": [ + "IPY_MODEL_6ca7365936d54911bc1400728b2530cd", + "IPY_MODEL_3e081a2f5c43489cac3f946805481b51", + "IPY_MODEL_304e1cc3bbfc4dc3bb8cb632d1bd56f6" + ], + "layout": "IPY_MODEL_4f93c4ea8e2348e0aa01fca1c47a49a5" + } + }, + "6ca7365936d54911bc1400728b2530cd": { + "model_module": "@jupyter-widgets/controls", + "model_name": "HTMLModel", + "model_module_version": "1.5.0", + "state": { + "_dom_classes": [], + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "HTMLModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/controls", + "_view_module_version": "1.5.0", + "_view_name": "HTMLView", + "description": "", + "description_tooltip": null, + "layout": "IPY_MODEL_57a45c09a4734f06bcee2b0ee323b2fe", + "placeholder": "​", + "style": "IPY_MODEL_f91722446f084d7e9d8931d47916b578", + "value": "tokenizer_config.json: 100%" + } + }, + "3e081a2f5c43489cac3f946805481b51": { + "model_module": "@jupyter-widgets/controls", + "model_name": "FloatProgressModel", + "model_module_version": "1.5.0", + "state": { + "_dom_classes": [], + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "FloatProgressModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/controls", + "_view_module_version": "1.5.0", + "_view_name": "ProgressView", + "bar_style": "success", + "description": "", + "description_tooltip": null, + "layout": "IPY_MODEL_655c6661d48547168c5d31e5e6dc1dd2", + "max": 1358, + "min": 0, + "orientation": "horizontal", + "style": "IPY_MODEL_53192790cbb04e7f91656367c6662c95", + "value": 1358 + } + }, + "304e1cc3bbfc4dc3bb8cb632d1bd56f6": { + "model_module": "@jupyter-widgets/controls", + "model_name": "HTMLModel", + "model_module_version": "1.5.0", + "state": { + "_dom_classes": [], + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "HTMLModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/controls", + "_view_module_version": "1.5.0", + "_view_name": "HTMLView", + "description": "", + "description_tooltip": null, + "layout": "IPY_MODEL_7e6f575a76974a2e922c76cb38f49091", + "placeholder": "​", + "style": "IPY_MODEL_1161d252ff7f447faab84c900d517094", + "value": " 1.36k/1.36k [00:00<00:00, 143kB/s]" + } + }, + "4f93c4ea8e2348e0aa01fca1c47a49a5": { + "model_module": "@jupyter-widgets/base", + "model_name": "LayoutModel", + "model_module_version": "1.2.0", + "state": { + "_model_module": "@jupyter-widgets/base", + "_model_module_version": "1.2.0", + "_model_name": "LayoutModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "LayoutView", + "align_content": null, + "align_items": null, + "align_self": null, + "border": null, + "bottom": null, + "display": null, + "flex": null, + "flex_flow": null, + "grid_area": null, + "grid_auto_columns": null, + "grid_auto_flow": null, + "grid_auto_rows": null, + "grid_column": null, + "grid_gap": null, + "grid_row": null, + "grid_template_areas": null, + "grid_template_columns": null, + "grid_template_rows": null, + "height": null, + "justify_content": null, + "justify_items": null, + "left": null, + "margin": null, + "max_height": null, + "max_width": null, + "min_height": null, + "min_width": null, + "object_fit": null, + "object_position": null, + "order": null, + "overflow": null, + "overflow_x": null, + "overflow_y": null, + "padding": null, + "right": null, + "top": null, + "visibility": null, + "width": null + } + }, + "57a45c09a4734f06bcee2b0ee323b2fe": { + "model_module": "@jupyter-widgets/base", + "model_name": "LayoutModel", + "model_module_version": "1.2.0", + "state": { + "_model_module": "@jupyter-widgets/base", + "_model_module_version": "1.2.0", + "_model_name": "LayoutModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "LayoutView", + "align_content": null, + "align_items": null, + "align_self": null, + "border": null, + "bottom": null, + "display": null, + "flex": null, + "flex_flow": null, + "grid_area": null, + "grid_auto_columns": null, + "grid_auto_flow": null, + "grid_auto_rows": null, + "grid_column": null, + "grid_gap": null, + "grid_row": null, + "grid_template_areas": null, + "grid_template_columns": null, + "grid_template_rows": null, + "height": null, + "justify_content": null, + "justify_items": null, + "left": null, + "margin": null, + "max_height": null, + "max_width": null, + "min_height": null, + "min_width": null, + "object_fit": null, + "object_position": null, + "order": null, + "overflow": null, + "overflow_x": null, + "overflow_y": null, + "padding": null, + "right": null, + "top": null, + "visibility": null, + "width": null + } + }, + "f91722446f084d7e9d8931d47916b578": { + "model_module": "@jupyter-widgets/controls", + "model_name": "DescriptionStyleModel", + "model_module_version": "1.5.0", + "state": { + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "DescriptionStyleModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "StyleView", + "description_width": "" + } + }, + "655c6661d48547168c5d31e5e6dc1dd2": { + "model_module": "@jupyter-widgets/base", + "model_name": "LayoutModel", + "model_module_version": "1.2.0", + "state": { + "_model_module": "@jupyter-widgets/base", + "_model_module_version": "1.2.0", + "_model_name": "LayoutModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "LayoutView", + "align_content": null, + "align_items": null, + "align_self": null, + "border": null, + "bottom": null, + "display": null, + "flex": null, + "flex_flow": null, + "grid_area": null, + "grid_auto_columns": null, + "grid_auto_flow": null, + "grid_auto_rows": null, + "grid_column": null, + "grid_gap": null, + "grid_row": null, + "grid_template_areas": null, + "grid_template_columns": null, + "grid_template_rows": null, + "height": null, + "justify_content": null, + "justify_items": null, + "left": null, + "margin": null, + "max_height": null, + "max_width": null, + "min_height": null, + "min_width": null, + "object_fit": null, + "object_position": null, + "order": null, + "overflow": null, + "overflow_x": null, + "overflow_y": null, + "padding": null, + "right": null, + "top": null, + "visibility": null, + "width": null + } + }, + "53192790cbb04e7f91656367c6662c95": { + "model_module": "@jupyter-widgets/controls", + "model_name": "ProgressStyleModel", + "model_module_version": "1.5.0", + "state": { + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "ProgressStyleModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "StyleView", + "bar_color": null, + "description_width": "" + } + }, + "7e6f575a76974a2e922c76cb38f49091": { + "model_module": "@jupyter-widgets/base", + "model_name": "LayoutModel", + "model_module_version": "1.2.0", + "state": { + "_model_module": "@jupyter-widgets/base", + "_model_module_version": "1.2.0", + "_model_name": "LayoutModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "LayoutView", + "align_content": null, + "align_items": null, + "align_self": null, + "border": null, + "bottom": null, + "display": null, + "flex": null, + "flex_flow": null, + "grid_area": null, + "grid_auto_columns": null, + "grid_auto_flow": null, + "grid_auto_rows": null, + "grid_column": null, + "grid_gap": null, + "grid_row": null, + "grid_template_areas": null, + "grid_template_columns": null, + "grid_template_rows": null, + "height": null, + "justify_content": null, + "justify_items": null, + "left": null, + "margin": null, + "max_height": null, + "max_width": null, + "min_height": null, + "min_width": null, + "object_fit": null, + "object_position": null, + "order": null, + "overflow": null, + "overflow_x": null, + "overflow_y": null, + "padding": null, + "right": null, + "top": null, + "visibility": null, + "width": null + } + }, + "1161d252ff7f447faab84c900d517094": { + "model_module": "@jupyter-widgets/controls", + "model_name": "DescriptionStyleModel", + "model_module_version": "1.5.0", + "state": { + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "DescriptionStyleModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "StyleView", + "description_width": "" + } + }, + "1891eebf624d447eb97f4d776768bf78": { + "model_module": "@jupyter-widgets/controls", + "model_name": "HBoxModel", + "model_module_version": "1.5.0", + "state": { + "_dom_classes": [], + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "HBoxModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/controls", + "_view_module_version": "1.5.0", + "_view_name": "HBoxView", + "box_style": "", + "children": [ + "IPY_MODEL_0fec18fdbb1c409d94138ef1a36552d6", + "IPY_MODEL_bd1f0fec3a1943f28ce011efc23c8917", + "IPY_MODEL_2540139421bc4b8fb2b9bf08d5892ef5" + ], + "layout": "IPY_MODEL_4d047da57c934721bce6d7ad1713eac6" + } + }, + "0fec18fdbb1c409d94138ef1a36552d6": { + "model_module": "@jupyter-widgets/controls", + "model_name": "HTMLModel", + "model_module_version": "1.5.0", + "state": { + "_dom_classes": [], + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "HTMLModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/controls", + "_view_module_version": "1.5.0", + "_view_name": "HTMLView", + "description": "", + "description_tooltip": null, + "layout": "IPY_MODEL_54380f4cdee44342af0ed98222b4535a", + "placeholder": "​", + "style": "IPY_MODEL_7366beb4e89849dd840938f92559a781", + "value": "vocab.txt: 100%" + } + }, + "bd1f0fec3a1943f28ce011efc23c8917": { + "model_module": "@jupyter-widgets/controls", + "model_name": "FloatProgressModel", + "model_module_version": "1.5.0", + "state": { + "_dom_classes": [], + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "FloatProgressModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/controls", + "_view_module_version": "1.5.0", + "_view_name": "ProgressView", + "bar_style": "success", + "description": "", + "description_tooltip": null, + "layout": "IPY_MODEL_4b84171b90a34458bbd53c4eaf4622bf", + "max": 231508, + "min": 0, + "orientation": "horizontal", + "style": "IPY_MODEL_661a10fe1a154cd3b148766107f20799", + "value": 231508 + } + }, + "2540139421bc4b8fb2b9bf08d5892ef5": { + "model_module": "@jupyter-widgets/controls", + "model_name": "HTMLModel", + "model_module_version": "1.5.0", + "state": { + "_dom_classes": [], + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "HTMLModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/controls", + "_view_module_version": "1.5.0", + "_view_name": "HTMLView", + "description": "", + "description_tooltip": null, + "layout": "IPY_MODEL_2e1fc1da15dd4e089bdcbfefd95a62f2", + "placeholder": "​", + "style": "IPY_MODEL_4175abfad0b8436faeaac53da1965c02", + "value": " 232k/232k [00:00<00:00, 11.6MB/s]" + } + }, + "4d047da57c934721bce6d7ad1713eac6": { + "model_module": "@jupyter-widgets/base", + "model_name": "LayoutModel", + "model_module_version": "1.2.0", + "state": { + "_model_module": "@jupyter-widgets/base", + "_model_module_version": "1.2.0", + "_model_name": "LayoutModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "LayoutView", + "align_content": null, + "align_items": null, + "align_self": null, + "border": null, + "bottom": null, + "display": null, + "flex": null, + "flex_flow": null, + "grid_area": null, + "grid_auto_columns": null, + "grid_auto_flow": null, + "grid_auto_rows": null, + "grid_column": null, + "grid_gap": null, + "grid_row": null, + "grid_template_areas": null, + "grid_template_columns": null, + "grid_template_rows": null, + "height": null, + "justify_content": null, + "justify_items": null, + "left": null, + "margin": null, + "max_height": null, + "max_width": null, + "min_height": null, + "min_width": null, + "object_fit": null, + "object_position": null, + "order": null, + "overflow": null, + "overflow_x": null, + "overflow_y": null, + "padding": null, + "right": null, + "top": null, + "visibility": null, + "width": null + } + }, + "54380f4cdee44342af0ed98222b4535a": { + "model_module": "@jupyter-widgets/base", + "model_name": "LayoutModel", + "model_module_version": "1.2.0", + "state": { + "_model_module": "@jupyter-widgets/base", + "_model_module_version": "1.2.0", + "_model_name": "LayoutModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "LayoutView", + "align_content": null, + "align_items": null, + "align_self": null, + "border": null, + "bottom": null, + "display": null, + "flex": null, + "flex_flow": null, + "grid_area": null, + "grid_auto_columns": null, + "grid_auto_flow": null, + "grid_auto_rows": null, + "grid_column": null, + "grid_gap": null, + "grid_row": null, + "grid_template_areas": null, + "grid_template_columns": null, + "grid_template_rows": null, + "height": null, + "justify_content": null, + "justify_items": null, + "left": null, + "margin": null, + "max_height": null, + "max_width": null, + "min_height": null, + "min_width": null, + "object_fit": null, + "object_position": null, + "order": null, + "overflow": null, + "overflow_x": null, + "overflow_y": null, + "padding": null, + "right": null, + "top": null, + "visibility": null, + "width": null + } + }, + "7366beb4e89849dd840938f92559a781": { + "model_module": "@jupyter-widgets/controls", + "model_name": "DescriptionStyleModel", + "model_module_version": "1.5.0", + "state": { + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "DescriptionStyleModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "StyleView", + "description_width": "" + } + }, + "4b84171b90a34458bbd53c4eaf4622bf": { + "model_module": "@jupyter-widgets/base", + "model_name": "LayoutModel", + "model_module_version": "1.2.0", + "state": { + "_model_module": "@jupyter-widgets/base", + "_model_module_version": "1.2.0", + "_model_name": "LayoutModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "LayoutView", + "align_content": null, + "align_items": null, + "align_self": null, + "border": null, + "bottom": null, + "display": null, + "flex": null, + "flex_flow": null, + "grid_area": null, + "grid_auto_columns": null, + "grid_auto_flow": null, + "grid_auto_rows": null, + "grid_column": null, + "grid_gap": null, + "grid_row": null, + "grid_template_areas": null, + "grid_template_columns": null, + "grid_template_rows": null, + "height": null, + "justify_content": null, + "justify_items": null, + "left": null, + "margin": null, + "max_height": null, + "max_width": null, + "min_height": null, + "min_width": null, + "object_fit": null, + "object_position": null, + "order": null, + "overflow": null, + "overflow_x": null, + "overflow_y": null, + "padding": null, + "right": null, + "top": null, + "visibility": null, + "width": null + } + }, + "661a10fe1a154cd3b148766107f20799": { + "model_module": "@jupyter-widgets/controls", + "model_name": "ProgressStyleModel", + "model_module_version": "1.5.0", + "state": { + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "ProgressStyleModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "StyleView", + "bar_color": null, + "description_width": "" + } + }, + "2e1fc1da15dd4e089bdcbfefd95a62f2": { + "model_module": "@jupyter-widgets/base", + "model_name": "LayoutModel", + "model_module_version": "1.2.0", + "state": { + "_model_module": "@jupyter-widgets/base", + "_model_module_version": "1.2.0", + "_model_name": "LayoutModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "LayoutView", + "align_content": null, + "align_items": null, + "align_self": null, + "border": null, + "bottom": null, + "display": null, + "flex": null, + "flex_flow": null, + "grid_area": null, + "grid_auto_columns": null, + "grid_auto_flow": null, + "grid_auto_rows": null, + "grid_column": null, + "grid_gap": null, + "grid_row": null, + "grid_template_areas": null, + "grid_template_columns": null, + "grid_template_rows": null, + "height": null, + "justify_content": null, + "justify_items": null, + "left": null, + "margin": null, + "max_height": null, + "max_width": null, + "min_height": null, + "min_width": null, + "object_fit": null, + "object_position": null, + "order": null, + "overflow": null, + "overflow_x": null, + "overflow_y": null, + "padding": null, + "right": null, + "top": null, + "visibility": null, + "width": null + } + }, + "4175abfad0b8436faeaac53da1965c02": { + "model_module": "@jupyter-widgets/controls", + "model_name": "DescriptionStyleModel", + "model_module_version": "1.5.0", + "state": { + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "DescriptionStyleModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "StyleView", + "description_width": "" + } + }, + "9fa910ebbeed4b88b1156b4acea65823": { + "model_module": "@jupyter-widgets/controls", + "model_name": "HBoxModel", + "model_module_version": "1.5.0", + "state": { + "_dom_classes": [], + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "HBoxModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/controls", + "_view_module_version": "1.5.0", + "_view_name": "HBoxView", + "box_style": "", + "children": [ + "IPY_MODEL_ba4186a2772a479f80c10cda310ce419", + "IPY_MODEL_a358c80812ee4569917bf4c50f26a455", + "IPY_MODEL_52322d1069324122a44b00847129eadc" + ], + "layout": "IPY_MODEL_4fac203df0094a2cabf8b87a4345c31a" + } + }, + "ba4186a2772a479f80c10cda310ce419": { + "model_module": "@jupyter-widgets/controls", + "model_name": "HTMLModel", + "model_module_version": "1.5.0", + "state": { + "_dom_classes": [], + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "HTMLModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/controls", + "_view_module_version": "1.5.0", + "_view_name": "HTMLView", + "description": "", + "description_tooltip": null, + "layout": "IPY_MODEL_3b833d45ac494796a9eb73eda8958a1a", + "placeholder": "​", + "style": "IPY_MODEL_c2881b79f4ed489c9b251799e36428ef", + "value": "special_tokens_map.json: 100%" + } + }, + "a358c80812ee4569917bf4c50f26a455": { + "model_module": "@jupyter-widgets/controls", + "model_name": "FloatProgressModel", + "model_module_version": "1.5.0", + "state": { + "_dom_classes": [], + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "FloatProgressModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/controls", + "_view_module_version": "1.5.0", + "_view_name": "ProgressView", + "bar_style": "success", + "description": "", + "description_tooltip": null, + "layout": "IPY_MODEL_41e42912744a460dabbe8845738d6392", + "max": 132, + "min": 0, + "orientation": "horizontal", + "style": "IPY_MODEL_c7f44a97c9ec4007bd5f5f58a6545d15", + "value": 132 + } + }, + "52322d1069324122a44b00847129eadc": { + "model_module": "@jupyter-widgets/controls", + "model_name": "HTMLModel", + "model_module_version": "1.5.0", + "state": { + "_dom_classes": [], + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "HTMLModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/controls", + "_view_module_version": "1.5.0", + "_view_name": "HTMLView", + "description": "", + "description_tooltip": null, + "layout": "IPY_MODEL_f25ebd939a734bf9abc47a0a05d328a7", + "placeholder": "​", + "style": "IPY_MODEL_48d4116634ce43cb9d85441b2812c2e2", + "value": " 132/132 [00:00<00:00, 12.8kB/s]" + } + }, + "4fac203df0094a2cabf8b87a4345c31a": { + "model_module": "@jupyter-widgets/base", + "model_name": "LayoutModel", + "model_module_version": "1.2.0", + "state": { + "_model_module": "@jupyter-widgets/base", + "_model_module_version": "1.2.0", + "_model_name": "LayoutModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "LayoutView", + "align_content": null, + "align_items": null, + "align_self": null, + "border": null, + "bottom": null, + "display": null, + "flex": null, + "flex_flow": null, + "grid_area": null, + "grid_auto_columns": null, + "grid_auto_flow": null, + "grid_auto_rows": null, + "grid_column": null, + "grid_gap": null, + "grid_row": null, + "grid_template_areas": null, + "grid_template_columns": null, + "grid_template_rows": null, + "height": null, + "justify_content": null, + "justify_items": null, + "left": null, + "margin": null, + "max_height": null, + "max_width": null, + "min_height": null, + "min_width": null, + "object_fit": null, + "object_position": null, + "order": null, + "overflow": null, + "overflow_x": null, + "overflow_y": null, + "padding": null, + "right": null, + "top": null, + "visibility": null, + "width": null + } + }, + "3b833d45ac494796a9eb73eda8958a1a": { + "model_module": "@jupyter-widgets/base", + "model_name": "LayoutModel", + "model_module_version": "1.2.0", + "state": { + "_model_module": "@jupyter-widgets/base", + "_model_module_version": "1.2.0", + "_model_name": "LayoutModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "LayoutView", + "align_content": null, + "align_items": null, + "align_self": null, + "border": null, + "bottom": null, + "display": null, + "flex": null, + "flex_flow": null, + "grid_area": null, + "grid_auto_columns": null, + "grid_auto_flow": null, + "grid_auto_rows": null, + "grid_column": null, + "grid_gap": null, + "grid_row": null, + "grid_template_areas": null, + "grid_template_columns": null, + "grid_template_rows": null, + "height": null, + "justify_content": null, + "justify_items": null, + "left": null, + "margin": null, + "max_height": null, + "max_width": null, + "min_height": null, + "min_width": null, + "object_fit": null, + "object_position": null, + "order": null, + "overflow": null, + "overflow_x": null, + "overflow_y": null, + "padding": null, + "right": null, + "top": null, + "visibility": null, + "width": null + } + }, + "c2881b79f4ed489c9b251799e36428ef": { + "model_module": "@jupyter-widgets/controls", + "model_name": "DescriptionStyleModel", + "model_module_version": "1.5.0", + "state": { + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "DescriptionStyleModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "StyleView", + "description_width": "" + } + }, + "41e42912744a460dabbe8845738d6392": { + "model_module": "@jupyter-widgets/base", + "model_name": "LayoutModel", + "model_module_version": "1.2.0", + "state": { + "_model_module": "@jupyter-widgets/base", + "_model_module_version": "1.2.0", + "_model_name": "LayoutModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "LayoutView", + "align_content": null, + "align_items": null, + "align_self": null, + "border": null, + "bottom": null, + "display": null, + "flex": null, + "flex_flow": null, + "grid_area": null, + "grid_auto_columns": null, + "grid_auto_flow": null, + "grid_auto_rows": null, + "grid_column": null, + "grid_gap": null, + "grid_row": null, + "grid_template_areas": null, + "grid_template_columns": null, + "grid_template_rows": null, + "height": null, + "justify_content": null, + "justify_items": null, + "left": null, + "margin": null, + "max_height": null, + "max_width": null, + "min_height": null, + "min_width": null, + "object_fit": null, + "object_position": null, + "order": null, + "overflow": null, + "overflow_x": null, + "overflow_y": null, + "padding": null, + "right": null, + "top": null, + "visibility": null, + "width": null + } + }, + "c7f44a97c9ec4007bd5f5f58a6545d15": { + "model_module": "@jupyter-widgets/controls", + "model_name": "ProgressStyleModel", + "model_module_version": "1.5.0", + "state": { + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "ProgressStyleModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "StyleView", + "bar_color": null, + "description_width": "" + } + }, + "f25ebd939a734bf9abc47a0a05d328a7": { + "model_module": "@jupyter-widgets/base", + "model_name": "LayoutModel", + "model_module_version": "1.2.0", + "state": { + "_model_module": "@jupyter-widgets/base", + "_model_module_version": "1.2.0", + "_model_name": "LayoutModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "LayoutView", + "align_content": null, + "align_items": null, + "align_self": null, + "border": null, + "bottom": null, + "display": null, + "flex": null, + "flex_flow": null, + "grid_area": null, + "grid_auto_columns": null, + "grid_auto_flow": null, + "grid_auto_rows": null, + "grid_column": null, + "grid_gap": null, + "grid_row": null, + "grid_template_areas": null, + "grid_template_columns": null, + "grid_template_rows": null, + "height": null, + "justify_content": null, + "justify_items": null, + "left": null, + "margin": null, + "max_height": null, + "max_width": null, + "min_height": null, + "min_width": null, + "object_fit": null, + "object_position": null, + "order": null, + "overflow": null, + "overflow_x": null, + "overflow_y": null, + "padding": null, + "right": null, + "top": null, + "visibility": null, + "width": null + } + }, + "48d4116634ce43cb9d85441b2812c2e2": { + "model_module": "@jupyter-widgets/controls", + "model_name": "DescriptionStyleModel", + "model_module_version": "1.5.0", + "state": { + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "DescriptionStyleModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "StyleView", + "description_width": "" + } + }, + "db4a5dbf7dde43aa93b960a7e4163460": { + "model_module": "@jupyter-widgets/controls", + "model_name": "HBoxModel", + "model_module_version": "1.5.0", + "state": { + "_dom_classes": [], + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "HBoxModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/controls", + "_view_module_version": "1.5.0", + "_view_name": "HBoxView", + "box_style": "", + "children": [ + "IPY_MODEL_d60ed5eb992f4d4fa2110801253ccb31", + "IPY_MODEL_18ae0aa234b146449cb4fbf034f264c5", + "IPY_MODEL_b067bc80e9f24813a3bce37010f564eb" + ], + "layout": "IPY_MODEL_488ab30966684580bce5c7408c3cafa2" + } + }, + "d60ed5eb992f4d4fa2110801253ccb31": { + "model_module": "@jupyter-widgets/controls", + "model_name": "HTMLModel", + "model_module_version": "1.5.0", + "state": { + "_dom_classes": [], + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "HTMLModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/controls", + "_view_module_version": "1.5.0", + "_view_name": "HTMLView", + "description": "", + "description_tooltip": null, + "layout": "IPY_MODEL_0890c9d3a93f4a70b593b4ccce4ad146", + "placeholder": "​", + "style": "IPY_MODEL_64b7afb7f2db4009ae65bc55d86055a5", + "value": "tokenizer.json: 100%" + } + }, + "18ae0aa234b146449cb4fbf034f264c5": { + "model_module": "@jupyter-widgets/controls", + "model_name": "FloatProgressModel", + "model_module_version": "1.5.0", + "state": { + "_dom_classes": [], + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "FloatProgressModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/controls", + "_view_module_version": "1.5.0", + "_view_name": "ProgressView", + "bar_style": "success", + "description": "", + "description_tooltip": null, + "layout": "IPY_MODEL_01b3d7b2152944f78c240ff9636545c1", + "max": 711396, + "min": 0, + "orientation": "horizontal", + "style": "IPY_MODEL_6efa68aae0224aecb1b1f8e82449e95e", + "value": 711396 + } + }, + "b067bc80e9f24813a3bce37010f564eb": { + "model_module": "@jupyter-widgets/controls", + "model_name": "HTMLModel", + "model_module_version": "1.5.0", + "state": { + "_dom_classes": [], + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "HTMLModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/controls", + "_view_module_version": "1.5.0", + "_view_name": "HTMLView", + "description": "", + "description_tooltip": null, + "layout": "IPY_MODEL_7012266bc09f4818a126c4b7ca1617f6", + "placeholder": "​", + "style": "IPY_MODEL_f127fefb404644668df0ec361cb5a40e", + "value": " 711k/711k [00:00<00:00, 3.15MB/s]" + } + }, + "488ab30966684580bce5c7408c3cafa2": { + "model_module": "@jupyter-widgets/base", + "model_name": "LayoutModel", + "model_module_version": "1.2.0", + "state": { + "_model_module": "@jupyter-widgets/base", + "_model_module_version": "1.2.0", + "_model_name": "LayoutModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "LayoutView", + "align_content": null, + "align_items": null, + "align_self": null, + "border": null, + "bottom": null, + "display": null, + "flex": null, + "flex_flow": null, + "grid_area": null, + "grid_auto_columns": null, + "grid_auto_flow": null, + "grid_auto_rows": null, + "grid_column": null, + "grid_gap": null, + "grid_row": null, + "grid_template_areas": null, + "grid_template_columns": null, + "grid_template_rows": null, + "height": null, + "justify_content": null, + "justify_items": null, + "left": null, + "margin": null, + "max_height": null, + "max_width": null, + "min_height": null, + "min_width": null, + "object_fit": null, + "object_position": null, + "order": null, + "overflow": null, + "overflow_x": null, + "overflow_y": null, + "padding": null, + "right": null, + "top": null, + "visibility": null, + "width": null + } + }, + "0890c9d3a93f4a70b593b4ccce4ad146": { + "model_module": "@jupyter-widgets/base", + "model_name": "LayoutModel", + "model_module_version": "1.2.0", + "state": { + "_model_module": "@jupyter-widgets/base", + "_model_module_version": "1.2.0", + "_model_name": "LayoutModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "LayoutView", + "align_content": null, + "align_items": null, + "align_self": null, + "border": null, + "bottom": null, + "display": null, + "flex": null, + "flex_flow": null, + "grid_area": null, + "grid_auto_columns": null, + "grid_auto_flow": null, + "grid_auto_rows": null, + "grid_column": null, + "grid_gap": null, + "grid_row": null, + "grid_template_areas": null, + "grid_template_columns": null, + "grid_template_rows": null, + "height": null, + "justify_content": null, + "justify_items": null, + "left": null, + "margin": null, + "max_height": null, + "max_width": null, + "min_height": null, + "min_width": null, + "object_fit": null, + "object_position": null, + "order": null, + "overflow": null, + "overflow_x": null, + "overflow_y": null, + "padding": null, + "right": null, + "top": null, + "visibility": null, + "width": null + } + }, + "64b7afb7f2db4009ae65bc55d86055a5": { + "model_module": "@jupyter-widgets/controls", + "model_name": "DescriptionStyleModel", + "model_module_version": "1.5.0", + "state": { + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "DescriptionStyleModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "StyleView", + "description_width": "" + } + }, + "01b3d7b2152944f78c240ff9636545c1": { + "model_module": "@jupyter-widgets/base", + "model_name": "LayoutModel", + "model_module_version": "1.2.0", + "state": { + "_model_module": "@jupyter-widgets/base", + "_model_module_version": "1.2.0", + "_model_name": "LayoutModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "LayoutView", + "align_content": null, + "align_items": null, + "align_self": null, + "border": null, + "bottom": null, + "display": null, + "flex": null, + "flex_flow": null, + "grid_area": null, + "grid_auto_columns": null, + "grid_auto_flow": null, + "grid_auto_rows": null, + "grid_column": null, + "grid_gap": null, + "grid_row": null, + "grid_template_areas": null, + "grid_template_columns": null, + "grid_template_rows": null, + "height": null, + "justify_content": null, + "justify_items": null, + "left": null, + "margin": null, + "max_height": null, + "max_width": null, + "min_height": null, + "min_width": null, + "object_fit": null, + "object_position": null, + "order": null, + "overflow": null, + "overflow_x": null, + "overflow_y": null, + "padding": null, + "right": null, + "top": null, + "visibility": null, + "width": null + } + }, + "6efa68aae0224aecb1b1f8e82449e95e": { + "model_module": "@jupyter-widgets/controls", + "model_name": "ProgressStyleModel", + "model_module_version": "1.5.0", + "state": { + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "ProgressStyleModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "StyleView", + "bar_color": null, + "description_width": "" + } + }, + "7012266bc09f4818a126c4b7ca1617f6": { + "model_module": "@jupyter-widgets/base", + "model_name": "LayoutModel", + "model_module_version": "1.2.0", + "state": { + "_model_module": "@jupyter-widgets/base", + "_model_module_version": "1.2.0", + "_model_name": "LayoutModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "LayoutView", + "align_content": null, + "align_items": null, + "align_self": null, + "border": null, + "bottom": null, + "display": null, + "flex": null, + "flex_flow": null, + "grid_area": null, + "grid_auto_columns": null, + "grid_auto_flow": null, + "grid_auto_rows": null, + "grid_column": null, + "grid_gap": null, + "grid_row": null, + "grid_template_areas": null, + "grid_template_columns": null, + "grid_template_rows": null, + "height": null, + "justify_content": null, + "justify_items": null, + "left": null, + "margin": null, + "max_height": null, + "max_width": null, + "min_height": null, + "min_width": null, + "object_fit": null, + "object_position": null, + "order": null, + "overflow": null, + "overflow_x": null, + "overflow_y": null, + "padding": null, + "right": null, + "top": null, + "visibility": null, + "width": null + } + }, + "f127fefb404644668df0ec361cb5a40e": { + "model_module": "@jupyter-widgets/controls", + "model_name": "DescriptionStyleModel", + "model_module_version": "1.5.0", + "state": { + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "DescriptionStyleModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "StyleView", + "description_width": "" + } + }, + "2f93d88de31240a18572733ad9b19b0a": { + "model_module": "@jupyter-widgets/controls", + "model_name": "HBoxModel", + "model_module_version": "1.5.0", + "state": { + "_dom_classes": [], + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "HBoxModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/controls", + "_view_module_version": "1.5.0", + "_view_name": "HBoxView", + "box_style": "", + "children": [ + "IPY_MODEL_5726e4d9459e40e98478c28f93d64d09", + "IPY_MODEL_0f955020aad445a0bb553c54c636f19a", + "IPY_MODEL_beb2dd2c6aa64a8dbeade4bec58f7830" + ], + "layout": "IPY_MODEL_f0f1b559aafe406799a47e71ad6deda7" + } + }, + "5726e4d9459e40e98478c28f93d64d09": { + "model_module": "@jupyter-widgets/controls", + "model_name": "HTMLModel", + "model_module_version": "1.5.0", + "state": { + "_dom_classes": [], + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "HTMLModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/controls", + "_view_module_version": "1.5.0", + "_view_name": "HTMLView", + "description": "", + "description_tooltip": null, + "layout": "IPY_MODEL_c44a08ff9b7546cf81a14ffe4ee703cf", + "placeholder": "​", + "style": "IPY_MODEL_3b6ee751319a49dcb275e816a612e722", + "value": "config.json: 100%" + } + }, + "0f955020aad445a0bb553c54c636f19a": { + "model_module": "@jupyter-widgets/controls", + "model_name": "FloatProgressModel", + "model_module_version": "1.5.0", + "state": { + "_dom_classes": [], + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "FloatProgressModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/controls", + "_view_module_version": "1.5.0", + "_view_name": "ProgressView", + "bar_style": "success", + "description": "", + "description_tooltip": null, + "layout": "IPY_MODEL_bcc2f99fd28449db931c0ce90ff8393e", + "max": 611, + "min": 0, + "orientation": "horizontal", + "style": "IPY_MODEL_152f1f42c5064a78b643238b5fa49f44", + "value": 611 + } + }, + "beb2dd2c6aa64a8dbeade4bec58f7830": { + "model_module": "@jupyter-widgets/controls", + "model_name": "HTMLModel", + "model_module_version": "1.5.0", + "state": { + "_dom_classes": [], + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "HTMLModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/controls", + "_view_module_version": "1.5.0", + "_view_name": "HTMLView", + "description": "", + "description_tooltip": null, + "layout": "IPY_MODEL_93da545cacf34914b40974da5141c5bf", + "placeholder": "​", + "style": "IPY_MODEL_8ada43f54bbd46edbfffe794e0a7fcce", + "value": " 611/611 [00:00<00:00, 75.4kB/s]" + } + }, + "f0f1b559aafe406799a47e71ad6deda7": { + "model_module": "@jupyter-widgets/base", + "model_name": "LayoutModel", + "model_module_version": "1.2.0", + "state": { + "_model_module": "@jupyter-widgets/base", + "_model_module_version": "1.2.0", + "_model_name": "LayoutModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "LayoutView", + "align_content": null, + "align_items": null, + "align_self": null, + "border": null, + "bottom": null, + "display": null, + "flex": null, + "flex_flow": null, + "grid_area": null, + "grid_auto_columns": null, + "grid_auto_flow": null, + "grid_auto_rows": null, + "grid_column": null, + "grid_gap": null, + "grid_row": null, + "grid_template_areas": null, + "grid_template_columns": null, + "grid_template_rows": null, + "height": null, + "justify_content": null, + "justify_items": null, + "left": null, + "margin": null, + "max_height": null, + "max_width": null, + "min_height": null, + "min_width": null, + "object_fit": null, + "object_position": null, + "order": null, + "overflow": null, + "overflow_x": null, + "overflow_y": null, + "padding": null, + "right": null, + "top": null, + "visibility": null, + "width": null + } + }, + "c44a08ff9b7546cf81a14ffe4ee703cf": { + "model_module": "@jupyter-widgets/base", + "model_name": "LayoutModel", + "model_module_version": "1.2.0", + "state": { + "_model_module": "@jupyter-widgets/base", + "_model_module_version": "1.2.0", + "_model_name": "LayoutModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "LayoutView", + "align_content": null, + "align_items": null, + "align_self": null, + "border": null, + "bottom": null, + "display": null, + "flex": null, + "flex_flow": null, + "grid_area": null, + "grid_auto_columns": null, + "grid_auto_flow": null, + "grid_auto_rows": null, + "grid_column": null, + "grid_gap": null, + "grid_row": null, + "grid_template_areas": null, + "grid_template_columns": null, + "grid_template_rows": null, + "height": null, + "justify_content": null, + "justify_items": null, + "left": null, + "margin": null, + "max_height": null, + "max_width": null, + "min_height": null, + "min_width": null, + "object_fit": null, + "object_position": null, + "order": null, + "overflow": null, + "overflow_x": null, + "overflow_y": null, + "padding": null, + "right": null, + "top": null, + "visibility": null, + "width": null + } + }, + "3b6ee751319a49dcb275e816a612e722": { + "model_module": "@jupyter-widgets/controls", + "model_name": "DescriptionStyleModel", + "model_module_version": "1.5.0", + "state": { + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "DescriptionStyleModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "StyleView", + "description_width": "" + } + }, + "bcc2f99fd28449db931c0ce90ff8393e": { + "model_module": "@jupyter-widgets/base", + "model_name": "LayoutModel", + "model_module_version": "1.2.0", + "state": { + "_model_module": "@jupyter-widgets/base", + "_model_module_version": "1.2.0", + "_model_name": "LayoutModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "LayoutView", + "align_content": null, + "align_items": null, + "align_self": null, + "border": null, + "bottom": null, + "display": null, + "flex": null, + "flex_flow": null, + "grid_area": null, + "grid_auto_columns": null, + "grid_auto_flow": null, + "grid_auto_rows": null, + "grid_column": null, + "grid_gap": null, + "grid_row": null, + "grid_template_areas": null, + "grid_template_columns": null, + "grid_template_rows": null, + "height": null, + "justify_content": null, + "justify_items": null, + "left": null, + "margin": null, + "max_height": null, + "max_width": null, + "min_height": null, + "min_width": null, + "object_fit": null, + "object_position": null, + "order": null, + "overflow": null, + "overflow_x": null, + "overflow_y": null, + "padding": null, + "right": null, + "top": null, + "visibility": null, + "width": null + } + }, + "152f1f42c5064a78b643238b5fa49f44": { + "model_module": "@jupyter-widgets/controls", + "model_name": "ProgressStyleModel", + "model_module_version": "1.5.0", + "state": { + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "ProgressStyleModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "StyleView", + "bar_color": null, + "description_width": "" + } + }, + "93da545cacf34914b40974da5141c5bf": { + "model_module": "@jupyter-widgets/base", + "model_name": "LayoutModel", + "model_module_version": "1.2.0", + "state": { + "_model_module": "@jupyter-widgets/base", + "_model_module_version": "1.2.0", + "_model_name": "LayoutModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "LayoutView", + "align_content": null, + "align_items": null, + "align_self": null, + "border": null, + "bottom": null, + "display": null, + "flex": null, + "flex_flow": null, + "grid_area": null, + "grid_auto_columns": null, + "grid_auto_flow": null, + "grid_auto_rows": null, + "grid_column": null, + "grid_gap": null, + "grid_row": null, + "grid_template_areas": null, + "grid_template_columns": null, + "grid_template_rows": null, + "height": null, + "justify_content": null, + "justify_items": null, + "left": null, + "margin": null, + "max_height": null, + "max_width": null, + "min_height": null, + "min_width": null, + "object_fit": null, + "object_position": null, + "order": null, + "overflow": null, + "overflow_x": null, + "overflow_y": null, + "padding": null, + "right": null, + "top": null, + "visibility": null, + "width": null + } + }, + "8ada43f54bbd46edbfffe794e0a7fcce": { + "model_module": "@jupyter-widgets/controls", + "model_name": "DescriptionStyleModel", + "model_module_version": "1.5.0", + "state": { + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "DescriptionStyleModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "StyleView", + "description_width": "" + } + }, + "e5429e28049b4a49ab57e15f314bc5ea": { + "model_module": "@jupyter-widgets/controls", + "model_name": "HBoxModel", + "model_module_version": "1.5.0", + "state": { + "_dom_classes": [], + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "HBoxModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/controls", + "_view_module_version": "1.5.0", + "_view_name": "HBoxView", + "box_style": "", + "children": [ + "IPY_MODEL_5bb309dbd988464a9b2fc097d4886cbf", + "IPY_MODEL_90430903678e42b4bdbe415959002ef2", + "IPY_MODEL_e5199abc50b1496a983908031be4b067" + ], + "layout": "IPY_MODEL_ce964572b09c4f70a2e87c807a90dece" + } + }, + "5bb309dbd988464a9b2fc097d4886cbf": { + "model_module": "@jupyter-widgets/controls", + "model_name": "HTMLModel", + "model_module_version": "1.5.0", + "state": { + "_dom_classes": [], + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "HTMLModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/controls", + "_view_module_version": "1.5.0", + "_view_name": "HTMLView", + "description": "", + "description_tooltip": null, + "layout": "IPY_MODEL_890ef9a5c3d64009b10a8aeefb5a65f3", + "placeholder": "​", + "style": "IPY_MODEL_e50773e905314335997c834c0b3625a0", + "value": "model.safetensors: 100%" + } + }, + "90430903678e42b4bdbe415959002ef2": { + "model_module": "@jupyter-widgets/controls", + "model_name": "FloatProgressModel", + "model_module_version": "1.5.0", + "state": { + "_dom_classes": [], + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "FloatProgressModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/controls", + "_view_module_version": "1.5.0", + "_view_name": "ProgressView", + "bar_style": "success", + "description": "", + "description_tooltip": null, + "layout": "IPY_MODEL_7b5feb5a79744533877c3e9db5ce69a3", + "max": 57458416, + "min": 0, + "orientation": "horizontal", + "style": "IPY_MODEL_ba95c521730b481fa4fb3c0f3149e199", + "value": 57458416 + } + }, + "e5199abc50b1496a983908031be4b067": { + "model_module": "@jupyter-widgets/controls", + "model_name": "HTMLModel", + "model_module_version": "1.5.0", + "state": { + "_dom_classes": [], + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "HTMLModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/controls", + "_view_module_version": "1.5.0", + "_view_name": "HTMLView", + "description": "", + "description_tooltip": null, + "layout": "IPY_MODEL_add8d4b00c3b45c8aeab74a583dccf5c", + "placeholder": "​", + "style": "IPY_MODEL_80ed97a8635243c4b2ea5bec7183ad68", + "value": " 57.5M/57.5M [00:00<00:00, 199MB/s]" + } + }, + "ce964572b09c4f70a2e87c807a90dece": { + "model_module": "@jupyter-widgets/base", + "model_name": "LayoutModel", + "model_module_version": "1.2.0", + "state": { + "_model_module": "@jupyter-widgets/base", + "_model_module_version": "1.2.0", + "_model_name": "LayoutModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "LayoutView", + "align_content": null, + "align_items": null, + "align_self": null, + "border": null, + "bottom": null, + "display": null, + "flex": null, + "flex_flow": null, + "grid_area": null, + "grid_auto_columns": null, + "grid_auto_flow": null, + "grid_auto_rows": null, + "grid_column": null, + "grid_gap": null, + "grid_row": null, + "grid_template_areas": null, + "grid_template_columns": null, + "grid_template_rows": null, + "height": null, + "justify_content": null, + "justify_items": null, + "left": null, + "margin": null, + "max_height": null, + "max_width": null, + "min_height": null, + "min_width": null, + "object_fit": null, + "object_position": null, + "order": null, + "overflow": null, + "overflow_x": null, + "overflow_y": null, + "padding": null, + "right": null, + "top": null, + "visibility": null, + "width": null + } + }, + "890ef9a5c3d64009b10a8aeefb5a65f3": { + "model_module": "@jupyter-widgets/base", + "model_name": "LayoutModel", + "model_module_version": "1.2.0", + "state": { + "_model_module": "@jupyter-widgets/base", + "_model_module_version": "1.2.0", + "_model_name": "LayoutModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "LayoutView", + "align_content": null, + "align_items": null, + "align_self": null, + "border": null, + "bottom": null, + "display": null, + "flex": null, + "flex_flow": null, + "grid_area": null, + "grid_auto_columns": null, + "grid_auto_flow": null, + "grid_auto_rows": null, + "grid_column": null, + "grid_gap": null, + "grid_row": null, + "grid_template_areas": null, + "grid_template_columns": null, + "grid_template_rows": null, + "height": null, + "justify_content": null, + "justify_items": null, + "left": null, + "margin": null, + "max_height": null, + "max_width": null, + "min_height": null, + "min_width": null, + "object_fit": null, + "object_position": null, + "order": null, + "overflow": null, + "overflow_x": null, + "overflow_y": null, + "padding": null, + "right": null, + "top": null, + "visibility": null, + "width": null + } + }, + "e50773e905314335997c834c0b3625a0": { + "model_module": "@jupyter-widgets/controls", + "model_name": "DescriptionStyleModel", + "model_module_version": "1.5.0", + "state": { + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "DescriptionStyleModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "StyleView", + "description_width": "" + } + }, + "7b5feb5a79744533877c3e9db5ce69a3": { + "model_module": "@jupyter-widgets/base", + "model_name": "LayoutModel", + "model_module_version": "1.2.0", + "state": { + "_model_module": "@jupyter-widgets/base", + "_model_module_version": "1.2.0", + "_model_name": "LayoutModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "LayoutView", + "align_content": null, + "align_items": null, + "align_self": null, + "border": null, + "bottom": null, + "display": null, + "flex": null, + "flex_flow": null, + "grid_area": null, + "grid_auto_columns": null, + "grid_auto_flow": null, + "grid_auto_rows": null, + "grid_column": null, + "grid_gap": null, + "grid_row": null, + "grid_template_areas": null, + "grid_template_columns": null, + "grid_template_rows": null, + "height": null, + "justify_content": null, + "justify_items": null, + "left": null, + "margin": null, + "max_height": null, + "max_width": null, + "min_height": null, + "min_width": null, + "object_fit": null, + "object_position": null, + "order": null, + "overflow": null, + "overflow_x": null, + "overflow_y": null, + "padding": null, + "right": null, + "top": null, + "visibility": null, + "width": null + } + }, + "ba95c521730b481fa4fb3c0f3149e199": { + "model_module": "@jupyter-widgets/controls", + "model_name": "ProgressStyleModel", + "model_module_version": "1.5.0", + "state": { + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "ProgressStyleModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "StyleView", + "bar_color": null, + "description_width": "" + } + }, + "add8d4b00c3b45c8aeab74a583dccf5c": { + "model_module": "@jupyter-widgets/base", + "model_name": "LayoutModel", + "model_module_version": "1.2.0", + "state": { + "_model_module": "@jupyter-widgets/base", + "_model_module_version": "1.2.0", + "_model_name": "LayoutModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "LayoutView", + "align_content": null, + "align_items": null, + "align_self": null, + "border": null, + "bottom": null, + "display": null, + "flex": null, + "flex_flow": null, + "grid_area": null, + "grid_auto_columns": null, + "grid_auto_flow": null, + "grid_auto_rows": null, + "grid_column": null, + "grid_gap": null, + "grid_row": null, + "grid_template_areas": null, + "grid_template_columns": null, + "grid_template_rows": null, + "height": null, + "justify_content": null, + "justify_items": null, + "left": null, + "margin": null, + "max_height": null, + "max_width": null, + "min_height": null, + "min_width": null, + "object_fit": null, + "object_position": null, + "order": null, + "overflow": null, + "overflow_x": null, + "overflow_y": null, + "padding": null, + "right": null, + "top": null, + "visibility": null, + "width": null + } + }, + "80ed97a8635243c4b2ea5bec7183ad68": { + "model_module": "@jupyter-widgets/controls", + "model_name": "DescriptionStyleModel", + "model_module_version": "1.5.0", + "state": { + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "DescriptionStyleModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "StyleView", + "description_width": "" + } + } + } + } + }, + "cells": [ + { + "cell_type": "code", + "execution_count": 1, + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 967, + "referenced_widgets": [ + "749ba51491c044ca889995dfc29aefbe", + "6ca7365936d54911bc1400728b2530cd", + "3e081a2f5c43489cac3f946805481b51", + "304e1cc3bbfc4dc3bb8cb632d1bd56f6", + "4f93c4ea8e2348e0aa01fca1c47a49a5", + "57a45c09a4734f06bcee2b0ee323b2fe", + "f91722446f084d7e9d8931d47916b578", + "655c6661d48547168c5d31e5e6dc1dd2", + "53192790cbb04e7f91656367c6662c95", + "7e6f575a76974a2e922c76cb38f49091", + "1161d252ff7f447faab84c900d517094", + "1891eebf624d447eb97f4d776768bf78", + "0fec18fdbb1c409d94138ef1a36552d6", + "bd1f0fec3a1943f28ce011efc23c8917", + "2540139421bc4b8fb2b9bf08d5892ef5", + "4d047da57c934721bce6d7ad1713eac6", + "54380f4cdee44342af0ed98222b4535a", + "7366beb4e89849dd840938f92559a781", + "4b84171b90a34458bbd53c4eaf4622bf", + "661a10fe1a154cd3b148766107f20799", + "2e1fc1da15dd4e089bdcbfefd95a62f2", + "4175abfad0b8436faeaac53da1965c02", + "9fa910ebbeed4b88b1156b4acea65823", + "ba4186a2772a479f80c10cda310ce419", + "a358c80812ee4569917bf4c50f26a455", + "52322d1069324122a44b00847129eadc", + "4fac203df0094a2cabf8b87a4345c31a", + "3b833d45ac494796a9eb73eda8958a1a", + "c2881b79f4ed489c9b251799e36428ef", + "41e42912744a460dabbe8845738d6392", + "c7f44a97c9ec4007bd5f5f58a6545d15", + "f25ebd939a734bf9abc47a0a05d328a7", + "48d4116634ce43cb9d85441b2812c2e2", + "db4a5dbf7dde43aa93b960a7e4163460", + "d60ed5eb992f4d4fa2110801253ccb31", + "18ae0aa234b146449cb4fbf034f264c5", + "b067bc80e9f24813a3bce37010f564eb", + "488ab30966684580bce5c7408c3cafa2", + "0890c9d3a93f4a70b593b4ccce4ad146", + "64b7afb7f2db4009ae65bc55d86055a5", + "01b3d7b2152944f78c240ff9636545c1", + "6efa68aae0224aecb1b1f8e82449e95e", + "7012266bc09f4818a126c4b7ca1617f6", + "f127fefb404644668df0ec361cb5a40e", + "2f93d88de31240a18572733ad9b19b0a", + "5726e4d9459e40e98478c28f93d64d09", + "0f955020aad445a0bb553c54c636f19a", + "beb2dd2c6aa64a8dbeade4bec58f7830", + "f0f1b559aafe406799a47e71ad6deda7", + "c44a08ff9b7546cf81a14ffe4ee703cf", + "3b6ee751319a49dcb275e816a612e722", + "bcc2f99fd28449db931c0ce90ff8393e", + "152f1f42c5064a78b643238b5fa49f44", + "93da545cacf34914b40974da5141c5bf", + "8ada43f54bbd46edbfffe794e0a7fcce", + "e5429e28049b4a49ab57e15f314bc5ea", + "5bb309dbd988464a9b2fc097d4886cbf", + "90430903678e42b4bdbe415959002ef2", + "e5199abc50b1496a983908031be4b067", + "ce964572b09c4f70a2e87c807a90dece", + "890ef9a5c3d64009b10a8aeefb5a65f3", + "e50773e905314335997c834c0b3625a0", + "7b5feb5a79744533877c3e9db5ce69a3", + "ba95c521730b481fa4fb3c0f3149e199", + "add8d4b00c3b45c8aeab74a583dccf5c", + "80ed97a8635243c4b2ea5bec7183ad68" + ] + }, + "id": "HsmRaw4gb7cY", + "outputId": "e222cb11-111c-401a-d877-9e46f1a2f4cd" + }, + "outputs": [ + { + "output_type": "stream", + "name": "stderr", + "text": [ + "/usr/local/lib/python3.11/dist-packages/huggingface_hub/utils/_auth.py:94: UserWarning: \n", + "The secret `HF_TOKEN` does not exist in your Colab secrets.\n", + "To authenticate with the Hugging Face Hub, create a token in your settings tab (https://huggingface.co/settings/tokens), set it as secret in your Google Colab and restart your session.\n", + "You will be able to reuse this secret in all of your notebooks.\n", + "Please note that authentication is recommended but still optional to access public models or datasets.\n", + " warnings.warn(\n" + ] + }, + { + "output_type": "display_data", + "data": { + "text/plain": [ + "tokenizer_config.json: 0%| | 0.00/1.36k [00:00" + ], + "text/html": [ + "\n", + "
\n", + " \n", + " \n", + " [152460/152460 2:12:35, Epoch 5/5]\n", + "
\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
EpochTraining LossValidation LossAccuracyF1 Weighted
10.1739000.1826930.9535620.953709
20.2205000.1532530.9619570.961822
30.0578000.1251740.9695990.969571
40.0856000.1180670.9724270.972436
50.0354000.1150790.9736320.973634

" + ] + }, + "metadata": {} + }, + { + "output_type": "stream", + "name": "stderr", + "text": [ + "Training: 100%|██████████| 152460/152460 [2:12:36<00:00, 19.16step/s, epoch=5.00, step=152460]\n" + ] + }, + { + "output_type": "display_data", + "data": { + "text/plain": [ + "" + ], + "text/html": [ + "\n", + "

\n", + " \n", + " \n", + " [7623/7623 02:13]\n", + "
\n", + " " + ] + }, + "metadata": {} + }, + { + "output_type": "stream", + "name": "stdout", + "text": [ + "✅ Training complete. Model and tokenizer saved to ./neuro-nearby\n", + "✅ Model directory zipped to neuro-nearby.zip\n", + "\n", + "Running test cases...\n", + "\n", + "Test Cases Accuracy: 100.00% (6/6 correct)\n", + "✓ 'Where is the nearest airport to this location?'\n", + " Expected: airport, Predicted: airport, Confidence: 1.000\n", + "✓ 'Can I bring a laptop through airport security?'\n", + " Expected: airport, Predicted: airport, Confidence: 1.000\n", + "✓ 'How do I get to the closest airport terminal?'\n", + " Expected: airport, Predicted: airport, Confidence: 1.000\n", + "✓ 'Need help finding an accounting firm for tax planning.'\n", + " Expected: accounting firm, Predicted: accounting firm, Confidence: 1.000\n", + "✓ 'Can an accounting firm help with financial audits?'\n", + " Expected: accounting firm, Predicted: accounting firm, Confidence: 1.000\n", + "✓ 'Looking for an accounting firm to manage payroll.'\n", + " Expected: accounting firm, Predicted: accounting firm, Confidence: 1.000\n", + "✅ Test cases completed.\n" + ] + } + ], + "source": [ + "import pandas as pd\n", + "from transformers import BertTokenizer, BertForSequenceClassification, Trainer, TrainingArguments, TrainerCallback\n", + "from sklearn.model_selection import train_test_split\n", + "from sklearn.metrics import accuracy_score, f1_score\n", + "import torch\n", + "from torch.utils.data import Dataset\n", + "import shutil\n", + "from tqdm import tqdm\n", + "import numpy as np\n", + "\n", + "# === 0. Define model and output paths ===\n", + "MODEL_NAME = \"boltuix/NeuroBERT\"\n", + "OUTPUT_DIR = \"./neuro-nearby\"\n", + "\n", + "# === 1. Custom callback for tqdm progress bar ===\n", + "class TQDMProgressBarCallback(TrainerCallback):\n", + " def __init__(self):\n", + " super().__init__()\n", + " self.progress_bar = None\n", + "\n", + " def on_train_begin(self, args, state, control, **kwargs):\n", + " self.total_steps = state.max_steps\n", + " self.progress_bar = tqdm(total=self.total_steps, desc=\"Training\", unit=\"step\")\n", + "\n", + " def on_step_end(self, args, state, control, **kwargs):\n", + " self.progress_bar.update(1)\n", + " self.progress_bar.set_postfix({\n", + " \"epoch\": f\"{state.epoch:.2f}\",\n", + " \"step\": state.global_step\n", + " })\n", + "\n", + " def on_train_end(self, args, state, control, **kwargs):\n", + " if self.progress_bar is not None:\n", + " self.progress_bar.close()\n", + " self.progress_bar = None\n", + "\n", + "# === 2. Load and preprocess data ===\n", + "dataset_path = 'dataset.csv'\n", + "df = pd.read_csv(dataset_path)\n", + "df = df.dropna(subset=['category'])\n", + "df.columns = ['label', 'text'] # Rename columns\n", + "\n", + "# === 3. Encode labels ===\n", + "labels = sorted(df[\"label\"].unique())\n", + "label_to_id = {label: idx for idx, label in enumerate(labels)}\n", + "id_to_label = {idx: label for label, idx in label_to_id.items()}\n", + "df['label'] = df['label'].map(label_to_id)\n", + "\n", + "# === 4. Train-val split ===\n", + "train_texts, val_texts, train_labels, val_labels = train_test_split(\n", + " df['text'].tolist(), df['label'].tolist(), test_size=0.2, random_state=42, stratify=df['label']\n", + ")\n", + "\n", + "# === 5. Tokenizer ===\n", + "tokenizer = BertTokenizer.from_pretrained(MODEL_NAME)\n", + "\n", + "# === 6. Dataset class ===\n", + "class CategoryDataset(Dataset):\n", + " def __init__(self, texts, labels, tokenizer, max_length=128):\n", + " self.texts = texts\n", + " self.labels = labels\n", + " self.tokenizer = tokenizer\n", + " self.max_length = max_length\n", + "\n", + " def __len__(self):\n", + " return len(self.texts)\n", + "\n", + " def __getitem__(self, idx):\n", + " encoding = self.tokenizer(\n", + " self.texts[idx],\n", + " padding='max_length',\n", + " truncation=True,\n", + " max_length=self.max_length,\n", + " return_tensors='pt'\n", + " )\n", + " return {\n", + " 'input_ids': encoding['input_ids'].squeeze(0),\n", + " 'attention_mask': encoding['attention_mask'].squeeze(0),\n", + " 'labels': torch.tensor(self.labels[idx], dtype=torch.long)\n", + " }\n", + "\n", + "# === 7. Load datasets ===\n", + "train_dataset = CategoryDataset(train_texts, train_labels, tokenizer)\n", + "val_dataset = CategoryDataset(val_texts, val_labels, tokenizer)\n", + "\n", + "# === 8. Load model with num_labels ===\n", + "model = BertForSequenceClassification.from_pretrained(\n", + " MODEL_NAME,\n", + " num_labels=len(label_to_id)\n", + ")\n", + "\n", + "# === 9. Define metrics for evaluation ===\n", + "def compute_metrics(eval_pred):\n", + " logits, labels = eval_pred\n", + " predictions = np.argmax(logits, axis=-1)\n", + " acc = accuracy_score(labels, predictions)\n", + " f1 = f1_score(labels, predictions, average='weighted')\n", + " return {\n", + " 'accuracy': acc,\n", + " 'f1_weighted': f1,\n", + " }\n", + "\n", + "# === 10. Training arguments ===\n", + "training_args = TrainingArguments(\n", + " output_dir='./results',\n", + " run_name=\"NeuroNearby\",\n", + " num_train_epochs=5,\n", + " per_device_train_batch_size=16,\n", + " per_device_eval_batch_size=16,\n", + " warmup_steps=500,\n", + " weight_decay=0.01,\n", + " logging_dir='./logs',\n", + " logging_steps=10,\n", + " eval_strategy=\"epoch\", # Corrected from evaluation_strategy\n", + " report_to=\"none\"\n", + ")\n", + "\n", + "\n", + "# === 11. Trainer setup ===\n", + "trainer = Trainer(\n", + " model=model,\n", + " args=training_args,\n", + " train_dataset=train_dataset,\n", + " eval_dataset=val_dataset,\n", + " compute_metrics=compute_metrics,\n", + " callbacks=[TQDMProgressBarCallback()]\n", + ")\n", + "\n", + "# === 12. Train and evaluate ===\n", + "trainer.train()\n", + "trainer.evaluate()\n", + "\n", + "# === 13. Save model and tokenizer ===\n", + "model.config.label2id = label_to_id\n", + "model.config.id2label = id_to_label\n", + "model.config.num_labels = len(label_to_id)\n", + "\n", + "model.save_pretrained(OUTPUT_DIR)\n", + "tokenizer.save_pretrained(OUTPUT_DIR)\n", + "\n", + "# === 14. Zip model directory ===\n", + "shutil.make_archive(\"neuro-nearby\", 'zip', OUTPUT_DIR)\n", + "print(\"✅ Training complete. Model and tokenizer saved to ./neuro-nearby\")\n", + "print(\"✅ Model directory zipped to neuro-nearby.zip\")\n", + "\n", + "# === 15. Test function with confidence threshold ===\n", + "def run_test_cases(model, tokenizer, test_sentences, label_to_id, id_to_label, confidence_threshold=0.5):\n", + " model.eval()\n", + " device = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\n", + " model.to(device)\n", + "\n", + " correct = 0\n", + " total = len(test_sentences)\n", + " results = []\n", + "\n", + " for text, expected_label in test_sentences:\n", + " encoding = tokenizer(\n", + " text,\n", + " padding='max_length',\n", + " truncation=True,\n", + " max_length=128,\n", + " return_tensors='pt'\n", + " )\n", + " input_ids = encoding['input_ids'].to(device)\n", + " attention_mask = encoding['attention_mask'].to(device)\n", + "\n", + " with torch.no_grad():\n", + " outputs = model(input_ids, attention_mask=attention_mask)\n", + " probs = torch.nn.functional.softmax(outputs.logits, dim=-1)\n", + " max_prob, predicted_id = torch.max(probs, dim=1)\n", + " predicted_label = id_to_label[predicted_id.item()]\n", + " # Apply confidence threshold\n", + " if max_prob.item() < confidence_threshold:\n", + " predicted_label = \"unknown\"\n", + "\n", + " is_correct = (predicted_label == expected_label)\n", + " if is_correct:\n", + " correct += 1\n", + " results.append({\n", + " \"sentence\": text,\n", + " \"expected\": expected_label,\n", + " \"predicted\": predicted_label,\n", + " \"confidence\": max_prob.item(),\n", + " \"correct\": is_correct\n", + " })\n", + "\n", + " accuracy = correct / total * 100\n", + " print(f\"\\nTest Cases Accuracy: {accuracy:.2f}% ({correct}/{total} correct)\")\n", + "\n", + " for r in results:\n", + " status = \"✓\" if r[\"correct\"] else \"✗\"\n", + " print(f\"{status} '{r['sentence']}'\")\n", + " print(f\" Expected: {r['expected']}, Predicted: {r['predicted']}, Confidence: {r['confidence']:.3f}\")\n", + "\n", + " assert accuracy >= 70, f\"Test failed: Accuracy {accuracy:.2f}% < 70%\"\n", + " return results\n", + "\n", + "# === 16. Sample test sentences for testing ===\n", + "test_sentences = [\n", + " (\"Where is the nearest airport to this location?\", \"airport\"),\n", + " (\"Can I bring a laptop through airport security?\", \"airport\"),\n", + " (\"How do I get to the closest airport terminal?\", \"airport\"),\n", + " (\"Need help finding an accounting firm for tax planning.\", \"accounting firm\"),\n", + " (\"Can an accounting firm help with financial audits?\", \"accounting firm\"),\n", + " (\"Looking for an accounting firm to manage payroll.\", \"accounting firm\"),\n", + " # Add more diverse sentences covering your 155 categories\n", + "]\n", + "\n", + "print(\"\\nRunning test cases...\")\n", + "test_results = run_test_cases(model, tokenizer, test_sentences, label_to_id, id_to_label)\n", + "print(\"✅ Test cases completed.\")" + ] + }, + { + "cell_type": "code", + "source": [ + "# === 16. Sample test sentences for testing ===\n", + "test_sentences = [\n", + " (\"show me a store that sells snow shoes\", \"shoe store\"),\n", + " (\"Is there a hotline for reporting a malfunctioning streetlight near City Hall?\", \"city hall\"),\n", + " (\"i need to get my allergy medication refilled\", \"pharmacy\"),\n", + " (\"i have a headache\", \"pharmacy\"),\n", + " (\"Looking for a shop with bike chains.\", \"bicycle store\"),\n", + "]\n", + "print(\"\\nRunning test cases...\")\n", + "test_results = run_test_cases(model, tokenizer, test_sentences, label_to_id, id_to_label)\n", + "print(\"✅ Test cases completed.\")" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/" + }, + "id": "rTKHC6mP4keH", + "outputId": "ef0132e3-321b-4649-87f7-4f9f03000714" + }, + "execution_count": 2, + "outputs": [ + { + "output_type": "stream", + "name": "stdout", + "text": [ + "\n", + "Running test cases...\n", + "\n", + "Test Cases Accuracy: 100.00% (3/3 correct)\n", + "✓ 'show me a store that sells snow shoes'\n", + " Expected: shoe store, Predicted: shoe store, Confidence: 0.999\n", + "✓ 'Is there a hotline for reporting a malfunctioning streetlight near City Hall?'\n", + " Expected: city hall, Predicted: city hall, Confidence: 1.000\n", + "✓ 'i need to get my allergy medication refilled'\n", + " Expected: pharmacy, Predicted: pharmacy, Confidence: 0.999\n", + "✅ Test cases completed.\n" + ] + } + ] + } + ] +} \ No newline at end of file