{ "nbformat": 4, "nbformat_minor": 0, "metadata": { "colab": { "provenance": [], "gpuType": "T4" }, "kernelspec": { "name": "python3", "display_name": "Python 3" }, "language_info": { "name": "python" }, "accelerator": "GPU", "widgets": { "application/vnd.jupyter.widget-state+json": { "a997f83e7aa64ad1849d5f622eec145d": { "model_module": "@jupyter-widgets/controls", "model_name": "HBoxModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": [ "IPY_MODEL_8889742d12364680a5a39470adde2873", "IPY_MODEL_168e3e4172cc4e36b2ca0544e0fc42b4", "IPY_MODEL_64f694d338294e5984e5895050d947c3" ], "layout": "IPY_MODEL_ce354595738b45eeb03386728d316d69" } }, "8889742d12364680a5a39470adde2873": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_d552cb6203ed4718b0504b6d80de581c", "placeholder": "​", "style": "IPY_MODEL_ae2586c27aa24a0a8c96d88d5d160e70", "value": "Generating train split: " } }, "168e3e4172cc4e36b2ca0544e0fc42b4": { "model_module": "@jupyter-widgets/controls", "model_name": "FloatProgressModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_b414fa4834174262a2608f6dfbe894e5", "max": 1, "min": 0, "orientation": "horizontal", "style": "IPY_MODEL_ee5c0c7663a64c3c85ea68373f105b42", "value": 1 } }, "64f694d338294e5984e5895050d947c3": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_0705592b068e4271bcc30a32791a47ca", "placeholder": "​", "style": "IPY_MODEL_151b2379bb6849df8dc75848717e9490", "value": " 57072/0 [00:00<00:00, 275058.13 examples/s]" } }, "ce354595738b45eeb03386728d316d69": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "d552cb6203ed4718b0504b6d80de581c": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "ae2586c27aa24a0a8c96d88d5d160e70": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "b414fa4834174262a2608f6dfbe894e5": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "20px" } }, "ee5c0c7663a64c3c85ea68373f105b42": { "model_module": "@jupyter-widgets/controls", "model_name": "ProgressStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": "" } }, "0705592b068e4271bcc30a32791a47ca": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "151b2379bb6849df8dc75848717e9490": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "d7cf2951869343e98322277dd3e52085": { "model_module": "@jupyter-widgets/controls", "model_name": "HBoxModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": [ "IPY_MODEL_864b8038624a40e899ddc8ee00d64996", "IPY_MODEL_6d45c0ee7da34f28932ab54699bd4092", "IPY_MODEL_8f86dd9f03214308b2bd9505bf249b80" ], "layout": "IPY_MODEL_c4be6df7bcc34fdc95e5bb6e72eb44ff" } }, "864b8038624a40e899ddc8ee00d64996": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_2ef30bae7c1a48329aa944559c539323", "placeholder": "​", "style": "IPY_MODEL_55a90b62a4094cf1afbf8fe183751cf9", "value": "Loading checkpoint shards: 100%" } }, "6d45c0ee7da34f28932ab54699bd4092": { "model_module": "@jupyter-widgets/controls", "model_name": "FloatProgressModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_67db80c7406a4ab7806e05451c234fdd", "max": 3, "min": 0, "orientation": "horizontal", "style": "IPY_MODEL_b213c00ebe8243a78b0ca91b40261e33", "value": 3 } }, "8f86dd9f03214308b2bd9505bf249b80": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_3a0bd7815630436982830f05768a52c3", "placeholder": "​", "style": "IPY_MODEL_2ea41b0b43de4c7db6b690d3c53ee578", "value": " 3/3 [01:09<00:00, 22.05s/it]" } }, "c4be6df7bcc34fdc95e5bb6e72eb44ff": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "2ef30bae7c1a48329aa944559c539323": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "55a90b62a4094cf1afbf8fe183751cf9": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "67db80c7406a4ab7806e05451c234fdd": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "b213c00ebe8243a78b0ca91b40261e33": { "model_module": "@jupyter-widgets/controls", "model_name": "ProgressStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": "" } }, "3a0bd7815630436982830f05768a52c3": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "2ea41b0b43de4c7db6b690d3c53ee578": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "6952dd69d233420c84f8931cd11d0b94": { "model_module": "@jupyter-widgets/controls", "model_name": "HBoxModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": [ "IPY_MODEL_1b90056f7f0a4ad681a025cf5012c607", "IPY_MODEL_8c06c04a4cf44ec396992ae04f7ad53d", "IPY_MODEL_0e09e908da8444eca0c9737dd9c93c34" ], "layout": "IPY_MODEL_f5c7882a83094141b891d5fc8b9cbf17" } }, "1b90056f7f0a4ad681a025cf5012c607": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_2e4a189f134343fe84dd0ed20939055f", "placeholder": "​", "style": "IPY_MODEL_d6dfbb37ef7c4447aaa41cc6f6436163", "value": "Map: 100%" } }, "8c06c04a4cf44ec396992ae04f7ad53d": { "model_module": "@jupyter-widgets/controls", "model_name": "FloatProgressModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_46bf9b6c73c34232a129e28176509b9a", "max": 57072, "min": 0, "orientation": "horizontal", "style": "IPY_MODEL_330a4fb368c142a38a538d78cc70cc76", "value": 57072 } }, "0e09e908da8444eca0c9737dd9c93c34": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_6144b49ad9e64ad2a68b4f85396f41bf", "placeholder": "​", "style": "IPY_MODEL_936de9b40ae84efc8b5ecb7ed6172ddd", "value": " 57072/57072 [00:24<00:00, 2290.68 examples/s]" } }, "f5c7882a83094141b891d5fc8b9cbf17": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "2e4a189f134343fe84dd0ed20939055f": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "d6dfbb37ef7c4447aaa41cc6f6436163": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "46bf9b6c73c34232a129e28176509b9a": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "330a4fb368c142a38a538d78cc70cc76": { "model_module": "@jupyter-widgets/controls", "model_name": "ProgressStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": "" } }, "6144b49ad9e64ad2a68b4f85396f41bf": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "936de9b40ae84efc8b5ecb7ed6172ddd": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "60003cd29e8241c3bd5caeacf7cd5626": { "model_module": "@jupyter-widgets/controls", "model_name": "HBoxModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HBoxModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HBoxView", "box_style": "", "children": [ "IPY_MODEL_0520ce1f42b34a009d21b547a0555215", "IPY_MODEL_602da4d2148142fb9bb34536a6eea10f", "IPY_MODEL_d372b6688dd0414fb39cf3eee89c2ee6" ], "layout": "IPY_MODEL_08d325c87f0343bdbd7f12fff31f254a" } }, "0520ce1f42b34a009d21b547a0555215": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_7cd3bd2d9a584786ad1d7724d2557573", "placeholder": "​", "style": "IPY_MODEL_981ae07b4d4545f1bcbd46d40e6faae9", "value": "Generating train split: " } }, "602da4d2148142fb9bb34536a6eea10f": { "model_module": "@jupyter-widgets/controls", "model_name": "FloatProgressModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "FloatProgressModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "ProgressView", "bar_style": "success", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_ef198ccfca194060861b2a13df189e8a", "max": 1, "min": 0, "orientation": "horizontal", "style": "IPY_MODEL_95c67b1454b64eb897ebce6db7863e10", "value": 1 } }, "d372b6688dd0414fb39cf3eee89c2ee6": { "model_module": "@jupyter-widgets/controls", "model_name": "HTMLModel", "model_module_version": "1.5.0", "state": { "_dom_classes": [], "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "HTMLModel", "_view_count": null, "_view_module": "@jupyter-widgets/controls", "_view_module_version": "1.5.0", "_view_name": "HTMLView", "description": "", "description_tooltip": null, "layout": "IPY_MODEL_dfa1de4875dd472cb3672cd06f760b4e", "placeholder": "​", "style": "IPY_MODEL_8abe94a5621b41188a4d900ce7a72fd5", "value": " 57072/0 [00:00<00:00, 117896.92 examples/s]" } }, "08d325c87f0343bdbd7f12fff31f254a": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "7cd3bd2d9a584786ad1d7724d2557573": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "981ae07b4d4545f1bcbd46d40e6faae9": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } }, "ef198ccfca194060861b2a13df189e8a": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": "20px" } }, "95c67b1454b64eb897ebce6db7863e10": { "model_module": "@jupyter-widgets/controls", "model_name": "ProgressStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "ProgressStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "bar_color": null, "description_width": "" } }, "dfa1de4875dd472cb3672cd06f760b4e": { "model_module": "@jupyter-widgets/base", "model_name": "LayoutModel", "model_module_version": "1.2.0", "state": { "_model_module": "@jupyter-widgets/base", "_model_module_version": "1.2.0", "_model_name": "LayoutModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "LayoutView", "align_content": null, "align_items": null, "align_self": null, "border": null, "bottom": null, "display": null, "flex": null, "flex_flow": null, "grid_area": null, "grid_auto_columns": null, "grid_auto_flow": null, "grid_auto_rows": null, "grid_column": null, "grid_gap": null, "grid_row": null, "grid_template_areas": null, "grid_template_columns": null, "grid_template_rows": null, "height": null, "justify_content": null, "justify_items": null, "left": null, "margin": null, "max_height": null, "max_width": null, "min_height": null, "min_width": null, "object_fit": null, "object_position": null, "order": null, "overflow": null, "overflow_x": null, "overflow_y": null, "padding": null, "right": null, "top": null, "visibility": null, "width": null } }, "8abe94a5621b41188a4d900ce7a72fd5": { "model_module": "@jupyter-widgets/controls", "model_name": "DescriptionStyleModel", "model_module_version": "1.5.0", "state": { "_model_module": "@jupyter-widgets/controls", "_model_module_version": "1.5.0", "_model_name": "DescriptionStyleModel", "_view_count": null, "_view_module": "@jupyter-widgets/base", "_view_module_version": "1.2.0", "_view_name": "StyleView", "description_width": "" } } } } }, "cells": [ { "cell_type": "code", "execution_count": 2, "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "collapsed": true, "id": "mDvF2OeHU4ol", "outputId": "13970a60-9584-45ed-f368-b2e6b537495f" }, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "Requirement already satisfied: pandas in /usr/local/lib/python3.12/dist-packages (2.2.2)\n", "Requirement already satisfied: datasets in /usr/local/lib/python3.12/dist-packages (4.0.0)\n", "Requirement already satisfied: transformers in /usr/local/lib/python3.12/dist-packages (4.57.0)\n", "Requirement already satisfied: peft in /usr/local/lib/python3.12/dist-packages (0.17.1)\n", "Requirement already satisfied: accelerate in /usr/local/lib/python3.12/dist-packages (1.10.1)\n", "Collecting bitsandbytes\n", " Downloading bitsandbytes-0.48.1-py3-none-manylinux_2_24_x86_64.whl.metadata (10 kB)\n", "Requirement already satisfied: numpy>=1.26.0 in /usr/local/lib/python3.12/dist-packages (from pandas) (2.0.2)\n", "Requirement already satisfied: python-dateutil>=2.8.2 in /usr/local/lib/python3.12/dist-packages (from pandas) (2.9.0.post0)\n", "Requirement already satisfied: pytz>=2020.1 in /usr/local/lib/python3.12/dist-packages (from pandas) (2025.2)\n", "Requirement already satisfied: tzdata>=2022.7 in /usr/local/lib/python3.12/dist-packages (from pandas) (2025.2)\n", "Requirement already satisfied: filelock in /usr/local/lib/python3.12/dist-packages (from datasets) (3.20.0)\n", "Requirement already satisfied: pyarrow>=15.0.0 in /usr/local/lib/python3.12/dist-packages (from datasets) (18.1.0)\n", "Requirement already satisfied: dill<0.3.9,>=0.3.0 in /usr/local/lib/python3.12/dist-packages (from datasets) (0.3.8)\n", "Requirement already satisfied: requests>=2.32.2 in /usr/local/lib/python3.12/dist-packages (from datasets) (2.32.4)\n", "Requirement already satisfied: tqdm>=4.66.3 in /usr/local/lib/python3.12/dist-packages (from datasets) (4.67.1)\n", "Requirement already satisfied: xxhash in /usr/local/lib/python3.12/dist-packages (from datasets) (3.6.0)\n", "Requirement already satisfied: multiprocess<0.70.17 in /usr/local/lib/python3.12/dist-packages (from datasets) (0.70.16)\n", "Requirement already satisfied: fsspec<=2025.3.0,>=2023.1.0 in /usr/local/lib/python3.12/dist-packages (from fsspec[http]<=2025.3.0,>=2023.1.0->datasets) (2025.3.0)\n", "Requirement already satisfied: huggingface-hub>=0.24.0 in /usr/local/lib/python3.12/dist-packages (from datasets) (0.35.3)\n", "Requirement already satisfied: packaging in /usr/local/lib/python3.12/dist-packages (from datasets) (25.0)\n", "Requirement already satisfied: pyyaml>=5.1 in /usr/local/lib/python3.12/dist-packages (from datasets) (6.0.3)\n", "Requirement already satisfied: regex!=2019.12.17 in /usr/local/lib/python3.12/dist-packages (from transformers) (2024.11.6)\n", "Requirement already satisfied: tokenizers<=0.23.0,>=0.22.0 in /usr/local/lib/python3.12/dist-packages (from transformers) (0.22.1)\n", "Requirement already satisfied: safetensors>=0.4.3 in /usr/local/lib/python3.12/dist-packages (from transformers) (0.6.2)\n", "Requirement already satisfied: psutil in /usr/local/lib/python3.12/dist-packages (from peft) (5.9.5)\n", "Requirement already satisfied: torch>=1.13.0 in /usr/local/lib/python3.12/dist-packages (from peft) (2.8.0+cu126)\n", "Requirement already satisfied: aiohttp!=4.0.0a0,!=4.0.0a1 in /usr/local/lib/python3.12/dist-packages (from fsspec[http]<=2025.3.0,>=2023.1.0->datasets) (3.13.0)\n", "Requirement already satisfied: typing-extensions>=3.7.4.3 in /usr/local/lib/python3.12/dist-packages (from huggingface-hub>=0.24.0->datasets) (4.15.0)\n", "Requirement already satisfied: hf-xet<2.0.0,>=1.1.3 in /usr/local/lib/python3.12/dist-packages (from huggingface-hub>=0.24.0->datasets) (1.1.10)\n", "Requirement already satisfied: six>=1.5 in /usr/local/lib/python3.12/dist-packages (from python-dateutil>=2.8.2->pandas) (1.17.0)\n", "Requirement already satisfied: charset_normalizer<4,>=2 in /usr/local/lib/python3.12/dist-packages (from requests>=2.32.2->datasets) (3.4.3)\n", "Requirement already satisfied: idna<4,>=2.5 in /usr/local/lib/python3.12/dist-packages (from requests>=2.32.2->datasets) (3.10)\n", "Requirement already satisfied: urllib3<3,>=1.21.1 in /usr/local/lib/python3.12/dist-packages (from requests>=2.32.2->datasets) (2.5.0)\n", "Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.12/dist-packages (from requests>=2.32.2->datasets) (2025.10.5)\n", "Requirement already satisfied: setuptools in /usr/local/lib/python3.12/dist-packages (from torch>=1.13.0->peft) (75.2.0)\n", "Requirement already satisfied: sympy>=1.13.3 in /usr/local/lib/python3.12/dist-packages (from torch>=1.13.0->peft) (1.13.3)\n", "Requirement already satisfied: networkx in /usr/local/lib/python3.12/dist-packages (from torch>=1.13.0->peft) (3.5)\n", "Requirement already satisfied: jinja2 in /usr/local/lib/python3.12/dist-packages (from torch>=1.13.0->peft) (3.1.6)\n", "Requirement already satisfied: nvidia-cuda-nvrtc-cu12==12.6.77 in /usr/local/lib/python3.12/dist-packages (from torch>=1.13.0->peft) (12.6.77)\n", "Requirement already satisfied: nvidia-cuda-runtime-cu12==12.6.77 in /usr/local/lib/python3.12/dist-packages (from torch>=1.13.0->peft) (12.6.77)\n", "Requirement already satisfied: nvidia-cuda-cupti-cu12==12.6.80 in /usr/local/lib/python3.12/dist-packages (from torch>=1.13.0->peft) (12.6.80)\n", "Requirement already satisfied: nvidia-cudnn-cu12==9.10.2.21 in /usr/local/lib/python3.12/dist-packages (from torch>=1.13.0->peft) (9.10.2.21)\n", "Requirement already satisfied: nvidia-cublas-cu12==12.6.4.1 in /usr/local/lib/python3.12/dist-packages (from torch>=1.13.0->peft) (12.6.4.1)\n", "Requirement already satisfied: nvidia-cufft-cu12==11.3.0.4 in /usr/local/lib/python3.12/dist-packages (from torch>=1.13.0->peft) (11.3.0.4)\n", "Requirement already satisfied: nvidia-curand-cu12==10.3.7.77 in /usr/local/lib/python3.12/dist-packages (from torch>=1.13.0->peft) (10.3.7.77)\n", "Requirement already satisfied: nvidia-cusolver-cu12==11.7.1.2 in /usr/local/lib/python3.12/dist-packages (from torch>=1.13.0->peft) (11.7.1.2)\n", "Requirement already satisfied: nvidia-cusparse-cu12==12.5.4.2 in /usr/local/lib/python3.12/dist-packages (from torch>=1.13.0->peft) (12.5.4.2)\n", "Requirement already satisfied: nvidia-cusparselt-cu12==0.7.1 in /usr/local/lib/python3.12/dist-packages (from torch>=1.13.0->peft) (0.7.1)\n", "Requirement already satisfied: nvidia-nccl-cu12==2.27.3 in /usr/local/lib/python3.12/dist-packages (from torch>=1.13.0->peft) (2.27.3)\n", "Requirement already satisfied: nvidia-nvtx-cu12==12.6.77 in /usr/local/lib/python3.12/dist-packages (from torch>=1.13.0->peft) (12.6.77)\n", "Requirement already satisfied: nvidia-nvjitlink-cu12==12.6.85 in /usr/local/lib/python3.12/dist-packages (from torch>=1.13.0->peft) (12.6.85)\n", "Requirement already satisfied: nvidia-cufile-cu12==1.11.1.6 in /usr/local/lib/python3.12/dist-packages (from torch>=1.13.0->peft) (1.11.1.6)\n", "Requirement already satisfied: triton==3.4.0 in /usr/local/lib/python3.12/dist-packages (from torch>=1.13.0->peft) (3.4.0)\n", "Requirement already satisfied: aiohappyeyeballs>=2.5.0 in /usr/local/lib/python3.12/dist-packages (from aiohttp!=4.0.0a0,!=4.0.0a1->fsspec[http]<=2025.3.0,>=2023.1.0->datasets) (2.6.1)\n", "Requirement already satisfied: aiosignal>=1.4.0 in /usr/local/lib/python3.12/dist-packages (from aiohttp!=4.0.0a0,!=4.0.0a1->fsspec[http]<=2025.3.0,>=2023.1.0->datasets) (1.4.0)\n", "Requirement already satisfied: attrs>=17.3.0 in /usr/local/lib/python3.12/dist-packages (from aiohttp!=4.0.0a0,!=4.0.0a1->fsspec[http]<=2025.3.0,>=2023.1.0->datasets) (25.4.0)\n", "Requirement already satisfied: frozenlist>=1.1.1 in /usr/local/lib/python3.12/dist-packages (from aiohttp!=4.0.0a0,!=4.0.0a1->fsspec[http]<=2025.3.0,>=2023.1.0->datasets) (1.8.0)\n", "Requirement already satisfied: multidict<7.0,>=4.5 in /usr/local/lib/python3.12/dist-packages (from aiohttp!=4.0.0a0,!=4.0.0a1->fsspec[http]<=2025.3.0,>=2023.1.0->datasets) (6.7.0)\n", "Requirement already satisfied: propcache>=0.2.0 in /usr/local/lib/python3.12/dist-packages (from aiohttp!=4.0.0a0,!=4.0.0a1->fsspec[http]<=2025.3.0,>=2023.1.0->datasets) (0.3.2)\n", "Requirement already satisfied: yarl<2.0,>=1.17.0 in /usr/local/lib/python3.12/dist-packages (from aiohttp!=4.0.0a0,!=4.0.0a1->fsspec[http]<=2025.3.0,>=2023.1.0->datasets) (1.22.0)\n", "Requirement already satisfied: mpmath<1.4,>=1.1.0 in /usr/local/lib/python3.12/dist-packages (from sympy>=1.13.3->torch>=1.13.0->peft) (1.3.0)\n", "Requirement already satisfied: MarkupSafe>=2.0 in /usr/local/lib/python3.12/dist-packages (from jinja2->torch>=1.13.0->peft) (3.0.3)\n", "Downloading bitsandbytes-0.48.1-py3-none-manylinux_2_24_x86_64.whl (60.1 MB)\n", "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m60.1/60.1 MB\u001b[0m \u001b[31m14.9 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", "\u001b[?25hInstalling collected packages: bitsandbytes\n", "Successfully installed bitsandbytes-0.48.1\n" ] } ], "source": [ "pip install pandas datasets transformers peft accelerate bitsandbytes\n" ] }, { "cell_type": "code", "source": [ "import pandas as pd\n", "import json\n", "import os\n", "\n", "files = [\n", " \"/content/Stress.csv\",\n", " \"/content/ds.csv\",\n", " \"/content/ocd_patient_dataset.csv\",\n", " \"/content/synthetic_ptsd_patients.csv\",\n", " \"/content/Mental health Depression disorder Data.csv\",\n", " \"/content/Copy of ds.csv\"\n", "]\n", "\n", "question_cols = [\n", " \"question\", \"questions\", \"prompt\", \"input\", \"q\", \"query\", \"text\", \"phrase\"\n", "]\n", "answer_cols = [\n", " \"answer\", \"answers\", \"response\", \"output\", \"a\", \"completion\", \"reply\", \"label\", \"sentiment\"\n", "]\n", "\n", "all_dfs = []\n", "qa_examples = [] # For mental health depression dataset\n", "\n", "for f in files:\n", " ext = os.path.splitext(f)[1].lower()\n", " if ext != \".csv\":\n", " print(f\"⚠️ Skipping non-CSV file: {f}\")\n", " continue\n", "\n", " try:\n", " try:\n", " df = pd.read_csv(f, encoding=\"utf-8\")\n", " except UnicodeDecodeError:\n", " df = pd.read_csv(f, encoding=\"latin1\")\n", " except Exception as e:\n", " print(f\"⚠️ Could not read {f}: {e}\")\n", " continue\n", "\n", " df.columns = [c.strip() for c in df.columns]\n", "\n", " # Process Mental health Depression disorder Data.csv using your working snippet\n", " if os.path.basename(f) == \"Mental health Depression disorder Data.csv\":\n", " disorder_cols = [\n", " 'Schizophrenia (%)',\n", " 'Bipolar disorder (%)',\n", " 'Eating disorders (%)',\n", " 'Anxiety disorders (%)',\n", " 'Drug use disorders (%)',\n", " 'Depression (%)',\n", " 'Alcohol use disorders (%)'\n", " ]\n", "\n", " for _, row in df.iterrows():\n", " entity = row['Entity']\n", " year = row['Year']\n", " for disorder in disorder_cols:\n", " value = row[disorder]\n", " if pd.isna(value):\n", " continue\n", " question = f\"What is the percentage of {disorder.replace(' (%)', '')} in {entity} for year {year}?\"\n", " answer = f\"{value}%\"\n", " qa_examples.append({\n", " \"instruction\": question,\n", " \"input\": \"\",\n", " \"output\": answer\n", " })\n", " print(f\"✅ Generated {len(qa_examples)} Q&A examples from {f}\")\n", "\n", " elif os.path.basename(f) == \"ocd_patient_dataset.csv\":\n", " if \"Obsession Type\" in df.columns and \"Compulsion Type\" in df.columns:\n", " df_sub = df[[\"Obsession Type\", \"Compulsion Type\"]].rename(columns={\n", " \"Obsession Type\": \"Question\",\n", " \"Compulsion Type\": \"Answer\"\n", " })\n", " df_sub = df_sub.dropna(subset=[\"Question\", \"Answer\"])\n", " all_dfs.append(df_sub)\n", " print(f\"✅ Loaded {len(df_sub)} rows from {f}\")\n", " else:\n", " print(f\"⚠️ Skipping {f}: Missing 'Obsession Type' or 'Compulsion Type' columns\")\n", "\n", " elif os.path.basename(f) == \"synthetic_ptsd_patients.csv\":\n", " if \"trauma_type\" in df.columns and \"has_ptsd\" in df.columns:\n", " df_sub = df[[\"trauma_type\", \"has_ptsd\"]].rename(columns={\n", " \"trauma_type\": \"Question\",\n", " \"has_ptsd\": \"Answer\"\n", " })\n", " df_sub = df_sub.dropna(subset=[\"Question\", \"Answer\"])\n", " all_dfs.append(df_sub)\n", " print(f\"✅ Loaded {len(df_sub)} rows from {f}\")\n", " else:\n", " print(f\"⚠️ Skipping {f}: Missing 'trauma_type' or 'has_ptsd' columns\")\n", "\n", " else:\n", " # Generic Q&A detection for other files\n", " df.columns = [c.lower() for c in df.columns] # normalize for matching\n", " q_col = next((c for c in df.columns if c in [qc.lower() for qc in question_cols]), None)\n", " a_col = next((c for c in df.columns if c in [ac.lower() for ac in answer_cols]), None)\n", " if not q_col or not a_col:\n", " print(f\"⚠️ Skipping {f}: Missing 'Question' or 'Answer' column\")\n", " continue\n", " df_sub = df[[q_col, a_col]].rename(columns={q_col: \"Question\", a_col: \"Answer\"})\n", " df_sub = df_sub.dropna(subset=[\"Question\", \"Answer\"])\n", " all_dfs.append(df_sub)\n", " print(f\"✅ Loaded {len(df_sub)} rows from {f}\")\n", "\n", "# Combine normal Q/A datasets\n", "if all_dfs:\n", " df_combined = pd.concat(all_dfs, ignore_index=True)\n", "else:\n", " df_combined = pd.DataFrame(columns=[\"Question\", \"Answer\"])\n", "\n", "# Write all data to JSONL\n", "with open(\"training_data.jsonl\", \"w\", encoding=\"utf-8\") as f_out:\n", " for _, row in df_combined.iterrows():\n", " q = str(row[\"Question\"]).strip()\n", " a = str(row[\"Answer\"]).strip()\n", " if q and a:\n", " example = {\"instruction\": q, \"input\": \"\", \"output\": a}\n", " f_out.write(json.dumps(example, ensure_ascii=False) + \"\\n\")\n", "\n", " for example in qa_examples:\n", " f_out.write(json.dumps(example, ensure_ascii=False) + \"\\n\")\n", "\n", "total = len(df_combined) + len(qa_examples)\n", "print(f\"✅ Saved merged dataset with {total} examples to training_data.jsonl\")\n" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/" }, "id": "Xysu5AtqZ9mn", "outputId": "6466af2a-424d-45d4-ab7f-6b9ae379001c" }, "execution_count": 3, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "✅ Loaded 2838 rows from /content/Stress.csv\n", "✅ Loaded 3479 rows from /content/ds.csv\n", "✅ Loaded 1500 rows from /content/ocd_patient_dataset.csv\n", "✅ Loaded 500 rows from /content/synthetic_ptsd_patients.csv\n", "✅ Generated 45276 Q&A examples from /content/Mental health Depression disorder Data.csv\n", "✅ Loaded 3479 rows from /content/Copy of ds.csv\n", "✅ Saved merged dataset with 57072 examples to training_data.jsonl\n" ] } ] }, { "cell_type": "code", "source": [ "# Show head of each loaded CSV / processed DF\n", "for f in files:\n", " ext = os.path.splitext(f)[1].lower()\n", " if ext != \".csv\":\n", " continue\n", "\n", " try:\n", " try:\n", " df = pd.read_csv(f, encoding=\"utf-8\")\n", " except UnicodeDecodeError:\n", " df = pd.read_csv(f, encoding=\"latin1\")\n", " except Exception as e:\n", " print(f\"⚠️ Could not read {f}: {e}\")\n", " continue\n", "\n", " print(f\"\\n📄 Head of {os.path.basename(f)}:\")\n", " display(df.head(5)) # top 5 rows\n" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 1000 }, "id": "FNvKM7TRZbRJ", "outputId": "00eb85c6-f5de-418e-dd96-4f6268504a57" }, "execution_count": 4, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "\n", "📄 Head of Stress.csv:\n" ] }, { "output_type": "display_data", "data": { "text/plain": [ " subreddit post_id sentence_range \\\n", "0 ptsd 8601tu (15, 20) \n", "1 assistance 8lbrx9 (0, 5) \n", "2 ptsd 9ch1zh (15, 20) \n", "3 relationships 7rorpp [5, 10] \n", "4 survivorsofabuse 9p2gbc [0, 5] \n", "\n", " text label confidence \\\n", "0 He said he had not felt that way before, sugge... 1 0.8 \n", "1 Hey there r/assistance, Not sure if this is th... 0 1.0 \n", "2 My mom then hit me with the newspaper and it s... 1 0.8 \n", "3 until i met my new boyfriend, he is amazing, h... 1 0.6 \n", "4 October is Domestic Violence Awareness Month a... 1 0.8 \n", "\n", " social_timestamp \n", "0 1521614353 \n", "1 1527009817 \n", "2 1535935605 \n", "3 1516429555 \n", "4 1539809005 " ], "text/html": [ "\n", "
\n", "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
subredditpost_idsentence_rangetextlabelconfidencesocial_timestamp
0ptsd8601tu(15, 20)He said he had not felt that way before, sugge...10.81521614353
1assistance8lbrx9(0, 5)Hey there r/assistance, Not sure if this is th...01.01527009817
2ptsd9ch1zh(15, 20)My mom then hit me with the newspaper and it s...10.81535935605
3relationships7rorpp[5, 10]until i met my new boyfriend, he is amazing, h...10.61516429555
4survivorsofabuse9p2gbc[0, 5]October is Domestic Violence Awareness Month a...10.81539809005
\n", "
\n", "
\n", "\n", "
\n", " \n", "\n", " \n", "\n", " \n", "
\n", "\n", "\n", "
\n", " \n", "\n", "\n", "\n", " \n", "
\n", "\n", "
\n", "
\n" ], "application/vnd.google.colaboratory.intrinsic+json": { "type": "dataframe", "summary": "{\n \"name\": \" display(df\",\n \"rows\": 5,\n \"fields\": [\n {\n \"column\": \"subreddit\",\n \"properties\": {\n \"dtype\": \"string\",\n \"num_unique_values\": 4,\n \"samples\": [\n \"assistance\",\n \"survivorsofabuse\",\n \"ptsd\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"post_id\",\n \"properties\": {\n \"dtype\": \"string\",\n \"num_unique_values\": 5,\n \"samples\": [\n \"8lbrx9\",\n \"9p2gbc\",\n \"9ch1zh\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"sentence_range\",\n \"properties\": {\n \"dtype\": \"string\",\n \"num_unique_values\": 4,\n \"samples\": [\n \"(0, 5)\",\n \"[0, 5]\",\n \"(15, 20)\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"text\",\n \"properties\": {\n \"dtype\": \"string\",\n \"num_unique_values\": 5,\n \"samples\": [\n \"Hey there r/assistance, Not sure if this is the right place to post this.. but here goes =) I'm currently a student intern at Sandia National Labs and working on a survey to help improve our marketing outreach efforts at the many schools we recruit at around the country. We're looking for current undergrad/grad STEM students so if you're a STEM student or know STEM students, I would greatly appreciate if you can help take or pass along this short survey. As a thank you, everyone who helps take the survey will be entered in to a drawing for chance to win one of three $50 Amazon gcs.\",\n \"October is Domestic Violence Awareness Month and I am a domestic violence survivor who is still struggling, even after over four years. Lately I have been feeling very angry. Angry that my abusive ex received no real consequences for his actions. This man abused me in all manners: physically, sexually, emotionally, verbally, financially, etc. I was granted a restraining order against him (and it was renewed a year later) but I was unable to press criminal charges against him because I didn\\u2019t have enough evidence to have a case.\",\n \"My mom then hit me with the newspaper and it shocked me that she would do this, she knows I don't like play hitting, smacking, striking, hitting or violence of any sort on my person. Do I send out this vibe asking for it from the universe? Then yesterday I decided to take my friend to go help another \\\"friend\\\" move to a new place. While we were driving the friend we are moving strikes me on my shoulder. And I address it immediately because this is the 4th time I have told him not to do these things, then my other friend who is driving nearly gets into an collision with another car i think because he was high on marijuana and the friend we are moving in the backseat is like \\\"you have to understand I was just trying to get your attention\\\" you know the thing 5 year olds do to get peoples attention by smacking them, this guy is in his 60's.\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"label\",\n \"properties\": {\n \"dtype\": \"number\",\n \"std\": 0,\n \"min\": 0,\n \"max\": 1,\n \"num_unique_values\": 2,\n \"samples\": [\n 0,\n 1\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"confidence\",\n \"properties\": {\n \"dtype\": \"number\",\n \"std\": 0.14142135623730953,\n \"min\": 0.6,\n \"max\": 1.0,\n \"num_unique_values\": 3,\n \"samples\": [\n 0.8,\n 1.0\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"social_timestamp\",\n \"properties\": {\n \"dtype\": \"number\",\n \"std\": 9720225,\n \"min\": 1516429555,\n \"max\": 1539809005,\n \"num_unique_values\": 5,\n \"samples\": [\n 1527009817,\n 1539809005\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n }\n ]\n}" } }, "metadata": {} }, { "output_type": "stream", "name": "stdout", "text": [ "\n", "📄 Head of ds.csv:\n" ] }, { "output_type": "display_data", "data": { "text/plain": [ " phrase sentiment\n", "0 \"I love spending time with my family.\" positive\n", "1 \"Sunshine always brightens my day.\" positive\n", "2 \"Helping others is so rewarding.\" positive\n", "3 \"A good book can transport you to another world.\" positive\n", "4 \"The smell of freshly baked bread is amazing.\" positive" ], "text/html": [ "\n", "
\n", "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
phrasesentiment
0\"I love spending time with my family.\"positive
1\"Sunshine always brightens my day.\"positive
2\"Helping others is so rewarding.\"positive
3\"A good book can transport you to another world.\"positive
4\"The smell of freshly baked bread is amazing.\"positive
\n", "
\n", "
\n", "\n", "
\n", " \n", "\n", " \n", "\n", " \n", "
\n", "\n", "\n", "
\n", " \n", "\n", "\n", "\n", " \n", "
\n", "\n", "
\n", "
\n" ], "application/vnd.google.colaboratory.intrinsic+json": { "type": "dataframe", "summary": "{\n \"name\": \" display(df\",\n \"rows\": 5,\n \"fields\": [\n {\n \"column\": \"phrase\",\n \"properties\": {\n \"dtype\": \"string\",\n \"num_unique_values\": 5,\n \"samples\": [\n \"\\\"Sunshine always brightens my day.\\\"\",\n \"\\\"The smell of freshly baked bread is amazing.\\\"\",\n \"\\\"Helping others is so rewarding.\\\"\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"sentiment\",\n \"properties\": {\n \"dtype\": \"category\",\n \"num_unique_values\": 1,\n \"samples\": [\n \"positive\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n }\n ]\n}" } }, "metadata": {} }, { "output_type": "stream", "name": "stdout", "text": [ "\n", "📄 Head of ocd_patient_dataset.csv:\n" ] }, { "output_type": "display_data", "data": { "text/plain": [ " Patient ID Age Gender Ethnicity Marital Status Education Level \\\n", "0 1018 32 Female African Single Some College \n", "1 2406 69 Male African Divorced Some College \n", "2 1188 57 Male Hispanic Divorced College Degree \n", "3 6200 27 Female Hispanic Married College Degree \n", "4 5824 56 Female Hispanic Married High School \n", "\n", " OCD Diagnosis Date Duration of Symptoms (months) Previous Diagnoses \\\n", "0 2016-07-15 203 MDD \n", "1 2017-04-28 180 NaN \n", "2 2018-02-02 173 MDD \n", "3 2014-08-25 126 PTSD \n", "4 2022-02-20 168 PTSD \n", "\n", " Family History of OCD Obsession Type Compulsion Type \\\n", "0 No Harm-related Checking \n", "1 Yes Harm-related Washing \n", "2 No Contamination Checking \n", "3 Yes Symmetry Washing \n", "4 Yes Hoarding Ordering \n", "\n", " Y-BOCS Score (Obsessions) Y-BOCS Score (Compulsions) Depression Diagnosis \\\n", "0 17 10 Yes \n", "1 21 25 Yes \n", "2 3 4 No \n", "3 14 28 Yes \n", "4 39 18 No \n", "\n", " Anxiety Diagnosis Medications \n", "0 Yes SNRI \n", "1 Yes SSRI \n", "2 No Benzodiazepine \n", "3 Yes SSRI \n", "4 No NaN " ], "text/html": [ "\n", "
\n", "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
Patient IDAgeGenderEthnicityMarital StatusEducation LevelOCD Diagnosis DateDuration of Symptoms (months)Previous DiagnosesFamily History of OCDObsession TypeCompulsion TypeY-BOCS Score (Obsessions)Y-BOCS Score (Compulsions)Depression DiagnosisAnxiety DiagnosisMedications
0101832FemaleAfricanSingleSome College2016-07-15203MDDNoHarm-relatedChecking1710YesYesSNRI
1240669MaleAfricanDivorcedSome College2017-04-28180NaNYesHarm-relatedWashing2125YesYesSSRI
2118857MaleHispanicDivorcedCollege Degree2018-02-02173MDDNoContaminationChecking34NoNoBenzodiazepine
3620027FemaleHispanicMarriedCollege Degree2014-08-25126PTSDYesSymmetryWashing1428YesYesSSRI
4582456FemaleHispanicMarriedHigh School2022-02-20168PTSDYesHoardingOrdering3918NoNoNaN
\n", "
\n", "
\n", "\n", "
\n", " \n", "\n", " \n", "\n", " \n", "
\n", "\n", "\n", "
\n", " \n", "\n", "\n", "\n", " \n", "
\n", "\n", "
\n", "
\n" ], "application/vnd.google.colaboratory.intrinsic+json": { "type": "dataframe", "summary": "{\n \"name\": \" display(df\",\n \"rows\": 5,\n \"fields\": [\n {\n \"column\": \"Patient ID\",\n \"properties\": {\n \"dtype\": \"number\",\n \"std\": 2512,\n \"min\": 1018,\n \"max\": 6200,\n \"num_unique_values\": 5,\n \"samples\": [\n 2406,\n 5824,\n 1188\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"Age\",\n \"properties\": {\n \"dtype\": \"number\",\n \"std\": 17,\n \"min\": 27,\n \"max\": 69,\n \"num_unique_values\": 5,\n \"samples\": [\n 69,\n 56,\n 57\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"Gender\",\n \"properties\": {\n \"dtype\": \"category\",\n \"num_unique_values\": 2,\n \"samples\": [\n \"Male\",\n \"Female\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"Ethnicity\",\n \"properties\": {\n \"dtype\": \"category\",\n \"num_unique_values\": 2,\n \"samples\": [\n \"Hispanic\",\n \"African\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"Marital Status\",\n \"properties\": {\n \"dtype\": \"string\",\n \"num_unique_values\": 3,\n \"samples\": [\n \"Single\",\n \"Divorced\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"Education Level\",\n \"properties\": {\n \"dtype\": \"string\",\n \"num_unique_values\": 3,\n \"samples\": [\n \"Some College\",\n \"College Degree\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"OCD Diagnosis Date\",\n \"properties\": {\n \"dtype\": \"object\",\n \"num_unique_values\": 5,\n \"samples\": [\n \"2017-04-28\",\n \"2022-02-20\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"Duration of Symptoms (months)\",\n \"properties\": {\n \"dtype\": \"number\",\n \"std\": 28,\n \"min\": 126,\n \"max\": 203,\n \"num_unique_values\": 5,\n \"samples\": [\n 180,\n 168\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"Previous Diagnoses\",\n \"properties\": {\n \"dtype\": \"category\",\n \"num_unique_values\": 2,\n \"samples\": [\n \"PTSD\",\n \"MDD\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"Family History of OCD\",\n \"properties\": {\n \"dtype\": \"category\",\n \"num_unique_values\": 2,\n \"samples\": [\n \"Yes\",\n \"No\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"Obsession Type\",\n \"properties\": {\n \"dtype\": \"string\",\n \"num_unique_values\": 4,\n \"samples\": [\n \"Contamination\",\n \"Hoarding\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"Compulsion Type\",\n \"properties\": {\n \"dtype\": \"string\",\n \"num_unique_values\": 3,\n \"samples\": [\n \"Checking\",\n \"Washing\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"Y-BOCS Score (Obsessions)\",\n \"properties\": {\n \"dtype\": \"number\",\n \"std\": 13,\n \"min\": 3,\n \"max\": 39,\n \"num_unique_values\": 5,\n \"samples\": [\n 21,\n 39\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"Y-BOCS Score (Compulsions)\",\n \"properties\": {\n \"dtype\": \"number\",\n \"std\": 10,\n \"min\": 4,\n \"max\": 28,\n \"num_unique_values\": 5,\n \"samples\": [\n 25,\n 18\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"Depression Diagnosis\",\n \"properties\": {\n \"dtype\": \"category\",\n \"num_unique_values\": 2,\n \"samples\": [\n \"No\",\n \"Yes\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"Anxiety Diagnosis\",\n \"properties\": {\n \"dtype\": \"category\",\n \"num_unique_values\": 2,\n \"samples\": [\n \"No\",\n \"Yes\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"Medications\",\n \"properties\": {\n \"dtype\": \"string\",\n \"num_unique_values\": 3,\n \"samples\": [\n \"SNRI\",\n \"SSRI\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n }\n ]\n}" } }, "metadata": {} }, { "output_type": "stream", "name": "stdout", "text": [ "\n", "📄 Head of synthetic_ptsd_patients.csv:\n" ] }, { "output_type": "display_data", "data": { "text/plain": [ " patient_id age gender trauma_type intrusive_thoughts nightmares \\\n", "0 1 56 Female Accident 2 3 \n", "1 2 69 Male Combat-related 4 1 \n", "2 3 46 Male Other 2 3 \n", "3 4 32 Female Other 1 1 \n", "4 5 60 Male Natural disaster 0 4 \n", "\n", " avoidance negative_mood hypervigilance pcl5_score has_ptsd \n", "0 3 1 4 52 1 \n", "1 2 1 4 48 1 \n", "2 4 2 1 48 1 \n", "3 3 0 4 27 0 \n", "4 4 0 4 36 1 " ], "text/html": [ "\n", "
\n", "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
patient_idagegendertrauma_typeintrusive_thoughtsnightmaresavoidancenegative_moodhypervigilancepcl5_scorehas_ptsd
0156FemaleAccident23314521
1269MaleCombat-related41214481
2346MaleOther23421481
3432FemaleOther11304270
4560MaleNatural disaster04404361
\n", "
\n", "
\n", "\n", "
\n", " \n", "\n", " \n", "\n", " \n", "
\n", "\n", "\n", "
\n", " \n", "\n", "\n", "\n", " \n", "
\n", "\n", "
\n", "
\n" ], "application/vnd.google.colaboratory.intrinsic+json": { "type": "dataframe", "summary": "{\n \"name\": \" display(df\",\n \"rows\": 5,\n \"fields\": [\n {\n \"column\": \"patient_id\",\n \"properties\": {\n \"dtype\": \"number\",\n \"std\": 1,\n \"min\": 1,\n \"max\": 5,\n \"num_unique_values\": 5,\n \"samples\": [\n 2,\n 5,\n 3\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"age\",\n \"properties\": {\n \"dtype\": \"number\",\n \"std\": 14,\n \"min\": 32,\n \"max\": 69,\n \"num_unique_values\": 5,\n \"samples\": [\n 69,\n 60,\n 46\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"gender\",\n \"properties\": {\n \"dtype\": \"category\",\n \"num_unique_values\": 2,\n \"samples\": [\n \"Male\",\n \"Female\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"trauma_type\",\n \"properties\": {\n \"dtype\": \"string\",\n \"num_unique_values\": 4,\n \"samples\": [\n \"Combat-related\",\n \"Natural disaster\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"intrusive_thoughts\",\n \"properties\": {\n \"dtype\": \"number\",\n \"std\": 1,\n \"min\": 0,\n \"max\": 4,\n \"num_unique_values\": 4,\n \"samples\": [\n 4,\n 0\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"nightmares\",\n \"properties\": {\n \"dtype\": \"number\",\n \"std\": 1,\n \"min\": 1,\n \"max\": 4,\n \"num_unique_values\": 3,\n \"samples\": [\n 3,\n 1\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"avoidance\",\n \"properties\": {\n \"dtype\": \"number\",\n \"std\": 0,\n \"min\": 2,\n \"max\": 4,\n \"num_unique_values\": 3,\n \"samples\": [\n 3,\n 2\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"negative_mood\",\n \"properties\": {\n \"dtype\": \"number\",\n \"std\": 0,\n \"min\": 0,\n \"max\": 2,\n \"num_unique_values\": 3,\n \"samples\": [\n 1,\n 2\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"hypervigilance\",\n \"properties\": {\n \"dtype\": \"number\",\n \"std\": 1,\n \"min\": 1,\n \"max\": 4,\n \"num_unique_values\": 2,\n \"samples\": [\n 1,\n 4\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"pcl5_score\",\n \"properties\": {\n \"dtype\": \"number\",\n \"std\": 10,\n \"min\": 27,\n \"max\": 52,\n \"num_unique_values\": 4,\n \"samples\": [\n 48,\n 36\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"has_ptsd\",\n \"properties\": {\n \"dtype\": \"number\",\n \"std\": 0,\n \"min\": 0,\n \"max\": 1,\n \"num_unique_values\": 2,\n \"samples\": [\n 0,\n 1\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n }\n ]\n}" } }, "metadata": {} }, { "output_type": "stream", "name": "stdout", "text": [ "\n", "📄 Head of Mental health Depression disorder Data.csv:\n" ] }, { "output_type": "display_data", "data": { "text/plain": [ " Entity Code Year Schizophrenia (%) Bipolar disorder (%) \\\n", "0 Afghanistan AFG 1990 0.160560 0.697779 \n", "1 Afghanistan AFG 1991 0.160312 0.697961 \n", "2 Afghanistan AFG 1992 0.160135 0.698107 \n", "3 Afghanistan AFG 1993 0.160037 0.698257 \n", "4 Afghanistan AFG 1994 0.160022 0.698469 \n", "\n", " Eating disorders (%) Anxiety disorders (%) Drug use disorders (%) \\\n", "0 0.101855 4.828830 1.677082 \n", "1 0.099313 4.829740 1.684746 \n", "2 0.096692 4.831108 1.694334 \n", "3 0.094336 4.830864 1.705320 \n", "4 0.092439 4.829423 1.716069 \n", "\n", " Depression (%) Alcohol use disorders (%) \n", "0 4.071831 0.672404 \n", "1 4.079531 0.671768 \n", "2 4.088358 0.670644 \n", "3 4.096190 0.669738 \n", "4 4.099582 0.669260 " ], "text/html": [ "\n", "
\n", "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
EntityCodeYearSchizophrenia (%)Bipolar disorder (%)Eating disorders (%)Anxiety disorders (%)Drug use disorders (%)Depression (%)Alcohol use disorders (%)
0AfghanistanAFG19900.1605600.6977790.1018554.8288301.6770824.0718310.672404
1AfghanistanAFG19910.1603120.6979610.0993134.8297401.6847464.0795310.671768
2AfghanistanAFG19920.1601350.6981070.0966924.8311081.6943344.0883580.670644
3AfghanistanAFG19930.1600370.6982570.0943364.8308641.7053204.0961900.669738
4AfghanistanAFG19940.1600220.6984690.0924394.8294231.7160694.0995820.669260
\n", "
\n", "
\n", "\n", "
\n", " \n", "\n", " \n", "\n", " \n", "
\n", "\n", "\n", "
\n", " \n", "\n", "\n", "\n", " \n", "
\n", "\n", "
\n", "
\n" ], "application/vnd.google.colaboratory.intrinsic+json": { "type": "dataframe", "summary": "{\n \"name\": \" display(df\",\n \"rows\": 5,\n \"fields\": [\n {\n \"column\": \"Entity\",\n \"properties\": {\n \"dtype\": \"category\",\n \"num_unique_values\": 1,\n \"samples\": [\n \"Afghanistan\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"Code\",\n \"properties\": {\n \"dtype\": \"category\",\n \"num_unique_values\": 1,\n \"samples\": [\n \"AFG\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"Year\",\n \"properties\": {\n \"dtype\": \"number\",\n \"std\": 1,\n \"min\": 1990,\n \"max\": 1994,\n \"num_unique_values\": 5,\n \"samples\": [\n 1991\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"Schizophrenia (%)\",\n \"properties\": {\n \"dtype\": \"number\",\n \"std\": 0.00022538296141507444,\n \"min\": 0.160022297338,\n \"max\": 0.160559542157,\n \"num_unique_values\": 5,\n \"samples\": [\n 0.16031189863\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"Bipolar disorder (%)\",\n \"properties\": {\n \"dtype\": \"number\",\n \"std\": 0.0002655595027180787,\n \"min\": 0.697779384535,\n \"max\": 0.69846911816,\n \"num_unique_values\": 5,\n \"samples\": [\n 0.697960594942\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"Eating disorders (%)\",\n \"properties\": {\n \"dtype\": \"number\",\n \"std\": 0.003771125331541788,\n \"min\": 0.0924393209042,\n \"max\": 0.101854863459,\n \"num_unique_values\": 5,\n \"samples\": [\n 0.0993127900960999\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"Anxiety disorders (%)\",\n \"properties\": {\n \"dtype\": \"number\",\n \"std\": 0.0009674370993802713,\n \"min\": 4.82882970499999,\n \"max\": 4.83110836569,\n \"num_unique_values\": 5,\n \"samples\": [\n 4.82974037241\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"Drug use disorders (%)\",\n \"properties\": {\n \"dtype\": \"number\",\n \"std\": 0.015618469098137576,\n \"min\": 1.67708194479,\n \"max\": 1.71606858137,\n \"num_unique_values\": 5,\n \"samples\": [\n 1.68474573106\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"Depression (%)\",\n \"properties\": {\n \"dtype\": \"number\",\n \"std\": 0.01151549909830738,\n \"min\": 4.07183117706,\n \"max\": 4.09958157816,\n \"num_unique_values\": 5,\n \"samples\": [\n 4.07953093539999\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"Alcohol use disorders (%)\",\n \"properties\": {\n \"dtype\": \"number\",\n \"std\": 0.0013255693766667934,\n \"min\": 0.669259592734,\n \"max\": 0.672404086186,\n \"num_unique_values\": 5,\n \"samples\": [\n 0.671768123935\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n }\n ]\n}" } }, "metadata": {} }, { "output_type": "stream", "name": "stdout", "text": [ "\n", "📄 Head of Copy of ds.csv:\n" ] }, { "output_type": "display_data", "data": { "text/plain": [ " phrase sentiment\n", "0 \"I love spending time with my family.\" positive\n", "1 \"Sunshine always brightens my day.\" positive\n", "2 \"Helping others is so rewarding.\" positive\n", "3 \"A good book can transport you to another world.\" positive\n", "4 \"The smell of freshly baked bread is amazing.\" positive" ], "text/html": [ "\n", "
\n", "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
phrasesentiment
0\"I love spending time with my family.\"positive
1\"Sunshine always brightens my day.\"positive
2\"Helping others is so rewarding.\"positive
3\"A good book can transport you to another world.\"positive
4\"The smell of freshly baked bread is amazing.\"positive
\n", "
\n", "
\n", "\n", "
\n", " \n", "\n", " \n", "\n", " \n", "
\n", "\n", "\n", "
\n", " \n", "\n", "\n", "\n", " \n", "
\n", "\n", "
\n", "
\n" ], "application/vnd.google.colaboratory.intrinsic+json": { "type": "dataframe", "summary": "{\n \"name\": \" display(df\",\n \"rows\": 5,\n \"fields\": [\n {\n \"column\": \"phrase\",\n \"properties\": {\n \"dtype\": \"string\",\n \"num_unique_values\": 5,\n \"samples\": [\n \"\\\"Sunshine always brightens my day.\\\"\",\n \"\\\"The smell of freshly baked bread is amazing.\\\"\",\n \"\\\"Helping others is so rewarding.\\\"\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n },\n {\n \"column\": \"sentiment\",\n \"properties\": {\n \"dtype\": \"category\",\n \"num_unique_values\": 1,\n \"samples\": [\n \"positive\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n }\n ]\n}" } }, "metadata": {} } ] }, { "cell_type": "code", "source": [ "from datasets import load_dataset\n", "\n", "# Load the JSONL dataset\n", "dataset = load_dataset(\n", " \"json\",\n", " data_files=\"/content/training_data.jsonl\", # or training_data.jsonl\n", " split=\"train\"\n", ")\n", "\n", "print(dataset[0]) # preview first item\n" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 86, "referenced_widgets": [ "60003cd29e8241c3bd5caeacf7cd5626", "0520ce1f42b34a009d21b547a0555215", "602da4d2148142fb9bb34536a6eea10f", "d372b6688dd0414fb39cf3eee89c2ee6", "08d325c87f0343bdbd7f12fff31f254a", "7cd3bd2d9a584786ad1d7724d2557573", "981ae07b4d4545f1bcbd46d40e6faae9", "ef198ccfca194060861b2a13df189e8a", "95c67b1454b64eb897ebce6db7863e10", "dfa1de4875dd472cb3672cd06f760b4e", "8abe94a5621b41188a4d900ce7a72fd5" ] }, "id": "7ab9H8n9S6Qg", "outputId": "7f39f974-2d8d-4331-fe28-31c0cd231710" }, "execution_count": 6, "outputs": [ { "output_type": "display_data", "data": { "text/plain": [ "Generating train split: 0 examples [00:00, ? examples/s]" ], "application/vnd.jupyter.widget-view+json": { "version_major": 2, "version_minor": 0, "model_id": "60003cd29e8241c3bd5caeacf7cd5626" } }, "metadata": {} }, { "output_type": "stream", "name": "stdout", "text": [ "{'instruction': 'He said he had not felt that way before, suggeted I go rest and so ..TRIGGER AHEAD IF YOUI\\'RE A HYPOCONDRIAC LIKE ME: i decide to look up \"feelings of doom\" in hopes of maybe getting sucked into some rabbit hole of ludicrous conspiracy, a stupid \"are you psychic\" test or new age b.s., something I could even laugh at down the road. No, I ended up reading that this sense of doom can be indicative of various health ailments; one of which I am prone to.. So on top of my \"doom\" to my gloom..I am now f\\'n worried about my heart. I do happen to have a physical in 48 hours.', 'input': '', 'output': '1'}\n" ] } ] }, { "cell_type": "code", "source": [ "import torch\n", "torch.cuda.empty_cache()\n" ], "metadata": { "id": "UVYcx_zagCjn" }, "execution_count": 7, "outputs": [] }, { "cell_type": "code", "source": [ "import os\n", "os.environ[\"PYTORCH_CUDA_ALLOC_CONF\"] = \"max_split_size_mb:128\"\n" ], "metadata": { "id": "2lZ2A97_gEx4" }, "execution_count": null, "outputs": [] }, { "cell_type": "code", "source": [ "from datasets import load_dataset\n", "from transformers import AutoTokenizer, AutoModelForCausalLM, Trainer, TrainingArguments, BitsAndBytesConfig\n", "from peft import LoraConfig, get_peft_model\n", "import torch\n", "\n", "model_name = \"tanusrich/Mental_Health_Chatbot\"\n", "data_path = \"training_data.jsonl\"\n", "\n", "# Load dataset\n", "dataset = load_dataset(\"json\", data_files=data_path, split=\"train\")\n", "\n", "# Load tokenizer and model with 4-bit quantization using BitsAndBytesConfig (new way)\n", "bnb_config = BitsAndBytesConfig(load_in_4bit=True)\n", "\n", "tokenizer = AutoTokenizer.from_pretrained(model_name)\n", "model = AutoModelForCausalLM.from_pretrained(\n", " model_name,\n", " quantization_config=bnb_config,\n", " device_map=\"auto\",\n", " torch_dtype=torch.float16, # Added this parameter\n", ")\n", "\n", "# LoRA configuration for LLaMA-based model\n", "lora_config = LoraConfig(\n", " r=64,\n", " lora_alpha=16,\n", " target_modules=[\"q_proj\", \"v_proj\"], # typical for LLaMA\n", " lora_dropout=0.1,\n", " bias=\"none\",\n", " task_type=\"CAUSAL_LM\"\n", ")\n", "\n", "model = get_peft_model(model, lora_config)\n", "\n", "# Tokenization helper (fixed)\n", "def preprocess(examples):\n", " inputs = [\n", " instr + \"\\n\" + inp if inp else instr\n", " for instr, inp in zip(\n", " examples[\"instruction\"],\n", " examples.get(\"input\", [\"\"] * len(examples[\"instruction\"]))\n", " )\n", " ]\n", " outputs = examples[\"output\"]\n", "\n", " model_inputs = tokenizer(inputs, max_length=512, truncation=True, padding=\"max_length\")\n", " labels = tokenizer(outputs, max_length=512, truncation=True, padding=\"max_length\").input_ids\n", "\n", " model_inputs[\"labels\"] = labels\n", " return model_inputs\n", "\n", "# Apply preprocessing\n", "tokenized_dataset = dataset.map(\n", " preprocess,\n", " batched=True,\n", " remove_columns=dataset.column_names,\n", ")\n", "\n", "# Training arguments\n", "training_args = TrainingArguments(\n", " output_dir=\"./lora_mht_chatbot_finetuned\",\n", " per_device_train_batch_size=1, # Reduced batch size\n", " gradient_accumulation_steps=4, # Adjusted accumulation steps\n", " num_train_epochs=3,\n", " learning_rate=3e-4,\n", " fp16=True,\n", " save_strategy=\"epoch\",\n", " optim=\"paged_adamw_32bit\",\n", " logging_steps=10,\n", " save_total_limit=2,\n", " report_to=\"none\",\n", ")\n", "\n", "# Trainer\n", "trainer = Trainer(\n", " model=model,\n", " args=training_args,\n", " train_dataset=tokenized_dataset,\n", " tokenizer=tokenizer,\n", ")\n", "\n", "trainer.train()\n", "\n", "# Save adapters and tokenizer\n", "model.save_pretrained(\"./lora_mht_chatbot_finetuned\")\n", "tokenizer.save_pretrained(\"./lora_mht_chatbot_finetuned\")\n", "\n", "print(\"✅ Fine-tuning complete and saved!\")" ], "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 1000, "referenced_widgets": [ "a997f83e7aa64ad1849d5f622eec145d", "8889742d12364680a5a39470adde2873", "168e3e4172cc4e36b2ca0544e0fc42b4", "64f694d338294e5984e5895050d947c3", "ce354595738b45eeb03386728d316d69", "d552cb6203ed4718b0504b6d80de581c", "ae2586c27aa24a0a8c96d88d5d160e70", "b414fa4834174262a2608f6dfbe894e5", "ee5c0c7663a64c3c85ea68373f105b42", "0705592b068e4271bcc30a32791a47ca", "151b2379bb6849df8dc75848717e9490", "d7cf2951869343e98322277dd3e52085", "864b8038624a40e899ddc8ee00d64996", "6d45c0ee7da34f28932ab54699bd4092", "8f86dd9f03214308b2bd9505bf249b80", "c4be6df7bcc34fdc95e5bb6e72eb44ff", "2ef30bae7c1a48329aa944559c539323", "55a90b62a4094cf1afbf8fe183751cf9", "67db80c7406a4ab7806e05451c234fdd", "b213c00ebe8243a78b0ca91b40261e33", "3a0bd7815630436982830f05768a52c3", "2ea41b0b43de4c7db6b690d3c53ee578", "6952dd69d233420c84f8931cd11d0b94", "1b90056f7f0a4ad681a025cf5012c607", "8c06c04a4cf44ec396992ae04f7ad53d", "0e09e908da8444eca0c9737dd9c93c34", "f5c7882a83094141b891d5fc8b9cbf17", "2e4a189f134343fe84dd0ed20939055f", "d6dfbb37ef7c4447aaa41cc6f6436163", "46bf9b6c73c34232a129e28176509b9a", "330a4fb368c142a38a538d78cc70cc76", "6144b49ad9e64ad2a68b4f85396f41bf", "936de9b40ae84efc8b5ecb7ed6172ddd" ] }, "id": "beEGorh7eN3I", "outputId": "0055144c-85fb-422d-dbb2-d49b60a4e49e" }, "execution_count": null, "outputs": [ { "output_type": "display_data", "data": { "text/plain": [ "Generating train split: 0 examples [00:00, ? examples/s]" ], "application/vnd.jupyter.widget-view+json": { "version_major": 2, "version_minor": 0, "model_id": "a997f83e7aa64ad1849d5f622eec145d" } }, "metadata": {} }, { "output_type": "stream", "name": "stderr", "text": [ "`torch_dtype` is deprecated! Use `dtype` instead!\n" ] }, { "output_type": "display_data", "data": { "text/plain": [ "Loading checkpoint shards: 0%| | 0/3 [00:00" ], "text/html": [ "\n", "
\n", " \n", " \n", " [ 743/42804 1:02:40 < 59:17:37, 0.20 it/s, Epoch 0.05/3]\n", "
\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
StepTraining Loss
1023.653100
2023.332900
3023.227600
4023.208500
5023.424900
6023.403100
7023.305700
8023.368200
9023.283600
10023.233000
11023.211700
12023.203100
13023.178200
14023.331000
15023.031700
16023.388000
17023.361600
18023.361800
19023.193500
20023.318700
21023.331800
22023.256900
23023.349100
24023.115400
25023.023700
26023.321400
27022.990600
28023.115500
29023.204400
30023.366000
31022.765200
32023.341900
33023.242800
34023.098100
35023.304000
36023.417000
37023.369900
38023.214200
39023.324600
40023.313600
41023.023900
42023.100000
43023.174100
44023.301800
45023.268000
46023.215000
47022.954800
48023.131900
49023.396800
50023.423600
51023.040500
52023.399400
53023.193900
54023.395100
55023.196200
56023.387200
57023.189700
58023.188200
59023.192300
60023.410800
61022.736500
62023.095600
63022.848800
64023.120600
65023.184200
66023.107900
67023.187900
68023.264400
69023.334400
70023.149400
71023.125700
72023.182100
73023.260400
74022.861800

" ] }, "metadata": {} } ] } ] }