Skip to content

Instantly share code, notes, and snippets.

@attentionmech
Created April 1, 2025 18:54
Show Gist options
  • Select an option

  • Save attentionmech/06d7852d8c7b21cb962ae006867cfe15 to your computer and use it in GitHub Desktop.

Select an option

Save attentionmech/06d7852d8c7b21cb962ae006867cfe15 to your computer and use it in GitHub Desktop.
attention-entropy.ipynb
Display the source blob
Display the rendered blob
Raw
{
"nbformat": 4,
"nbformat_minor": 0,
"metadata": {
"colab": {
"provenance": [],
"authorship_tag": "ABX9TyO8JWtHcUXJo5zkWBr66gRU",
"include_colab_link": true
},
"kernelspec": {
"name": "python3",
"display_name": "Python 3"
},
"language_info": {
"name": "python"
},
"widgets": {
"application/vnd.jupyter.widget-state+json": {
"993781067b5a419db89499a81830f9e5": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HBoxModel",
"model_module_version": "1.5.0",
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "HBoxModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
"_view_name": "HBoxView",
"box_style": "",
"children": [
"IPY_MODEL_d6429ffb94f74936b2351a6f61c1b4bd",
"IPY_MODEL_24458918a26040328739dba11c33d170",
"IPY_MODEL_5abf230fda73431487ba3791f2feabdd"
],
"layout": "IPY_MODEL_b26db6bc2ad14d61b6472b3dfd571461"
}
},
"d6429ffb94f74936b2351a6f61c1b4bd": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HTMLModel",
"model_module_version": "1.5.0",
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "HTMLModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
"_view_name": "HTMLView",
"description": "",
"description_tooltip": null,
"layout": "IPY_MODEL_398bcaa52582409da75567844a0d06f8",
"placeholder": "​",
"style": "IPY_MODEL_6b4b055317724d05869243a13b3239b5",
"value": "config.json: 100%"
}
},
"24458918a26040328739dba11c33d170": {
"model_module": "@jupyter-widgets/controls",
"model_name": "FloatProgressModel",
"model_module_version": "1.5.0",
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "FloatProgressModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
"_view_name": "ProgressView",
"bar_style": "success",
"description": "",
"description_tooltip": null,
"layout": "IPY_MODEL_b6b5a02ea1434740874f45b3d2b878d3",
"max": 718,
"min": 0,
"orientation": "horizontal",
"style": "IPY_MODEL_28a5e9ea489b4cc5a422c019663965cd",
"value": 718
}
},
"5abf230fda73431487ba3791f2feabdd": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HTMLModel",
"model_module_version": "1.5.0",
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "HTMLModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
"_view_name": "HTMLView",
"description": "",
"description_tooltip": null,
"layout": "IPY_MODEL_e0e645b02e194e579af566b5f23e1c14",
"placeholder": "​",
"style": "IPY_MODEL_3f8c1c7c5ebf4619a56928b2e1e9c383",
"value": " 718/718 [00:00<00:00, 38.9kB/s]"
}
},
"b26db6bc2ad14d61b6472b3dfd571461": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
},
"398bcaa52582409da75567844a0d06f8": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
},
"6b4b055317724d05869243a13b3239b5": {
"model_module": "@jupyter-widgets/controls",
"model_name": "DescriptionStyleModel",
"model_module_version": "1.5.0",
"state": {
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "DescriptionStyleModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "StyleView",
"description_width": ""
}
},
"b6b5a02ea1434740874f45b3d2b878d3": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
},
"28a5e9ea489b4cc5a422c019663965cd": {
"model_module": "@jupyter-widgets/controls",
"model_name": "ProgressStyleModel",
"model_module_version": "1.5.0",
"state": {
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "ProgressStyleModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "StyleView",
"bar_color": null,
"description_width": ""
}
},
"e0e645b02e194e579af566b5f23e1c14": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
},
"3f8c1c7c5ebf4619a56928b2e1e9c383": {
"model_module": "@jupyter-widgets/controls",
"model_name": "DescriptionStyleModel",
"model_module_version": "1.5.0",
"state": {
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "DescriptionStyleModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "StyleView",
"description_width": ""
}
},
"bff16717ab2c45c184116cb96c0301d4": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HBoxModel",
"model_module_version": "1.5.0",
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "HBoxModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
"_view_name": "HBoxView",
"box_style": "",
"children": [
"IPY_MODEL_5b17b6ed8bd6494db2715f5fe7041856",
"IPY_MODEL_c7f50eac0b94486ca710099c8c0484b7",
"IPY_MODEL_e23fa22ce4dc46f0ac00e9e815d89a83"
],
"layout": "IPY_MODEL_d9b1d44b62e2472e9f83ba5497fa684b"
}
},
"5b17b6ed8bd6494db2715f5fe7041856": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HTMLModel",
"model_module_version": "1.5.0",
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "HTMLModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
"_view_name": "HTMLView",
"description": "",
"description_tooltip": null,
"layout": "IPY_MODEL_88ca130dcfcf4fcc9145d7ad68233156",
"placeholder": "​",
"style": "IPY_MODEL_77227d4f52714d8da08e8076121a9304",
"value": "model.safetensors: 100%"
}
},
"c7f50eac0b94486ca710099c8c0484b7": {
"model_module": "@jupyter-widgets/controls",
"model_name": "FloatProgressModel",
"model_module_version": "1.5.0",
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "FloatProgressModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
"_view_name": "ProgressView",
"bar_style": "success",
"description": "",
"description_tooltip": null,
"layout": "IPY_MODEL_453c7b8147364353bf2cd67aac35162f",
"max": 1519984962,
"min": 0,
"orientation": "horizontal",
"style": "IPY_MODEL_160d73334e6a463ca9ce3b977a6b43de",
"value": 1519984962
}
},
"e23fa22ce4dc46f0ac00e9e815d89a83": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HTMLModel",
"model_module_version": "1.5.0",
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "HTMLModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
"_view_name": "HTMLView",
"description": "",
"description_tooltip": null,
"layout": "IPY_MODEL_0f13035b4bc54099a6d8ebfed9da67c3",
"placeholder": "​",
"style": "IPY_MODEL_a2870fe2a5fd4e749583f7ea0216f536",
"value": " 1.52G/1.52G [00:11<00:00, 183MB/s]"
}
},
"d9b1d44b62e2472e9f83ba5497fa684b": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
},
"88ca130dcfcf4fcc9145d7ad68233156": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
},
"77227d4f52714d8da08e8076121a9304": {
"model_module": "@jupyter-widgets/controls",
"model_name": "DescriptionStyleModel",
"model_module_version": "1.5.0",
"state": {
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "DescriptionStyleModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "StyleView",
"description_width": ""
}
},
"453c7b8147364353bf2cd67aac35162f": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
},
"160d73334e6a463ca9ce3b977a6b43de": {
"model_module": "@jupyter-widgets/controls",
"model_name": "ProgressStyleModel",
"model_module_version": "1.5.0",
"state": {
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "ProgressStyleModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "StyleView",
"bar_color": null,
"description_width": ""
}
},
"0f13035b4bc54099a6d8ebfed9da67c3": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
},
"a2870fe2a5fd4e749583f7ea0216f536": {
"model_module": "@jupyter-widgets/controls",
"model_name": "DescriptionStyleModel",
"model_module_version": "1.5.0",
"state": {
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "DescriptionStyleModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "StyleView",
"description_width": ""
}
},
"d821f61c3c134acc99c03a2127ce3176": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HBoxModel",
"model_module_version": "1.5.0",
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "HBoxModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
"_view_name": "HBoxView",
"box_style": "",
"children": [
"IPY_MODEL_dff86d3249e642f28d85e84b6c5fb9e0",
"IPY_MODEL_74c68dcbed49437bae70c45f94782a82",
"IPY_MODEL_c97ced10fd0a49df8b1554ce2e371669"
],
"layout": "IPY_MODEL_4c298c4bbb974063a0407ef9bfadacca"
}
},
"dff86d3249e642f28d85e84b6c5fb9e0": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HTMLModel",
"model_module_version": "1.5.0",
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "HTMLModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
"_view_name": "HTMLView",
"description": "",
"description_tooltip": null,
"layout": "IPY_MODEL_4cce811700884180944c627ec096ba42",
"placeholder": "​",
"style": "IPY_MODEL_339fd6cb492745029f281723f9bd7298",
"value": "generation_config.json: 100%"
}
},
"74c68dcbed49437bae70c45f94782a82": {
"model_module": "@jupyter-widgets/controls",
"model_name": "FloatProgressModel",
"model_module_version": "1.5.0",
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "FloatProgressModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
"_view_name": "ProgressView",
"bar_style": "success",
"description": "",
"description_tooltip": null,
"layout": "IPY_MODEL_bc942c268beb49f9b76cb83c1ef0cac8",
"max": 124,
"min": 0,
"orientation": "horizontal",
"style": "IPY_MODEL_df8c39584e80433583ae01030763e463",
"value": 124
}
},
"c97ced10fd0a49df8b1554ce2e371669": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HTMLModel",
"model_module_version": "1.5.0",
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "HTMLModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
"_view_name": "HTMLView",
"description": "",
"description_tooltip": null,
"layout": "IPY_MODEL_de9a712c25eb4eaba4bae8f99c01d953",
"placeholder": "​",
"style": "IPY_MODEL_644bb0aadf3d446e85f02f6bfb94ee4d",
"value": " 124/124 [00:00<00:00, 7.82kB/s]"
}
},
"4c298c4bbb974063a0407ef9bfadacca": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
},
"4cce811700884180944c627ec096ba42": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
},
"339fd6cb492745029f281723f9bd7298": {
"model_module": "@jupyter-widgets/controls",
"model_name": "DescriptionStyleModel",
"model_module_version": "1.5.0",
"state": {
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "DescriptionStyleModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "StyleView",
"description_width": ""
}
},
"bc942c268beb49f9b76cb83c1ef0cac8": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
},
"df8c39584e80433583ae01030763e463": {
"model_module": "@jupyter-widgets/controls",
"model_name": "ProgressStyleModel",
"model_module_version": "1.5.0",
"state": {
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "ProgressStyleModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "StyleView",
"bar_color": null,
"description_width": ""
}
},
"de9a712c25eb4eaba4bae8f99c01d953": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
},
"644bb0aadf3d446e85f02f6bfb94ee4d": {
"model_module": "@jupyter-widgets/controls",
"model_name": "DescriptionStyleModel",
"model_module_version": "1.5.0",
"state": {
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "DescriptionStyleModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "StyleView",
"description_width": ""
}
},
"0c348bb0d5b84fd69414809aaffd3157": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HBoxModel",
"model_module_version": "1.5.0",
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "HBoxModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
"_view_name": "HBoxView",
"box_style": "",
"children": [
"IPY_MODEL_e238d3a0721441c9aa704955977225bf",
"IPY_MODEL_d338b6a3facf44038ae2c422a612417a",
"IPY_MODEL_c5a6bb2e549640c6ba355b156d4e95f8"
],
"layout": "IPY_MODEL_f2b4798f73cb4dc98576c1b75e2d3e18"
}
},
"e238d3a0721441c9aa704955977225bf": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HTMLModel",
"model_module_version": "1.5.0",
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "HTMLModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
"_view_name": "HTMLView",
"description": "",
"description_tooltip": null,
"layout": "IPY_MODEL_24a53f06b67b44c1a4860fc8b485fd32",
"placeholder": "​",
"style": "IPY_MODEL_1db6c011ab024d47b15239b6ed2d9a3b",
"value": "tokenizer_config.json: 100%"
}
},
"d338b6a3facf44038ae2c422a612417a": {
"model_module": "@jupyter-widgets/controls",
"model_name": "FloatProgressModel",
"model_module_version": "1.5.0",
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "FloatProgressModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
"_view_name": "ProgressView",
"bar_style": "success",
"description": "",
"description_tooltip": null,
"layout": "IPY_MODEL_618453aa3c384a0e81b3b38958d018e2",
"max": 26,
"min": 0,
"orientation": "horizontal",
"style": "IPY_MODEL_7b6b71135e5a4feb80b395f6a0ef77ca",
"value": 26
}
},
"c5a6bb2e549640c6ba355b156d4e95f8": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HTMLModel",
"model_module_version": "1.5.0",
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "HTMLModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
"_view_name": "HTMLView",
"description": "",
"description_tooltip": null,
"layout": "IPY_MODEL_e813507a82864a1bb5ce60258ec9ce50",
"placeholder": "​",
"style": "IPY_MODEL_a7808bd8550b4a95ada92083689ef01a",
"value": " 26.0/26.0 [00:00<00:00, 1.42kB/s]"
}
},
"f2b4798f73cb4dc98576c1b75e2d3e18": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
},
"24a53f06b67b44c1a4860fc8b485fd32": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
},
"1db6c011ab024d47b15239b6ed2d9a3b": {
"model_module": "@jupyter-widgets/controls",
"model_name": "DescriptionStyleModel",
"model_module_version": "1.5.0",
"state": {
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "DescriptionStyleModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "StyleView",
"description_width": ""
}
},
"618453aa3c384a0e81b3b38958d018e2": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
},
"7b6b71135e5a4feb80b395f6a0ef77ca": {
"model_module": "@jupyter-widgets/controls",
"model_name": "ProgressStyleModel",
"model_module_version": "1.5.0",
"state": {
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "ProgressStyleModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "StyleView",
"bar_color": null,
"description_width": ""
}
},
"e813507a82864a1bb5ce60258ec9ce50": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
},
"a7808bd8550b4a95ada92083689ef01a": {
"model_module": "@jupyter-widgets/controls",
"model_name": "DescriptionStyleModel",
"model_module_version": "1.5.0",
"state": {
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "DescriptionStyleModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "StyleView",
"description_width": ""
}
},
"fd6f88b3a0444675a6f969c685122169": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HBoxModel",
"model_module_version": "1.5.0",
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "HBoxModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
"_view_name": "HBoxView",
"box_style": "",
"children": [
"IPY_MODEL_a814a6343dbb458a9c1a71c745ba37bd",
"IPY_MODEL_dd76ce1c6ab4407db0c07ba7a6ebf21f",
"IPY_MODEL_782fe8b951b648a4bbaa9bd6518b3b9e"
],
"layout": "IPY_MODEL_3a05ef60b9694687b99c8eb32af51d45"
}
},
"a814a6343dbb458a9c1a71c745ba37bd": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HTMLModel",
"model_module_version": "1.5.0",
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "HTMLModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
"_view_name": "HTMLView",
"description": "",
"description_tooltip": null,
"layout": "IPY_MODEL_5d8d800069924b2093d17cbbc65efa02",
"placeholder": "​",
"style": "IPY_MODEL_82a657631afe4e40b98b3a27e1a4eb28",
"value": "vocab.json: 100%"
}
},
"dd76ce1c6ab4407db0c07ba7a6ebf21f": {
"model_module": "@jupyter-widgets/controls",
"model_name": "FloatProgressModel",
"model_module_version": "1.5.0",
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "FloatProgressModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
"_view_name": "ProgressView",
"bar_style": "success",
"description": "",
"description_tooltip": null,
"layout": "IPY_MODEL_03fc14c12b9c429ebd275c4a9cfa63a7",
"max": 1042301,
"min": 0,
"orientation": "horizontal",
"style": "IPY_MODEL_014085dd6a6242e0ad5f41e2d837c7ef",
"value": 1042301
}
},
"782fe8b951b648a4bbaa9bd6518b3b9e": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HTMLModel",
"model_module_version": "1.5.0",
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "HTMLModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
"_view_name": "HTMLView",
"description": "",
"description_tooltip": null,
"layout": "IPY_MODEL_f187ee7dc5864fdf81434076faf4ea72",
"placeholder": "​",
"style": "IPY_MODEL_2c5fa4b33a7c49dca42ee51c59fdf5f8",
"value": " 1.04M/1.04M [00:00<00:00, 13.2MB/s]"
}
},
"3a05ef60b9694687b99c8eb32af51d45": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
},
"5d8d800069924b2093d17cbbc65efa02": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
},
"82a657631afe4e40b98b3a27e1a4eb28": {
"model_module": "@jupyter-widgets/controls",
"model_name": "DescriptionStyleModel",
"model_module_version": "1.5.0",
"state": {
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "DescriptionStyleModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "StyleView",
"description_width": ""
}
},
"03fc14c12b9c429ebd275c4a9cfa63a7": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
},
"014085dd6a6242e0ad5f41e2d837c7ef": {
"model_module": "@jupyter-widgets/controls",
"model_name": "ProgressStyleModel",
"model_module_version": "1.5.0",
"state": {
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "ProgressStyleModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "StyleView",
"bar_color": null,
"description_width": ""
}
},
"f187ee7dc5864fdf81434076faf4ea72": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
},
"2c5fa4b33a7c49dca42ee51c59fdf5f8": {
"model_module": "@jupyter-widgets/controls",
"model_name": "DescriptionStyleModel",
"model_module_version": "1.5.0",
"state": {
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "DescriptionStyleModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "StyleView",
"description_width": ""
}
},
"f5da466bd5064322b7212edf94e4e909": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HBoxModel",
"model_module_version": "1.5.0",
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "HBoxModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
"_view_name": "HBoxView",
"box_style": "",
"children": [
"IPY_MODEL_37d316020f72474396a94dc933008f5d",
"IPY_MODEL_3c764ee93e4f4504acf465ca95fe8589",
"IPY_MODEL_d57d02edbfd949a1b6367dad22bce207"
],
"layout": "IPY_MODEL_8fa7adfb99f94fefb529c22659b5eeb4"
}
},
"37d316020f72474396a94dc933008f5d": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HTMLModel",
"model_module_version": "1.5.0",
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "HTMLModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
"_view_name": "HTMLView",
"description": "",
"description_tooltip": null,
"layout": "IPY_MODEL_8b5a121090bc4c4aafc0ada196331ab8",
"placeholder": "​",
"style": "IPY_MODEL_83218c0bb6b24b97a187a7e071396a57",
"value": "merges.txt: 100%"
}
},
"3c764ee93e4f4504acf465ca95fe8589": {
"model_module": "@jupyter-widgets/controls",
"model_name": "FloatProgressModel",
"model_module_version": "1.5.0",
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "FloatProgressModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
"_view_name": "ProgressView",
"bar_style": "success",
"description": "",
"description_tooltip": null,
"layout": "IPY_MODEL_0e65350063224fc6b2576a02ac8f94dd",
"max": 456318,
"min": 0,
"orientation": "horizontal",
"style": "IPY_MODEL_df9472b41e8741a8aa923378280c95db",
"value": 456318
}
},
"d57d02edbfd949a1b6367dad22bce207": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HTMLModel",
"model_module_version": "1.5.0",
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "HTMLModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
"_view_name": "HTMLView",
"description": "",
"description_tooltip": null,
"layout": "IPY_MODEL_ed6f98267f014aa7aa910c19f3f9b47a",
"placeholder": "​",
"style": "IPY_MODEL_aa6398d077dc4e17a1493b3d01e4b396",
"value": " 456k/456k [00:00<00:00, 13.7MB/s]"
}
},
"8fa7adfb99f94fefb529c22659b5eeb4": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
},
"8b5a121090bc4c4aafc0ada196331ab8": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
},
"83218c0bb6b24b97a187a7e071396a57": {
"model_module": "@jupyter-widgets/controls",
"model_name": "DescriptionStyleModel",
"model_module_version": "1.5.0",
"state": {
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "DescriptionStyleModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "StyleView",
"description_width": ""
}
},
"0e65350063224fc6b2576a02ac8f94dd": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
},
"df9472b41e8741a8aa923378280c95db": {
"model_module": "@jupyter-widgets/controls",
"model_name": "ProgressStyleModel",
"model_module_version": "1.5.0",
"state": {
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "ProgressStyleModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "StyleView",
"bar_color": null,
"description_width": ""
}
},
"ed6f98267f014aa7aa910c19f3f9b47a": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
},
"aa6398d077dc4e17a1493b3d01e4b396": {
"model_module": "@jupyter-widgets/controls",
"model_name": "DescriptionStyleModel",
"model_module_version": "1.5.0",
"state": {
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "DescriptionStyleModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "StyleView",
"description_width": ""
}
},
"31087ce143ad41e4b57c2a0aba8da5e4": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HBoxModel",
"model_module_version": "1.5.0",
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "HBoxModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
"_view_name": "HBoxView",
"box_style": "",
"children": [
"IPY_MODEL_c58668ce8d7b46b4b71a3bfd877e74d8",
"IPY_MODEL_44541efbca514545ba007dfb01c144e3",
"IPY_MODEL_7228f19608014a12b597979c966ec4d1"
],
"layout": "IPY_MODEL_d9f43306a3f94472b2a9accd53f59a4f"
}
},
"c58668ce8d7b46b4b71a3bfd877e74d8": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HTMLModel",
"model_module_version": "1.5.0",
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "HTMLModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
"_view_name": "HTMLView",
"description": "",
"description_tooltip": null,
"layout": "IPY_MODEL_2f792a7b2fb7402aae3ad7a84e04d0c0",
"placeholder": "​",
"style": "IPY_MODEL_a7495736ce2949e9b46186ebb53db72b",
"value": "tokenizer.json: 100%"
}
},
"44541efbca514545ba007dfb01c144e3": {
"model_module": "@jupyter-widgets/controls",
"model_name": "FloatProgressModel",
"model_module_version": "1.5.0",
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "FloatProgressModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
"_view_name": "ProgressView",
"bar_style": "success",
"description": "",
"description_tooltip": null,
"layout": "IPY_MODEL_ec185e6414ac47818cc382da79a56c30",
"max": 1355256,
"min": 0,
"orientation": "horizontal",
"style": "IPY_MODEL_2c7a18970cc44e97852a268a18850465",
"value": 1355256
}
},
"7228f19608014a12b597979c966ec4d1": {
"model_module": "@jupyter-widgets/controls",
"model_name": "HTMLModel",
"model_module_version": "1.5.0",
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "HTMLModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/controls",
"_view_module_version": "1.5.0",
"_view_name": "HTMLView",
"description": "",
"description_tooltip": null,
"layout": "IPY_MODEL_9dd9be8d29464f52ac2d4450283e9346",
"placeholder": "​",
"style": "IPY_MODEL_f39a38c9253c4a53918e2a163781ee58",
"value": " 1.36M/1.36M [00:00<00:00, 29.3MB/s]"
}
},
"d9f43306a3f94472b2a9accd53f59a4f": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
},
"2f792a7b2fb7402aae3ad7a84e04d0c0": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
},
"a7495736ce2949e9b46186ebb53db72b": {
"model_module": "@jupyter-widgets/controls",
"model_name": "DescriptionStyleModel",
"model_module_version": "1.5.0",
"state": {
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "DescriptionStyleModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "StyleView",
"description_width": ""
}
},
"ec185e6414ac47818cc382da79a56c30": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
},
"2c7a18970cc44e97852a268a18850465": {
"model_module": "@jupyter-widgets/controls",
"model_name": "ProgressStyleModel",
"model_module_version": "1.5.0",
"state": {
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "ProgressStyleModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "StyleView",
"bar_color": null,
"description_width": ""
}
},
"9dd9be8d29464f52ac2d4450283e9346": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
},
"f39a38c9253c4a53918e2a163781ee58": {
"model_module": "@jupyter-widgets/controls",
"model_name": "DescriptionStyleModel",
"model_module_version": "1.5.0",
"state": {
"_model_module": "@jupyter-widgets/controls",
"_model_module_version": "1.5.0",
"_model_name": "DescriptionStyleModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "StyleView",
"description_width": ""
}
},
"6daaa2b7370a4cd4bc4c5d5fa80d49c5": {
"model_module": "@jupyter-widgets/output",
"model_name": "OutputModel",
"model_module_version": "1.0.0",
"state": {
"_dom_classes": [],
"_model_module": "@jupyter-widgets/output",
"_model_module_version": "1.0.0",
"_model_name": "OutputModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/output",
"_view_module_version": "1.0.0",
"_view_name": "OutputView",
"layout": "IPY_MODEL_d415ff0a1782430d81a3328f821ea1c4",
"msg_id": "",
"outputs": [
{
"output_type": "display_data",
"data": {
"text/plain": "\u001b[37m╭─────────────────────────────────────────────────────────────────────────────────────────────────────────────────╮\u001b[0m\n\u001b[37m│\u001b[0m | OpenMAV v0.0.12 | model: gpt2-medium \u001b[37m│\u001b[0m\n\u001b[37m╰─────────────────────────────────────────────────────────────────────────────────────────────────────────────────╯\u001b[0m\n\u001b[35m╭─\u001b[0m\u001b[35m──────────────────────────────────────────────\u001b[0m\u001b[35m Attention Entropy \u001b[0m\u001b[35m──────────────────────────────────────────────\u001b[0m\u001b[35m─╮\u001b[0m\n\u001b[35m│\u001b[0m \u001b[1;37mLayer 1\u001b[0m | \u001b[1;33m:\u001b[0m [█████████████████████████████████████████████████ ] 4.0 \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[1;37mLayer 2\u001b[0m | \u001b[1;33m:\u001b[0m [██████████████████████████████████████████████████] 4.0 \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[1;37mLayer 3\u001b[0m | \u001b[1;33m:\u001b[0m [███████████████████████████████████ ] 2.8 \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[1;37mLayer 4\u001b[0m | \u001b[1;33m:\u001b[0m [████████████████████████████ ] 2.3 \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[1;37mLayer 5\u001b[0m | \u001b[1;33m:\u001b[0m [████████████████████████ ] 1.9 \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[1;37mLayer 6\u001b[0m | \u001b[1;33m:\u001b[0m [█████████████████████ ] 1.7 \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[1;37mLayer 7\u001b[0m | \u001b[1;33m:\u001b[0m [████████████████ ] 1.3 \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[1;37mLayer 8\u001b[0m | \u001b[1;33m:\u001b[0m [███████████████████ ] 1.6 \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[1;37mLayer 9\u001b[0m | \u001b[1;33m:\u001b[0m [█████████████████████████ ] 2.1 \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[1;37mLayer 10\u001b[0m | \u001b[1;33m:\u001b[0m [█████████████████ ] 1.4 \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[1;37mLayer 11\u001b[0m | \u001b[1;33m:\u001b[0m [███████████████████████ ] 1.9 \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[1;37mLayer 12\u001b[0m | \u001b[1;33m:\u001b[0m [█████████████████████ ] 1.7 \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[1;37mLayer 13\u001b[0m | \u001b[1;33m:\u001b[0m [██████████████████ ] 1.5 \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[1;37mLayer 14\u001b[0m | \u001b[1;33m:\u001b[0m [████████████████████ ] 1.6 \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[1;37mLayer 15\u001b[0m | \u001b[1;33m:\u001b[0m [██████████████████ ] 1.5 \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[1;37mLayer 16\u001b[0m | \u001b[1;33m:\u001b[0m [██████████████████████████ ] 2.1 \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[1;37mLayer 17\u001b[0m | \u001b[1;33m:\u001b[0m [███████████████████ ] 1.6 \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[1;37mLayer 18\u001b[0m | \u001b[1;33m:\u001b[0m [██████████████████████ ] 1.8 \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[1;37mLayer 19\u001b[0m | \u001b[1;33m:\u001b[0m [███████████████████ ] 1.6 \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[1;37mLayer 20\u001b[0m | \u001b[1;33m:\u001b[0m [███████████████████████ ] 1.8 \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[1;37mLayer 21\u001b[0m | \u001b[1;33m:\u001b[0m [███████████████████████ ] 1.8 \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[1;37mLayer 22\u001b[0m | \u001b[1;33m:\u001b[0m [██████████████████ ] 1.5 \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[1;37mLayer 23\u001b[0m | \u001b[1;33m:\u001b[0m [███████████████████████████████ ] 2.5 \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[1;37mLayer 24\u001b[0m | \u001b[1;33m:\u001b[0m [██████████████████████████████████████ ] 3.1 \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m│\u001b[0m \u001b[35m│\u001b[0m\n\u001b[35m╰─────────────────────────────────────────────────────────────────────────────────────────────────────────────────╯\u001b[0m\n",
"text/html": "<pre style=\"white-space:pre;overflow-x:auto;line-height:normal;font-family:Menlo,'DejaVu Sans Mono',consolas,'Courier New',monospace\"><span style=\"color: #c0c0c0; text-decoration-color: #c0c0c0\">╭─────────────────────────────────────────────────────────────────────────────────────────────────────────────────╮</span>\n<span style=\"color: #c0c0c0; text-decoration-color: #c0c0c0\">│</span> | OpenMAV v0.0.12 | model: gpt2-medium <span style=\"color: #c0c0c0; text-decoration-color: #c0c0c0\">│</span>\n<span style=\"color: #c0c0c0; text-decoration-color: #c0c0c0\">╰─────────────────────────────────────────────────────────────────────────────────────────────────────────────────╯</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">╭─────────────────────────────────────────────── Attention Entropy ───────────────────────────────────────────────╮</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #c0c0c0; text-decoration-color: #c0c0c0; font-weight: bold\">Layer 1</span> | <span style=\"color: #808000; text-decoration-color: #808000; font-weight: bold\">:</span> [█████████████████████████████████████████████████ ] 4.0 <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #c0c0c0; text-decoration-color: #c0c0c0; font-weight: bold\">Layer 2</span> | <span style=\"color: #808000; text-decoration-color: #808000; font-weight: bold\">:</span> [██████████████████████████████████████████████████] 4.0 <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #c0c0c0; text-decoration-color: #c0c0c0; font-weight: bold\">Layer 3</span> | <span style=\"color: #808000; text-decoration-color: #808000; font-weight: bold\">:</span> [███████████████████████████████████ ] 2.8 <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #c0c0c0; text-decoration-color: #c0c0c0; font-weight: bold\">Layer 4</span> | <span style=\"color: #808000; text-decoration-color: #808000; font-weight: bold\">:</span> [████████████████████████████ ] 2.3 <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #c0c0c0; text-decoration-color: #c0c0c0; font-weight: bold\">Layer 5</span> | <span style=\"color: #808000; text-decoration-color: #808000; font-weight: bold\">:</span> [████████████████████████ ] 1.9 <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #c0c0c0; text-decoration-color: #c0c0c0; font-weight: bold\">Layer 6</span> | <span style=\"color: #808000; text-decoration-color: #808000; font-weight: bold\">:</span> [█████████████████████ ] 1.7 <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #c0c0c0; text-decoration-color: #c0c0c0; font-weight: bold\">Layer 7</span> | <span style=\"color: #808000; text-decoration-color: #808000; font-weight: bold\">:</span> [████████████████ ] 1.3 <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #c0c0c0; text-decoration-color: #c0c0c0; font-weight: bold\">Layer 8</span> | <span style=\"color: #808000; text-decoration-color: #808000; font-weight: bold\">:</span> [███████████████████ ] 1.6 <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #c0c0c0; text-decoration-color: #c0c0c0; font-weight: bold\">Layer 9</span> | <span style=\"color: #808000; text-decoration-color: #808000; font-weight: bold\">:</span> [█████████████████████████ ] 2.1 <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #c0c0c0; text-decoration-color: #c0c0c0; font-weight: bold\">Layer 10</span> | <span style=\"color: #808000; text-decoration-color: #808000; font-weight: bold\">:</span> [█████████████████ ] 1.4 <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #c0c0c0; text-decoration-color: #c0c0c0; font-weight: bold\">Layer 11</span> | <span style=\"color: #808000; text-decoration-color: #808000; font-weight: bold\">:</span> [███████████████████████ ] 1.9 <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #c0c0c0; text-decoration-color: #c0c0c0; font-weight: bold\">Layer 12</span> | <span style=\"color: #808000; text-decoration-color: #808000; font-weight: bold\">:</span> [█████████████████████ ] 1.7 <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #c0c0c0; text-decoration-color: #c0c0c0; font-weight: bold\">Layer 13</span> | <span style=\"color: #808000; text-decoration-color: #808000; font-weight: bold\">:</span> [██████████████████ ] 1.5 <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #c0c0c0; text-decoration-color: #c0c0c0; font-weight: bold\">Layer 14</span> | <span style=\"color: #808000; text-decoration-color: #808000; font-weight: bold\">:</span> [████████████████████ ] 1.6 <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #c0c0c0; text-decoration-color: #c0c0c0; font-weight: bold\">Layer 15</span> | <span style=\"color: #808000; text-decoration-color: #808000; font-weight: bold\">:</span> [██████████████████ ] 1.5 <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #c0c0c0; text-decoration-color: #c0c0c0; font-weight: bold\">Layer 16</span> | <span style=\"color: #808000; text-decoration-color: #808000; font-weight: bold\">:</span> [██████████████████████████ ] 2.1 <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #c0c0c0; text-decoration-color: #c0c0c0; font-weight: bold\">Layer 17</span> | <span style=\"color: #808000; text-decoration-color: #808000; font-weight: bold\">:</span> [███████████████████ ] 1.6 <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #c0c0c0; text-decoration-color: #c0c0c0; font-weight: bold\">Layer 18</span> | <span style=\"color: #808000; text-decoration-color: #808000; font-weight: bold\">:</span> [██████████████████████ ] 1.8 <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #c0c0c0; text-decoration-color: #c0c0c0; font-weight: bold\">Layer 19</span> | <span style=\"color: #808000; text-decoration-color: #808000; font-weight: bold\">:</span> [███████████████████ ] 1.6 <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #c0c0c0; text-decoration-color: #c0c0c0; font-weight: bold\">Layer 20</span> | <span style=\"color: #808000; text-decoration-color: #808000; font-weight: bold\">:</span> [███████████████████████ ] 1.8 <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #c0c0c0; text-decoration-color: #c0c0c0; font-weight: bold\">Layer 21</span> | <span style=\"color: #808000; text-decoration-color: #808000; font-weight: bold\">:</span> [███████████████████████ ] 1.8 <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #c0c0c0; text-decoration-color: #c0c0c0; font-weight: bold\">Layer 22</span> | <span style=\"color: #808000; text-decoration-color: #808000; font-weight: bold\">:</span> [██████████████████ ] 1.5 <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #c0c0c0; text-decoration-color: #c0c0c0; font-weight: bold\">Layer 23</span> | <span style=\"color: #808000; text-decoration-color: #808000; font-weight: bold\">:</span> [███████████████████████████████ ] 2.5 <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #c0c0c0; text-decoration-color: #c0c0c0; font-weight: bold\">Layer 24</span> | <span style=\"color: #808000; text-decoration-color: #808000; font-weight: bold\">:</span> [██████████████████████████████████████ ] 3.1 <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">│</span> <span style=\"color: #800080; text-decoration-color: #800080\">│</span>\n<span style=\"color: #800080; text-decoration-color: #800080\">╰─────────────────────────────────────────────────────────────────────────────────────────────────────────────────╯</span>\n</pre>\n"
},
"metadata": {}
}
]
}
},
"d415ff0a1782430d81a3328f821ea1c4": {
"model_module": "@jupyter-widgets/base",
"model_name": "LayoutModel",
"model_module_version": "1.2.0",
"state": {
"_model_module": "@jupyter-widgets/base",
"_model_module_version": "1.2.0",
"_model_name": "LayoutModel",
"_view_count": null,
"_view_module": "@jupyter-widgets/base",
"_view_module_version": "1.2.0",
"_view_name": "LayoutView",
"align_content": null,
"align_items": null,
"align_self": null,
"border": null,
"bottom": null,
"display": null,
"flex": null,
"flex_flow": null,
"grid_area": null,
"grid_auto_columns": null,
"grid_auto_flow": null,
"grid_auto_rows": null,
"grid_column": null,
"grid_gap": null,
"grid_row": null,
"grid_template_areas": null,
"grid_template_columns": null,
"grid_template_rows": null,
"height": null,
"justify_content": null,
"justify_items": null,
"left": null,
"margin": null,
"max_height": null,
"max_width": null,
"min_height": null,
"min_width": null,
"object_fit": null,
"object_position": null,
"order": null,
"overflow": null,
"overflow_x": null,
"overflow_y": null,
"padding": null,
"right": null,
"top": null,
"visibility": null,
"width": null
}
}
}
}
},
"cells": [
{
"cell_type": "markdown",
"metadata": {
"id": "view-in-github",
"colab_type": "text"
},
"source": [
"<a href=\"https://colab.research.google.com/gist/attentionmech/06d7852d8c7b21cb962ae006867cfe15/attention-entropy.ipynb\" target=\"_parent\"><img src=\"https://colab.research.google.com/assets/colab-badge.svg\" alt=\"Open In Colab\"/></a>"
]
},
{
"cell_type": "code",
"execution_count": null,
"metadata": {
"colab": {
"base_uri": "https://localhost:8080/"
},
"id": "WoVpfgsQrIvn",
"outputId": "00974d11-0e8c-4198-9153-de00896431d9"
},
"outputs": [
{
"output_type": "stream",
"name": "stdout",
"text": [
"\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m363.4/363.4 MB\u001b[0m \u001b[31m4.3 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
"\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m13.8/13.8 MB\u001b[0m \u001b[31m63.1 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
"\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m24.6/24.6 MB\u001b[0m \u001b[31m46.1 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
"\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m883.7/883.7 kB\u001b[0m \u001b[31m28.5 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
"\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m664.8/664.8 MB\u001b[0m \u001b[31m2.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
"\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m211.5/211.5 MB\u001b[0m \u001b[31m5.3 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
"\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m56.3/56.3 MB\u001b[0m \u001b[31m12.0 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
"\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m127.9/127.9 MB\u001b[0m \u001b[31m7.3 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
"\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m207.5/207.5 MB\u001b[0m \u001b[31m6.1 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
"\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m21.1/21.1 MB\u001b[0m \u001b[31m78.8 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
"\u001b[?25h"
]
}
],
"source": [
"!python -m pip install -q openmav"
]
},
{
"cell_type": "code",
"source": [
"from openmav.mav import MAV\n",
"\n",
"MAV(\"gpt2-medium\",\"once upon a time\", selected_panels=[\"attention_entropy\"], num_grid_rows=1)"
],
"metadata": {
"colab": {
"base_uri": "https://localhost:8080/",
"height": 1000,
"referenced_widgets": [
"993781067b5a419db89499a81830f9e5",
"d6429ffb94f74936b2351a6f61c1b4bd",
"24458918a26040328739dba11c33d170",
"5abf230fda73431487ba3791f2feabdd",
"b26db6bc2ad14d61b6472b3dfd571461",
"398bcaa52582409da75567844a0d06f8",
"6b4b055317724d05869243a13b3239b5",
"b6b5a02ea1434740874f45b3d2b878d3",
"28a5e9ea489b4cc5a422c019663965cd",
"e0e645b02e194e579af566b5f23e1c14",
"3f8c1c7c5ebf4619a56928b2e1e9c383",
"bff16717ab2c45c184116cb96c0301d4",
"5b17b6ed8bd6494db2715f5fe7041856",
"c7f50eac0b94486ca710099c8c0484b7",
"e23fa22ce4dc46f0ac00e9e815d89a83",
"d9b1d44b62e2472e9f83ba5497fa684b",
"88ca130dcfcf4fcc9145d7ad68233156",
"77227d4f52714d8da08e8076121a9304",
"453c7b8147364353bf2cd67aac35162f",
"160d73334e6a463ca9ce3b977a6b43de",
"0f13035b4bc54099a6d8ebfed9da67c3",
"a2870fe2a5fd4e749583f7ea0216f536",
"d821f61c3c134acc99c03a2127ce3176",
"dff86d3249e642f28d85e84b6c5fb9e0",
"74c68dcbed49437bae70c45f94782a82",
"c97ced10fd0a49df8b1554ce2e371669",
"4c298c4bbb974063a0407ef9bfadacca",
"4cce811700884180944c627ec096ba42",
"339fd6cb492745029f281723f9bd7298",
"bc942c268beb49f9b76cb83c1ef0cac8",
"df8c39584e80433583ae01030763e463",
"de9a712c25eb4eaba4bae8f99c01d953",
"644bb0aadf3d446e85f02f6bfb94ee4d",
"0c348bb0d5b84fd69414809aaffd3157",
"e238d3a0721441c9aa704955977225bf",
"d338b6a3facf44038ae2c422a612417a",
"c5a6bb2e549640c6ba355b156d4e95f8",
"f2b4798f73cb4dc98576c1b75e2d3e18",
"24a53f06b67b44c1a4860fc8b485fd32",
"1db6c011ab024d47b15239b6ed2d9a3b",
"618453aa3c384a0e81b3b38958d018e2",
"7b6b71135e5a4feb80b395f6a0ef77ca",
"e813507a82864a1bb5ce60258ec9ce50",
"a7808bd8550b4a95ada92083689ef01a",
"fd6f88b3a0444675a6f969c685122169",
"a814a6343dbb458a9c1a71c745ba37bd",
"dd76ce1c6ab4407db0c07ba7a6ebf21f",
"782fe8b951b648a4bbaa9bd6518b3b9e",
"3a05ef60b9694687b99c8eb32af51d45",
"5d8d800069924b2093d17cbbc65efa02",
"82a657631afe4e40b98b3a27e1a4eb28",
"03fc14c12b9c429ebd275c4a9cfa63a7",
"014085dd6a6242e0ad5f41e2d837c7ef",
"f187ee7dc5864fdf81434076faf4ea72",
"2c5fa4b33a7c49dca42ee51c59fdf5f8",
"f5da466bd5064322b7212edf94e4e909",
"37d316020f72474396a94dc933008f5d",
"3c764ee93e4f4504acf465ca95fe8589",
"d57d02edbfd949a1b6367dad22bce207",
"8fa7adfb99f94fefb529c22659b5eeb4",
"8b5a121090bc4c4aafc0ada196331ab8",
"83218c0bb6b24b97a187a7e071396a57",
"0e65350063224fc6b2576a02ac8f94dd",
"df9472b41e8741a8aa923378280c95db",
"ed6f98267f014aa7aa910c19f3f9b47a",
"aa6398d077dc4e17a1493b3d01e4b396",
"31087ce143ad41e4b57c2a0aba8da5e4",
"c58668ce8d7b46b4b71a3bfd877e74d8",
"44541efbca514545ba007dfb01c144e3",
"7228f19608014a12b597979c966ec4d1",
"d9f43306a3f94472b2a9accd53f59a4f",
"2f792a7b2fb7402aae3ad7a84e04d0c0",
"a7495736ce2949e9b46186ebb53db72b",
"ec185e6414ac47818cc382da79a56c30",
"2c7a18970cc44e97852a268a18850465",
"9dd9be8d29464f52ac2d4450283e9346",
"f39a38c9253c4a53918e2a163781ee58",
"6daaa2b7370a4cd4bc4c5d5fa80d49c5",
"d415ff0a1782430d81a3328f821ea1c4"
]
},
"id": "k-kdhVqjrab7",
"outputId": "256f2917-3396-4f03-c048-9cb65cd1133f"
},
"execution_count": null,
"outputs": [
{
"output_type": "display_data",
"data": {
"text/plain": [
"config.json: 0%| | 0.00/718 [00:00<?, ?B/s]"
],
"application/vnd.jupyter.widget-view+json": {
"version_major": 2,
"version_minor": 0,
"model_id": "993781067b5a419db89499a81830f9e5"
}
},
"metadata": {}
},
{
"output_type": "display_data",
"data": {
"text/plain": [
"model.safetensors: 0%| | 0.00/1.52G [00:00<?, ?B/s]"
],
"application/vnd.jupyter.widget-view+json": {
"version_major": 2,
"version_minor": 0,
"model_id": "bff16717ab2c45c184116cb96c0301d4"
}
},
"metadata": {}
},
{
"output_type": "display_data",
"data": {
"text/plain": [
"generation_config.json: 0%| | 0.00/124 [00:00<?, ?B/s]"
],
"application/vnd.jupyter.widget-view+json": {
"version_major": 2,
"version_minor": 0,
"model_id": "d821f61c3c134acc99c03a2127ce3176"
}
},
"metadata": {}
},
{
"output_type": "display_data",
"data": {
"text/plain": [
"tokenizer_config.json: 0%| | 0.00/26.0 [00:00<?, ?B/s]"
],
"application/vnd.jupyter.widget-view+json": {
"version_major": 2,
"version_minor": 0,
"model_id": "0c348bb0d5b84fd69414809aaffd3157"
}
},
"metadata": {}
},
{
"output_type": "display_data",
"data": {
"text/plain": [
"vocab.json: 0%| | 0.00/1.04M [00:00<?, ?B/s]"
],
"application/vnd.jupyter.widget-view+json": {
"version_major": 2,
"version_minor": 0,
"model_id": "fd6f88b3a0444675a6f969c685122169"
}
},
"metadata": {}
},
{
"output_type": "display_data",
"data": {
"text/plain": [
"merges.txt: 0%| | 0.00/456k [00:00<?, ?B/s]"
],
"application/vnd.jupyter.widget-view+json": {
"version_major": 2,
"version_minor": 0,
"model_id": "f5da466bd5064322b7212edf94e4e909"
}
},
"metadata": {}
},
{
"output_type": "display_data",
"data": {
"text/plain": [
"tokenizer.json: 0%| | 0.00/1.36M [00:00<?, ?B/s]"
],
"application/vnd.jupyter.widget-view+json": {
"version_major": 2,
"version_minor": 0,
"model_id": "31087ce143ad41e4b57c2a0aba8da5e4"
}
},
"metadata": {}
},
{
"output_type": "stream",
"name": "stderr",
"text": [
"The attention mask is not set and cannot be inferred from input because pad token is same as eos token. As a consequence, you may observe unexpected behavior. Please pass your input's `attention_mask` to obtain reliable results.\n"
]
},
{
"output_type": "display_data",
"data": {
"text/plain": [
"Output()"
],
"application/vnd.jupyter.widget-view+json": {
"version_major": 2,
"version_minor": 0,
"model_id": "6daaa2b7370a4cd4bc4c5d5fa80d49c5"
}
},
"metadata": {}
},
{
"output_type": "display_data",
"data": {
"text/plain": [],
"text/html": [
"<pre style=\"white-space:pre;overflow-x:auto;line-height:normal;font-family:Menlo,'DejaVu Sans Mono',consolas,'Courier New',monospace\"></pre>\n"
]
},
"metadata": {}
},
{
"output_type": "error",
"ename": "KeyboardInterrupt",
"evalue": "",
"traceback": [
"\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
"\u001b[0;31mKeyboardInterrupt\u001b[0m Traceback (most recent call last)",
"\u001b[0;32m<ipython-input-3-a7efc84f8e42>\u001b[0m in \u001b[0;36m<cell line: 0>\u001b[0;34m()\u001b[0m\n\u001b[1;32m 1\u001b[0m \u001b[0;32mfrom\u001b[0m \u001b[0mopenmav\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mmav\u001b[0m \u001b[0;32mimport\u001b[0m \u001b[0mMAV\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 2\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m----> 3\u001b[0;31m \u001b[0mMAV\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m\"gpt2-medium\"\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\"once upon a time\"\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mselected_panels\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;34m\"attention_entropy\"\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mnum_grid_rows\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;36m1\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m",
"\u001b[0;32m/usr/local/lib/python3.11/dist-packages/openmav/mav.py\u001b[0m in \u001b[0;36mMAV\u001b[0;34m(model, prompt, max_new_tokens, limit_chars, temp, top_k, top_p, min_p, repetition_penalty, aggregation, refresh_rate, interactive, selected_panels, num_grid_rows, max_bar_length, device, scale, backend, seed, model_obj, tokenizer_obj, external_panels)\u001b[0m\n\u001b[1;32m 96\u001b[0m )\n\u001b[1;32m 97\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m---> 98\u001b[0;31m \u001b[0mmanager\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mstate_loop\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mprompt\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 99\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 100\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n",
"\u001b[0;32m/usr/local/lib/python3.11/dist-packages/openmav/view/main_loop_manager.py\u001b[0m in \u001b[0;36mstate_loop\u001b[0;34m(self, prompt)\u001b[0m\n\u001b[1;32m 72\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 73\u001b[0m \u001b[0;32mtry\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m---> 74\u001b[0;31m for data in self.state_provider.fetch_next(\n\u001b[0m\u001b[1;32m 75\u001b[0m \u001b[0mprompt\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 76\u001b[0m \u001b[0mtemperature\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mtemperature\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
"\u001b[0;32m/usr/local/lib/python3.11/dist-packages/openmav/processors/state_fetcher.py\u001b[0m in \u001b[0;36mfetch_next\u001b[0;34m(self, prompt, temperature, top_k, top_p, min_p, repetition_penalty)\u001b[0m\n\u001b[1;32m 41\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 42\u001b[0m \u001b[0;32mfor\u001b[0m \u001b[0m_\u001b[0m \u001b[0;32min\u001b[0m \u001b[0mrange\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mmax_new_tokens\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m---> 43\u001b[0;31m outputs = self.backend.generate(\n\u001b[0m\u001b[1;32m 44\u001b[0m \u001b[0mgenerated_ids\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 45\u001b[0m \u001b[0mtemperature\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mtemperature\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
"\u001b[0;32m/usr/local/lib/python3.11/dist-packages/openmav/backends/model_backend_transformers.py\u001b[0m in \u001b[0;36mgenerate\u001b[0;34m(self, input_ids, temperature, top_k, top_p, min_p, repetition_penalty)\u001b[0m\n\u001b[1;32m 63\u001b[0m \u001b[0minput_tensor\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mtorch\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mtensor\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0minput_ids\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mto\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mdevice\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 64\u001b[0m \u001b[0;32mwith\u001b[0m \u001b[0mtorch\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mno_grad\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m---> 65\u001b[0;31m outputs = self.model.generate(\n\u001b[0m\u001b[1;32m 66\u001b[0m \u001b[0minput_tensor\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 67\u001b[0m \u001b[0mdo_sample\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mtemperature\u001b[0m \u001b[0;34m>\u001b[0m \u001b[0;36m0\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
"\u001b[0;32m/usr/local/lib/python3.11/dist-packages/torch/utils/_contextlib.py\u001b[0m in \u001b[0;36mdecorate_context\u001b[0;34m(*args, **kwargs)\u001b[0m\n\u001b[1;32m 114\u001b[0m \u001b[0;32mdef\u001b[0m \u001b[0mdecorate_context\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m*\u001b[0m\u001b[0margs\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m**\u001b[0m\u001b[0mkwargs\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 115\u001b[0m \u001b[0;32mwith\u001b[0m \u001b[0mctx_factory\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 116\u001b[0;31m \u001b[0;32mreturn\u001b[0m \u001b[0mfunc\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m*\u001b[0m\u001b[0margs\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m**\u001b[0m\u001b[0mkwargs\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 117\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 118\u001b[0m \u001b[0;32mreturn\u001b[0m \u001b[0mdecorate_context\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
"\u001b[0;32m/usr/local/lib/python3.11/dist-packages/transformers/generation/utils.py\u001b[0m in \u001b[0;36mgenerate\u001b[0;34m(self, inputs, generation_config, logits_processor, stopping_criteria, prefix_allowed_tokens_fn, synced_gpus, assistant_model, streamer, negative_prompt_ids, negative_prompt_attention_mask, use_model_defaults, **kwargs)\u001b[0m\n\u001b[1;32m 2324\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 2325\u001b[0m \u001b[0;31m# 12. run sample (it degenerates to greedy search when `generation_config.do_sample=False`)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m-> 2326\u001b[0;31m result = self._sample(\n\u001b[0m\u001b[1;32m 2327\u001b[0m \u001b[0minput_ids\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 2328\u001b[0m \u001b[0mlogits_processor\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mprepared_logits_processor\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
"\u001b[0;32m/usr/local/lib/python3.11/dist-packages/transformers/generation/utils.py\u001b[0m in \u001b[0;36m_sample\u001b[0;34m(self, input_ids, logits_processor, stopping_criteria, generation_config, synced_gpus, streamer, **model_kwargs)\u001b[0m\n\u001b[1;32m 3284\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 3285\u001b[0m \u001b[0;32mif\u001b[0m \u001b[0mis_prefill\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m-> 3286\u001b[0;31m \u001b[0moutputs\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m**\u001b[0m\u001b[0mmodel_inputs\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mreturn_dict\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;32mTrue\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 3287\u001b[0m \u001b[0mis_prefill\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;32mFalse\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 3288\u001b[0m \u001b[0;32melse\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
"\u001b[0;32m/usr/local/lib/python3.11/dist-packages/torch/nn/modules/module.py\u001b[0m in \u001b[0;36m_wrapped_call_impl\u001b[0;34m(self, *args, **kwargs)\u001b[0m\n\u001b[1;32m 1737\u001b[0m \u001b[0;32mreturn\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_compiled_call_impl\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m*\u001b[0m\u001b[0margs\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m**\u001b[0m\u001b[0mkwargs\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;31m# type: ignore[misc]\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 1738\u001b[0m \u001b[0;32melse\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m-> 1739\u001b[0;31m \u001b[0;32mreturn\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_call_impl\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m*\u001b[0m\u001b[0margs\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m**\u001b[0m\u001b[0mkwargs\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 1740\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 1741\u001b[0m \u001b[0;31m# torchrec tests the code consistency with the following code\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
"\u001b[0;32m/usr/local/lib/python3.11/dist-packages/torch/nn/modules/module.py\u001b[0m in \u001b[0;36m_call_impl\u001b[0;34m(self, *args, **kwargs)\u001b[0m\n\u001b[1;32m 1748\u001b[0m \u001b[0;32mor\u001b[0m \u001b[0m_global_backward_pre_hooks\u001b[0m \u001b[0;32mor\u001b[0m \u001b[0m_global_backward_hooks\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 1749\u001b[0m or _global_forward_hooks or _global_forward_pre_hooks):\n\u001b[0;32m-> 1750\u001b[0;31m \u001b[0;32mreturn\u001b[0m \u001b[0mforward_call\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m*\u001b[0m\u001b[0margs\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m**\u001b[0m\u001b[0mkwargs\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 1751\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 1752\u001b[0m \u001b[0mresult\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
"\u001b[0;32m/usr/local/lib/python3.11/dist-packages/transformers/models/gpt2/modeling_gpt2.py\u001b[0m in \u001b[0;36mforward\u001b[0;34m(self, input_ids, past_key_values, attention_mask, token_type_ids, position_ids, head_mask, inputs_embeds, encoder_hidden_states, encoder_attention_mask, labels, use_cache, output_attentions, output_hidden_states, return_dict, **kwargs)\u001b[0m\n\u001b[1;32m 1082\u001b[0m \u001b[0mhidden_states\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mhidden_states\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mto\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mlm_head\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mweight\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mdevice\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 1083\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m-> 1084\u001b[0;31m \u001b[0mlm_logits\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mlm_head\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mhidden_states\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 1085\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 1086\u001b[0m \u001b[0mloss\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
"\u001b[0;32m/usr/local/lib/python3.11/dist-packages/torch/nn/modules/module.py\u001b[0m in \u001b[0;36m_wrapped_call_impl\u001b[0;34m(self, *args, **kwargs)\u001b[0m\n\u001b[1;32m 1737\u001b[0m \u001b[0;32mreturn\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_compiled_call_impl\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m*\u001b[0m\u001b[0margs\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m**\u001b[0m\u001b[0mkwargs\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;31m# type: ignore[misc]\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 1738\u001b[0m \u001b[0;32melse\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m-> 1739\u001b[0;31m \u001b[0;32mreturn\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_call_impl\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m*\u001b[0m\u001b[0margs\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m**\u001b[0m\u001b[0mkwargs\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 1740\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 1741\u001b[0m \u001b[0;31m# torchrec tests the code consistency with the following code\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
"\u001b[0;32m/usr/local/lib/python3.11/dist-packages/torch/nn/modules/module.py\u001b[0m in \u001b[0;36m_call_impl\u001b[0;34m(self, *args, **kwargs)\u001b[0m\n\u001b[1;32m 1748\u001b[0m \u001b[0;32mor\u001b[0m \u001b[0m_global_backward_pre_hooks\u001b[0m \u001b[0;32mor\u001b[0m \u001b[0m_global_backward_hooks\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 1749\u001b[0m or _global_forward_hooks or _global_forward_pre_hooks):\n\u001b[0;32m-> 1750\u001b[0;31m \u001b[0;32mreturn\u001b[0m \u001b[0mforward_call\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m*\u001b[0m\u001b[0margs\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m**\u001b[0m\u001b[0mkwargs\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 1751\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 1752\u001b[0m \u001b[0mresult\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
"\u001b[0;32m/usr/local/lib/python3.11/dist-packages/torch/nn/modules/linear.py\u001b[0m in \u001b[0;36mforward\u001b[0;34m(self, input)\u001b[0m\n\u001b[1;32m 123\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 124\u001b[0m \u001b[0;32mdef\u001b[0m \u001b[0mforward\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0minput\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mTensor\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;34m->\u001b[0m \u001b[0mTensor\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 125\u001b[0;31m \u001b[0;32mreturn\u001b[0m \u001b[0mF\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mlinear\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0minput\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mweight\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mbias\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 126\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 127\u001b[0m \u001b[0;32mdef\u001b[0m \u001b[0mextra_repr\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;34m->\u001b[0m \u001b[0mstr\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
"\u001b[0;31mKeyboardInterrupt\u001b[0m: "
]
}
]
},
{
"cell_type": "code",
"source": [],
"metadata": {
"id": "biELPlICsPVt"
},
"execution_count": null,
"outputs": []
}
]
}
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment