diff --git "a/tester_colab.ipynb" "b/tester_colab.ipynb" new file mode 100644--- /dev/null +++ "b/tester_colab.ipynb" @@ -0,0 +1,1798 @@ +{ + "nbformat": 4, + "nbformat_minor": 0, + "metadata": { + "colab": { + "provenance": [] + }, + "kernelspec": { + "name": "python3", + "display_name": "Python 3" + }, + "language_info": { + "name": "python" + }, + "widgets": { + "application/vnd.jupyter.widget-state+json": { + "65c70bc500eb48f5a3f664634c9abcb8": { + "model_module": "@jupyter-widgets/controls", + "model_name": "HBoxModel", + "model_module_version": "1.5.0", + "state": { + "_dom_classes": [], + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "HBoxModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/controls", + "_view_module_version": "1.5.0", + "_view_name": "HBoxView", + "box_style": "", + "children": [ + "IPY_MODEL_e03b82ed14aa4f72a98fb62f1b9c1772", + "IPY_MODEL_53daa6d66f3644a2836c1f6e5fefbec2", + "IPY_MODEL_4dd5a724ed7d4fa4ba53723176e008b3" + ], + "layout": "IPY_MODEL_7452489dd0df4407b70ab4e00f5a3647" + } + }, + "e03b82ed14aa4f72a98fb62f1b9c1772": { + "model_module": "@jupyter-widgets/controls", + "model_name": "HTMLModel", + "model_module_version": "1.5.0", + "state": { + "_dom_classes": [], + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "HTMLModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/controls", + "_view_module_version": "1.5.0", + "_view_name": "HTMLView", + "description": "", + "description_tooltip": null, + "layout": "IPY_MODEL_29229fdd1a7840099d95a7d0f9164a37", + "placeholder": "​", + "style": "IPY_MODEL_917f0a55fb974d3dae0b6ce1cf9cf431", + "value": "100%" + } + }, + "53daa6d66f3644a2836c1f6e5fefbec2": { + "model_module": "@jupyter-widgets/controls", + "model_name": "FloatProgressModel", + "model_module_version": "1.5.0", + "state": { + "_dom_classes": [], + "_model_module": "@jupyter-widgets/controls", + 
"_model_module_version": "1.5.0", + "_model_name": "FloatProgressModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/controls", + "_view_module_version": "1.5.0", + "_view_name": "ProgressView", + "bar_style": "success", + "description": "", + "description_tooltip": null, + "layout": "IPY_MODEL_4f2dde1811344bf8b6a2c5630107b27c", + "max": 93171529, + "min": 0, + "orientation": "horizontal", + "style": "IPY_MODEL_d8cf02c364984d77a6d0f104468493fe", + "value": 93171529 + } + }, + "4dd5a724ed7d4fa4ba53723176e008b3": { + "model_module": "@jupyter-widgets/controls", + "model_name": "HTMLModel", + "model_module_version": "1.5.0", + "state": { + "_dom_classes": [], + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "HTMLModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/controls", + "_view_module_version": "1.5.0", + "_view_name": "HTMLView", + "description": "", + "description_tooltip": null, + "layout": "IPY_MODEL_283cb331d5be41a6a2804804ab4157f8", + "placeholder": "​", + "style": "IPY_MODEL_8dea68cdeab940c6a8848b29fb0acc15", + "value": " 88.9M/88.9M [00:01<00:00, 108MB/s]" + } + }, + "7452489dd0df4407b70ab4e00f5a3647": { + "model_module": "@jupyter-widgets/base", + "model_name": "LayoutModel", + "model_module_version": "1.2.0", + "state": { + "_model_module": "@jupyter-widgets/base", + "_model_module_version": "1.2.0", + "_model_name": "LayoutModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "LayoutView", + "align_content": null, + "align_items": null, + "align_self": null, + "border": null, + "bottom": null, + "display": null, + "flex": null, + "flex_flow": null, + "grid_area": null, + "grid_auto_columns": null, + "grid_auto_flow": null, + "grid_auto_rows": null, + "grid_column": null, + "grid_gap": null, + "grid_row": null, + "grid_template_areas": null, + "grid_template_columns": null, + "grid_template_rows": null, 
+ "height": null, + "justify_content": null, + "justify_items": null, + "left": null, + "margin": null, + "max_height": null, + "max_width": null, + "min_height": null, + "min_width": null, + "object_fit": null, + "object_position": null, + "order": null, + "overflow": null, + "overflow_x": null, + "overflow_y": null, + "padding": null, + "right": null, + "top": null, + "visibility": null, + "width": null + } + }, + "29229fdd1a7840099d95a7d0f9164a37": { + "model_module": "@jupyter-widgets/base", + "model_name": "LayoutModel", + "model_module_version": "1.2.0", + "state": { + "_model_module": "@jupyter-widgets/base", + "_model_module_version": "1.2.0", + "_model_name": "LayoutModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "LayoutView", + "align_content": null, + "align_items": null, + "align_self": null, + "border": null, + "bottom": null, + "display": null, + "flex": null, + "flex_flow": null, + "grid_area": null, + "grid_auto_columns": null, + "grid_auto_flow": null, + "grid_auto_rows": null, + "grid_column": null, + "grid_gap": null, + "grid_row": null, + "grid_template_areas": null, + "grid_template_columns": null, + "grid_template_rows": null, + "height": null, + "justify_content": null, + "justify_items": null, + "left": null, + "margin": null, + "max_height": null, + "max_width": null, + "min_height": null, + "min_width": null, + "object_fit": null, + "object_position": null, + "order": null, + "overflow": null, + "overflow_x": null, + "overflow_y": null, + "padding": null, + "right": null, + "top": null, + "visibility": null, + "width": null + } + }, + "917f0a55fb974d3dae0b6ce1cf9cf431": { + "model_module": "@jupyter-widgets/controls", + "model_name": "DescriptionStyleModel", + "model_module_version": "1.5.0", + "state": { + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "DescriptionStyleModel", + "_view_count": null, + 
"_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "StyleView", + "description_width": "" + } + }, + "4f2dde1811344bf8b6a2c5630107b27c": { + "model_module": "@jupyter-widgets/base", + "model_name": "LayoutModel", + "model_module_version": "1.2.0", + "state": { + "_model_module": "@jupyter-widgets/base", + "_model_module_version": "1.2.0", + "_model_name": "LayoutModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "LayoutView", + "align_content": null, + "align_items": null, + "align_self": null, + "border": null, + "bottom": null, + "display": null, + "flex": null, + "flex_flow": null, + "grid_area": null, + "grid_auto_columns": null, + "grid_auto_flow": null, + "grid_auto_rows": null, + "grid_column": null, + "grid_gap": null, + "grid_row": null, + "grid_template_areas": null, + "grid_template_columns": null, + "grid_template_rows": null, + "height": null, + "justify_content": null, + "justify_items": null, + "left": null, + "margin": null, + "max_height": null, + "max_width": null, + "min_height": null, + "min_width": null, + "object_fit": null, + "object_position": null, + "order": null, + "overflow": null, + "overflow_x": null, + "overflow_y": null, + "padding": null, + "right": null, + "top": null, + "visibility": null, + "width": null + } + }, + "d8cf02c364984d77a6d0f104468493fe": { + "model_module": "@jupyter-widgets/controls", + "model_name": "ProgressStyleModel", + "model_module_version": "1.5.0", + "state": { + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "ProgressStyleModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "StyleView", + "bar_color": null, + "description_width": "" + } + }, + "283cb331d5be41a6a2804804ab4157f8": { + "model_module": "@jupyter-widgets/base", + "model_name": "LayoutModel", + 
"model_module_version": "1.2.0", + "state": { + "_model_module": "@jupyter-widgets/base", + "_model_module_version": "1.2.0", + "_model_name": "LayoutModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "LayoutView", + "align_content": null, + "align_items": null, + "align_self": null, + "border": null, + "bottom": null, + "display": null, + "flex": null, + "flex_flow": null, + "grid_area": null, + "grid_auto_columns": null, + "grid_auto_flow": null, + "grid_auto_rows": null, + "grid_column": null, + "grid_gap": null, + "grid_row": null, + "grid_template_areas": null, + "grid_template_columns": null, + "grid_template_rows": null, + "height": null, + "justify_content": null, + "justify_items": null, + "left": null, + "margin": null, + "max_height": null, + "max_width": null, + "min_height": null, + "min_width": null, + "object_fit": null, + "object_position": null, + "order": null, + "overflow": null, + "overflow_x": null, + "overflow_y": null, + "padding": null, + "right": null, + "top": null, + "visibility": null, + "width": null + } + }, + "8dea68cdeab940c6a8848b29fb0acc15": { + "model_module": "@jupyter-widgets/controls", + "model_name": "DescriptionStyleModel", + "model_module_version": "1.5.0", + "state": { + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "DescriptionStyleModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "StyleView", + "description_width": "" + } + }, + "3c22fa692f674ef4b278928f18cb2e25": { + "model_module": "@jupyter-widgets/controls", + "model_name": "HBoxModel", + "model_module_version": "1.5.0", + "state": { + "_dom_classes": [], + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "HBoxModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/controls", + "_view_module_version": "1.5.0", 
+ "_view_name": "HBoxView", + "box_style": "", + "children": [ + "IPY_MODEL_c8ccf1019747488b81f89037eca5fbc8", + "IPY_MODEL_2b0b5807a9ef4469b1743900110a66d6", + "IPY_MODEL_adddef9c7f69491894a6449cb568e1c5" + ], + "layout": "IPY_MODEL_53fa963136ee49e9b29a7ec9355dd68b" + } + }, + "c8ccf1019747488b81f89037eca5fbc8": { + "model_module": "@jupyter-widgets/controls", + "model_name": "HTMLModel", + "model_module_version": "1.5.0", + "state": { + "_dom_classes": [], + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "HTMLModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/controls", + "_view_module_version": "1.5.0", + "_view_name": "HTMLView", + "description": "", + "description_tooltip": null, + "layout": "IPY_MODEL_ba8fba46da4646c99abd88eb4060e10d", + "placeholder": "​", + "style": "IPY_MODEL_b35da4e51cca44ab873c63670744d70c", + "value": "Downloading (…)lve/main/config.yaml: 100%" + } + }, + "2b0b5807a9ef4469b1743900110a66d6": { + "model_module": "@jupyter-widgets/controls", + "model_name": "FloatProgressModel", + "model_module_version": "1.5.0", + "state": { + "_dom_classes": [], + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "FloatProgressModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/controls", + "_view_module_version": "1.5.0", + "_view_name": "ProgressView", + "bar_style": "success", + "description": "", + "description_tooltip": null, + "layout": "IPY_MODEL_8f8ee8e8131c454d926827ca952a7a32", + "max": 503, + "min": 0, + "orientation": "horizontal", + "style": "IPY_MODEL_f0dc52160c87446ea60b76e1d7c7decf", + "value": 503 + } + }, + "adddef9c7f69491894a6449cb568e1c5": { + "model_module": "@jupyter-widgets/controls", + "model_name": "HTMLModel", + "model_module_version": "1.5.0", + "state": { + "_dom_classes": [], + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "HTMLModel", + 
"_view_count": null, + "_view_module": "@jupyter-widgets/controls", + "_view_module_version": "1.5.0", + "_view_name": "HTMLView", + "description": "", + "description_tooltip": null, + "layout": "IPY_MODEL_9099eec49e5a40e09956e32fff04f01e", + "placeholder": "​", + "style": "IPY_MODEL_21c102c08fab49acb2b0b9a3f62f1a43", + "value": " 503/503 [00:00<00:00, 16.1kB/s]" + } + }, + "53fa963136ee49e9b29a7ec9355dd68b": { + "model_module": "@jupyter-widgets/base", + "model_name": "LayoutModel", + "model_module_version": "1.2.0", + "state": { + "_model_module": "@jupyter-widgets/base", + "_model_module_version": "1.2.0", + "_model_name": "LayoutModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "LayoutView", + "align_content": null, + "align_items": null, + "align_self": null, + "border": null, + "bottom": null, + "display": null, + "flex": null, + "flex_flow": null, + "grid_area": null, + "grid_auto_columns": null, + "grid_auto_flow": null, + "grid_auto_rows": null, + "grid_column": null, + "grid_gap": null, + "grid_row": null, + "grid_template_areas": null, + "grid_template_columns": null, + "grid_template_rows": null, + "height": null, + "justify_content": null, + "justify_items": null, + "left": null, + "margin": null, + "max_height": null, + "max_width": null, + "min_height": null, + "min_width": null, + "object_fit": null, + "object_position": null, + "order": null, + "overflow": null, + "overflow_x": null, + "overflow_y": null, + "padding": null, + "right": null, + "top": null, + "visibility": null, + "width": null + } + }, + "ba8fba46da4646c99abd88eb4060e10d": { + "model_module": "@jupyter-widgets/base", + "model_name": "LayoutModel", + "model_module_version": "1.2.0", + "state": { + "_model_module": "@jupyter-widgets/base", + "_model_module_version": "1.2.0", + "_model_name": "LayoutModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + 
"_view_name": "LayoutView", + "align_content": null, + "align_items": null, + "align_self": null, + "border": null, + "bottom": null, + "display": null, + "flex": null, + "flex_flow": null, + "grid_area": null, + "grid_auto_columns": null, + "grid_auto_flow": null, + "grid_auto_rows": null, + "grid_column": null, + "grid_gap": null, + "grid_row": null, + "grid_template_areas": null, + "grid_template_columns": null, + "grid_template_rows": null, + "height": null, + "justify_content": null, + "justify_items": null, + "left": null, + "margin": null, + "max_height": null, + "max_width": null, + "min_height": null, + "min_width": null, + "object_fit": null, + "object_position": null, + "order": null, + "overflow": null, + "overflow_x": null, + "overflow_y": null, + "padding": null, + "right": null, + "top": null, + "visibility": null, + "width": null + } + }, + "b35da4e51cca44ab873c63670744d70c": { + "model_module": "@jupyter-widgets/controls", + "model_name": "DescriptionStyleModel", + "model_module_version": "1.5.0", + "state": { + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "DescriptionStyleModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "StyleView", + "description_width": "" + } + }, + "8f8ee8e8131c454d926827ca952a7a32": { + "model_module": "@jupyter-widgets/base", + "model_name": "LayoutModel", + "model_module_version": "1.2.0", + "state": { + "_model_module": "@jupyter-widgets/base", + "_model_module_version": "1.2.0", + "_model_name": "LayoutModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "LayoutView", + "align_content": null, + "align_items": null, + "align_self": null, + "border": null, + "bottom": null, + "display": null, + "flex": null, + "flex_flow": null, + "grid_area": null, + "grid_auto_columns": null, + "grid_auto_flow": null, + "grid_auto_rows": 
null, + "grid_column": null, + "grid_gap": null, + "grid_row": null, + "grid_template_areas": null, + "grid_template_columns": null, + "grid_template_rows": null, + "height": null, + "justify_content": null, + "justify_items": null, + "left": null, + "margin": null, + "max_height": null, + "max_width": null, + "min_height": null, + "min_width": null, + "object_fit": null, + "object_position": null, + "order": null, + "overflow": null, + "overflow_x": null, + "overflow_y": null, + "padding": null, + "right": null, + "top": null, + "visibility": null, + "width": null + } + }, + "f0dc52160c87446ea60b76e1d7c7decf": { + "model_module": "@jupyter-widgets/controls", + "model_name": "ProgressStyleModel", + "model_module_version": "1.5.0", + "state": { + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "ProgressStyleModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "StyleView", + "bar_color": null, + "description_width": "" + } + }, + "9099eec49e5a40e09956e32fff04f01e": { + "model_module": "@jupyter-widgets/base", + "model_name": "LayoutModel", + "model_module_version": "1.2.0", + "state": { + "_model_module": "@jupyter-widgets/base", + "_model_module_version": "1.2.0", + "_model_name": "LayoutModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "LayoutView", + "align_content": null, + "align_items": null, + "align_self": null, + "border": null, + "bottom": null, + "display": null, + "flex": null, + "flex_flow": null, + "grid_area": null, + "grid_auto_columns": null, + "grid_auto_flow": null, + "grid_auto_rows": null, + "grid_column": null, + "grid_gap": null, + "grid_row": null, + "grid_template_areas": null, + "grid_template_columns": null, + "grid_template_rows": null, + "height": null, + "justify_content": null, + "justify_items": null, + "left": null, + "margin": null, + 
"max_height": null, + "max_width": null, + "min_height": null, + "min_width": null, + "object_fit": null, + "object_position": null, + "order": null, + "overflow": null, + "overflow_x": null, + "overflow_y": null, + "padding": null, + "right": null, + "top": null, + "visibility": null, + "width": null + } + }, + "21c102c08fab49acb2b0b9a3f62f1a43": { + "model_module": "@jupyter-widgets/controls", + "model_name": "DescriptionStyleModel", + "model_module_version": "1.5.0", + "state": { + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "DescriptionStyleModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "StyleView", + "description_width": "" + } + }, + "c1dd8f5b533d4f018a47eb72bc12bab9": { + "model_module": "@jupyter-widgets/controls", + "model_name": "HBoxModel", + "model_module_version": "1.5.0", + "state": { + "_dom_classes": [], + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "HBoxModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/controls", + "_view_module_version": "1.5.0", + "_view_name": "HBoxView", + "box_style": "", + "children": [ + "IPY_MODEL_0e0384525e8d48b290250099ee19c673", + "IPY_MODEL_f5e0db29e9654975b32c82598a7e0b7e", + "IPY_MODEL_ddaa862b183f46a5947e552ed765206c" + ], + "layout": "IPY_MODEL_9634a4f60ff14e7a8c1a8cff38ef9954" + } + }, + "0e0384525e8d48b290250099ee19c673": { + "model_module": "@jupyter-widgets/controls", + "model_name": "HTMLModel", + "model_module_version": "1.5.0", + "state": { + "_dom_classes": [], + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "HTMLModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/controls", + "_view_module_version": "1.5.0", + "_view_name": "HTMLView", + "description": "", + "description_tooltip": null, + "layout": 
"IPY_MODEL_f7ca8116da184a6c89faa834e1d50b1b", + "placeholder": "​", + "style": "IPY_MODEL_535675fafe0644c7ace668fe263f8e03", + "value": "Downloading pytorch_model.bin: 100%" + } + }, + "f5e0db29e9654975b32c82598a7e0b7e": { + "model_module": "@jupyter-widgets/controls", + "model_name": "FloatProgressModel", + "model_module_version": "1.5.0", + "state": { + "_dom_classes": [], + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "FloatProgressModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/controls", + "_view_module_version": "1.5.0", + "_view_name": "ProgressView", + "bar_style": "success", + "description": "", + "description_tooltip": null, + "layout": "IPY_MODEL_5c8f17eec77b425f8f14a1ac9a8407ed", + "max": 40356199, + "min": 0, + "orientation": "horizontal", + "style": "IPY_MODEL_85b19f90c93748b0ba2ef5e936912456", + "value": 40356199 + } + }, + "ddaa862b183f46a5947e552ed765206c": { + "model_module": "@jupyter-widgets/controls", + "model_name": "HTMLModel", + "model_module_version": "1.5.0", + "state": { + "_dom_classes": [], + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "HTMLModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/controls", + "_view_module_version": "1.5.0", + "_view_name": "HTMLView", + "description": "", + "description_tooltip": null, + "layout": "IPY_MODEL_309077bf93fe469f96bfc657ea5dd520", + "placeholder": "​", + "style": "IPY_MODEL_e0191f86888d4331a71009c62777dd87", + "value": " 40.4M/40.4M [00:00<00:00, 85.5MB/s]" + } + }, + "9634a4f60ff14e7a8c1a8cff38ef9954": { + "model_module": "@jupyter-widgets/base", + "model_name": "LayoutModel", + "model_module_version": "1.2.0", + "state": { + "_model_module": "@jupyter-widgets/base", + "_model_module_version": "1.2.0", + "_model_name": "LayoutModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": 
"LayoutView", + "align_content": null, + "align_items": null, + "align_self": null, + "border": null, + "bottom": null, + "display": null, + "flex": null, + "flex_flow": null, + "grid_area": null, + "grid_auto_columns": null, + "grid_auto_flow": null, + "grid_auto_rows": null, + "grid_column": null, + "grid_gap": null, + "grid_row": null, + "grid_template_areas": null, + "grid_template_columns": null, + "grid_template_rows": null, + "height": null, + "justify_content": null, + "justify_items": null, + "left": null, + "margin": null, + "max_height": null, + "max_width": null, + "min_height": null, + "min_width": null, + "object_fit": null, + "object_position": null, + "order": null, + "overflow": null, + "overflow_x": null, + "overflow_y": null, + "padding": null, + "right": null, + "top": null, + "visibility": null, + "width": null + } + }, + "f7ca8116da184a6c89faa834e1d50b1b": { + "model_module": "@jupyter-widgets/base", + "model_name": "LayoutModel", + "model_module_version": "1.2.0", + "state": { + "_model_module": "@jupyter-widgets/base", + "_model_module_version": "1.2.0", + "_model_name": "LayoutModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "LayoutView", + "align_content": null, + "align_items": null, + "align_self": null, + "border": null, + "bottom": null, + "display": null, + "flex": null, + "flex_flow": null, + "grid_area": null, + "grid_auto_columns": null, + "grid_auto_flow": null, + "grid_auto_rows": null, + "grid_column": null, + "grid_gap": null, + "grid_row": null, + "grid_template_areas": null, + "grid_template_columns": null, + "grid_template_rows": null, + "height": null, + "justify_content": null, + "justify_items": null, + "left": null, + "margin": null, + "max_height": null, + "max_width": null, + "min_height": null, + "min_width": null, + "object_fit": null, + "object_position": null, + "order": null, + "overflow": null, + "overflow_x": null, + "overflow_y": null, 
+ "padding": null, + "right": null, + "top": null, + "visibility": null, + "width": null + } + }, + "535675fafe0644c7ace668fe263f8e03": { + "model_module": "@jupyter-widgets/controls", + "model_name": "DescriptionStyleModel", + "model_module_version": "1.5.0", + "state": { + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "DescriptionStyleModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "StyleView", + "description_width": "" + } + }, + "5c8f17eec77b425f8f14a1ac9a8407ed": { + "model_module": "@jupyter-widgets/base", + "model_name": "LayoutModel", + "model_module_version": "1.2.0", + "state": { + "_model_module": "@jupyter-widgets/base", + "_model_module_version": "1.2.0", + "_model_name": "LayoutModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "LayoutView", + "align_content": null, + "align_items": null, + "align_self": null, + "border": null, + "bottom": null, + "display": null, + "flex": null, + "flex_flow": null, + "grid_area": null, + "grid_auto_columns": null, + "grid_auto_flow": null, + "grid_auto_rows": null, + "grid_column": null, + "grid_gap": null, + "grid_row": null, + "grid_template_areas": null, + "grid_template_columns": null, + "grid_template_rows": null, + "height": null, + "justify_content": null, + "justify_items": null, + "left": null, + "margin": null, + "max_height": null, + "max_width": null, + "min_height": null, + "min_width": null, + "object_fit": null, + "object_position": null, + "order": null, + "overflow": null, + "overflow_x": null, + "overflow_y": null, + "padding": null, + "right": null, + "top": null, + "visibility": null, + "width": null + } + }, + "85b19f90c93748b0ba2ef5e936912456": { + "model_module": "@jupyter-widgets/controls", + "model_name": "ProgressStyleModel", + "model_module_version": "1.5.0", + "state": { + 
"_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "ProgressStyleModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "StyleView", + "bar_color": null, + "description_width": "" + } + }, + "309077bf93fe469f96bfc657ea5dd520": { + "model_module": "@jupyter-widgets/base", + "model_name": "LayoutModel", + "model_module_version": "1.2.0", + "state": { + "_model_module": "@jupyter-widgets/base", + "_model_module_version": "1.2.0", + "_model_name": "LayoutModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "LayoutView", + "align_content": null, + "align_items": null, + "align_self": null, + "border": null, + "bottom": null, + "display": null, + "flex": null, + "flex_flow": null, + "grid_area": null, + "grid_auto_columns": null, + "grid_auto_flow": null, + "grid_auto_rows": null, + "grid_column": null, + "grid_gap": null, + "grid_row": null, + "grid_template_areas": null, + "grid_template_columns": null, + "grid_template_rows": null, + "height": null, + "justify_content": null, + "justify_items": null, + "left": null, + "margin": null, + "max_height": null, + "max_width": null, + "min_height": null, + "min_width": null, + "object_fit": null, + "object_position": null, + "order": null, + "overflow": null, + "overflow_x": null, + "overflow_y": null, + "padding": null, + "right": null, + "top": null, + "visibility": null, + "width": null + } + }, + "e0191f86888d4331a71009c62777dd87": { + "model_module": "@jupyter-widgets/controls", + "model_name": "DescriptionStyleModel", + "model_module_version": "1.5.0", + "state": { + "_model_module": "@jupyter-widgets/controls", + "_model_module_version": "1.5.0", + "_model_name": "DescriptionStyleModel", + "_view_count": null, + "_view_module": "@jupyter-widgets/base", + "_view_module_version": "1.2.0", + "_view_name": "StyleView", + 
"description_width": "" + } + } + } + } + }, + "cells": [ + { + "cell_type": "code", + "source": [ + "%%bash\n", + "# install the vall-e and required libraries\n", + "# PyTorch\n", + "pip install torch==1.13.1 torchaudio==0.13.1 --extra-index-url https://download.pytorch.org/whl/cu116\n", + "pip install torchmetrics==0.11.1\n", + "# fbank\n", + "pip install librosa matplotlib\n", + "\n", + "# phonemizer pypinyin\n", + "apt-get install espeak-ng git-lfs -y\n", + "## OSX: brew install espeak\n", + "pip install phonemizer==3.2.1 pypinyin==0.48.0\n", + "\n", + "pip install lhotse\n", + "\n", + "# k2\n", + "# find the right version in https://huggingface.co/csukuangfj/k2\n", + "pip install https://huggingface.co/csukuangfj/k2/resolve/main/cuda/k2-1.23.4.dev20230224+cuda11.6.torch1.13.1-cp310-cp310-linux_x86_64.whl\n", + "mkdir tmp_lib\n", + "\n", + "git clone https://github.com/k2-fsa/icefall\n", + "mv icefall tmp_lib\n", + "cd tmp_lib/icefall\n", + "pip install -r requirements.txt\n", + "pip install -e .\n", + "export PYTHONPATH=`pwd`/../icefall:$PYTHONPATH\n", + "echo \"export PYTHONPATH=`pwd`/../icefall:\\$PYTHONPATH\" >> ~/.zshrc\n", + "echo \"export PYTHONPATH=`pwd`/../icefall:\\$PYTHONPATH\" >> ~/.bashrc\n", + "cd ../..\n", + "source ~/.zshrc\n", + "source ~/.bashrc\n", + "\n", + "\n", + "git clone https://github.com/lifeiteng/vall-e\n", + "mv vall-e tmp_lib\n", + "cd tmp_lib/vall-e\n", + "pip install -e .\n", + "\n", + "pip install vocos\n", + "pip install gradio" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/" + }, + "id": "USn47sC-VKvo", + "outputId": "4afe3379-1136-4903-ca9c-bc10b8281e42" + }, + "execution_count": 1, + "outputs": [ + { + "output_type": "stream", + "name": "stdout", + "text": [ + "Looking in indexes: https://pypi.org/simple, https://download.pytorch.org/whl/cu116\n", + "Requirement already satisfied: torch==1.13.1 in /usr/local/lib/python3.10/dist-packages (1.13.1+cu116)\n", + "Requirement already satisfied: 
torchaudio==0.13.1 in /usr/local/lib/python3.10/dist-packages (0.13.1+cu116)\n", + "Requirement already satisfied: typing-extensions in /usr/local/lib/python3.10/dist-packages (from torch==1.13.1) (4.8.0)\n", + "Requirement already satisfied: torchmetrics==0.11.1 in /usr/local/lib/python3.10/dist-packages (0.11.1)\n", + "Requirement already satisfied: numpy>=1.17.2 in /usr/local/lib/python3.10/dist-packages (from torchmetrics==0.11.1) (1.23.5)\n", + "Requirement already satisfied: torch>=1.8.1 in /usr/local/lib/python3.10/dist-packages (from torchmetrics==0.11.1) (1.13.1+cu116)\n", + "Requirement already satisfied: packaging in /usr/local/lib/python3.10/dist-packages (from torchmetrics==0.11.1) (23.1)\n", + "Requirement already satisfied: typing-extensions in /usr/local/lib/python3.10/dist-packages (from torch>=1.8.1->torchmetrics==0.11.1) (4.8.0)\n", + "Requirement already satisfied: librosa in /usr/local/lib/python3.10/dist-packages (0.8.1)\n", + "Requirement already satisfied: matplotlib in /usr/local/lib/python3.10/dist-packages (3.7.1)\n", + "Requirement already satisfied: audioread>=2.0.0 in /usr/local/lib/python3.10/dist-packages (from librosa) (3.0.0)\n", + "Requirement already satisfied: numpy>=1.15.0 in /usr/local/lib/python3.10/dist-packages (from librosa) (1.23.5)\n", + "Requirement already satisfied: scipy>=1.0.0 in /usr/local/lib/python3.10/dist-packages (from librosa) (1.11.2)\n", + "Requirement already satisfied: scikit-learn!=0.19.0,>=0.14.0 in /usr/local/lib/python3.10/dist-packages (from librosa) (1.2.2)\n", + "Requirement already satisfied: joblib>=0.14 in /usr/local/lib/python3.10/dist-packages (from librosa) (1.3.2)\n", + "Requirement already satisfied: decorator>=3.0.0 in /usr/local/lib/python3.10/dist-packages (from librosa) (4.4.2)\n", + "Requirement already satisfied: resampy>=0.2.2 in /usr/local/lib/python3.10/dist-packages (from librosa) (0.4.2)\n", + "Requirement already satisfied: numba>=0.43.0 in 
/usr/local/lib/python3.10/dist-packages (from librosa) (0.56.4)\n", + "Requirement already satisfied: soundfile>=0.10.2 in /usr/local/lib/python3.10/dist-packages (from librosa) (0.12.1)\n", + "Requirement already satisfied: pooch>=1.0 in /usr/local/lib/python3.10/dist-packages (from librosa) (1.7.0)\n", + "Requirement already satisfied: packaging>=20.0 in /usr/local/lib/python3.10/dist-packages (from librosa) (23.1)\n", + "Requirement already satisfied: contourpy>=1.0.1 in /usr/local/lib/python3.10/dist-packages (from matplotlib) (1.1.0)\n", + "Requirement already satisfied: cycler>=0.10 in /usr/local/lib/python3.10/dist-packages (from matplotlib) (0.11.0)\n", + "Requirement already satisfied: fonttools>=4.22.0 in /usr/local/lib/python3.10/dist-packages (from matplotlib) (4.42.1)\n", + "Requirement already satisfied: kiwisolver>=1.0.1 in /usr/local/lib/python3.10/dist-packages (from matplotlib) (1.4.5)\n", + "Requirement already satisfied: pillow>=6.2.0 in /usr/local/lib/python3.10/dist-packages (from matplotlib) (9.4.0)\n", + "Requirement already satisfied: pyparsing>=2.3.1 in /usr/local/lib/python3.10/dist-packages (from matplotlib) (3.1.1)\n", + "Requirement already satisfied: python-dateutil>=2.7 in /usr/local/lib/python3.10/dist-packages (from matplotlib) (2.8.2)\n", + "Requirement already satisfied: llvmlite<0.40,>=0.39.0dev0 in /usr/local/lib/python3.10/dist-packages (from numba>=0.43.0->librosa) (0.39.1)\n", + "Requirement already satisfied: setuptools in /usr/local/lib/python3.10/dist-packages (from numba>=0.43.0->librosa) (67.7.2)\n", + "Requirement already satisfied: platformdirs>=2.5.0 in /usr/local/lib/python3.10/dist-packages (from pooch>=1.0->librosa) (3.10.0)\n", + "Requirement already satisfied: requests>=2.19.0 in /usr/local/lib/python3.10/dist-packages (from pooch>=1.0->librosa) (2.31.0)\n", + "Requirement already satisfied: six>=1.5 in /usr/local/lib/python3.10/dist-packages (from python-dateutil>=2.7->matplotlib) (1.16.0)\n", + "Requirement 
already satisfied: threadpoolctl>=2.0.0 in /usr/local/lib/python3.10/dist-packages (from scikit-learn!=0.19.0,>=0.14.0->librosa) (3.2.0)\n", + "Requirement already satisfied: cffi>=1.0 in /usr/local/lib/python3.10/dist-packages (from soundfile>=0.10.2->librosa) (1.15.1)\n", + "Requirement already satisfied: pycparser in /usr/local/lib/python3.10/dist-packages (from cffi>=1.0->soundfile>=0.10.2->librosa) (2.21)\n", + "Requirement already satisfied: charset-normalizer<4,>=2 in /usr/local/lib/python3.10/dist-packages (from requests>=2.19.0->pooch>=1.0->librosa) (3.2.0)\n", + "Requirement already satisfied: idna<4,>=2.5 in /usr/local/lib/python3.10/dist-packages (from requests>=2.19.0->pooch>=1.0->librosa) (3.4)\n", + "Requirement already satisfied: urllib3<3,>=1.21.1 in /usr/local/lib/python3.10/dist-packages (from requests>=2.19.0->pooch>=1.0->librosa) (2.0.4)\n", + "Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.10/dist-packages (from requests>=2.19.0->pooch>=1.0->librosa) (2023.7.22)\n", + "Reading package lists...\n", + "Building dependency tree...\n", + "Reading state information...\n", + "espeak-ng is already the newest version (1.50+dfsg-10).\n", + "git-lfs is already the newest version (3.0.2-1ubuntu0.2).\n", + "0 upgraded, 0 newly installed, 0 to remove and 18 not upgraded.\n", + "Requirement already satisfied: phonemizer==3.2.1 in /usr/local/lib/python3.10/dist-packages (3.2.1)\n", + "Requirement already satisfied: pypinyin==0.48.0 in /usr/local/lib/python3.10/dist-packages (0.48.0)\n", + "Requirement already satisfied: joblib in /usr/local/lib/python3.10/dist-packages (from phonemizer==3.2.1) (1.3.2)\n", + "Requirement already satisfied: segments in /usr/local/lib/python3.10/dist-packages (from phonemizer==3.2.1) (2.2.1)\n", + "Requirement already satisfied: attrs>=18.1 in /usr/local/lib/python3.10/dist-packages (from phonemizer==3.2.1) (23.1.0)\n", + "Requirement already satisfied: dlinfo in 
/usr/local/lib/python3.10/dist-packages (from phonemizer==3.2.1) (1.2.1)\n", + "Requirement already satisfied: typing-extensions in /usr/local/lib/python3.10/dist-packages (from phonemizer==3.2.1) (4.8.0)\n", + "Requirement already satisfied: clldutils>=1.7.3 in /usr/local/lib/python3.10/dist-packages (from segments->phonemizer==3.2.1) (3.20.0)\n", + "Requirement already satisfied: csvw>=1.5.6 in /usr/local/lib/python3.10/dist-packages (from segments->phonemizer==3.2.1) (3.1.3)\n", + "Requirement already satisfied: regex in /usr/local/lib/python3.10/dist-packages (from segments->phonemizer==3.2.1) (2023.6.3)\n", + "Requirement already satisfied: python-dateutil in /usr/local/lib/python3.10/dist-packages (from clldutils>=1.7.3->segments->phonemizer==3.2.1) (2.8.2)\n", + "Requirement already satisfied: tabulate>=0.7.7 in /usr/local/lib/python3.10/dist-packages (from clldutils>=1.7.3->segments->phonemizer==3.2.1) (0.9.0)\n", + "Requirement already satisfied: colorlog in /usr/local/lib/python3.10/dist-packages (from clldutils>=1.7.3->segments->phonemizer==3.2.1) (6.7.0)\n", + "Requirement already satisfied: pylatexenc in /usr/local/lib/python3.10/dist-packages (from clldutils>=1.7.3->segments->phonemizer==3.2.1) (2.10)\n", + "Requirement already satisfied: markdown in /usr/local/lib/python3.10/dist-packages (from clldutils>=1.7.3->segments->phonemizer==3.2.1) (3.4.4)\n", + "Requirement already satisfied: lxml in /usr/local/lib/python3.10/dist-packages (from clldutils>=1.7.3->segments->phonemizer==3.2.1) (4.9.3)\n", + "Requirement already satisfied: markupsafe in /usr/local/lib/python3.10/dist-packages (from clldutils>=1.7.3->segments->phonemizer==3.2.1) (2.1.3)\n", + "Requirement already satisfied: babel in /usr/local/lib/python3.10/dist-packages (from csvw>=1.5.6->segments->phonemizer==3.2.1) (2.12.1)\n", + "Requirement already satisfied: colorama in /usr/local/lib/python3.10/dist-packages (from csvw>=1.5.6->segments->phonemizer==3.2.1) (0.4.6)\n", + "Requirement 
already satisfied: isodate in /usr/local/lib/python3.10/dist-packages (from csvw>=1.5.6->segments->phonemizer==3.2.1) (0.6.1)\n", + "Requirement already satisfied: jsonschema in /usr/local/lib/python3.10/dist-packages (from csvw>=1.5.6->segments->phonemizer==3.2.1) (4.19.0)\n", + "Requirement already satisfied: language-tags in /usr/local/lib/python3.10/dist-packages (from csvw>=1.5.6->segments->phonemizer==3.2.1) (1.2.0)\n", + "Requirement already satisfied: rdflib in /usr/local/lib/python3.10/dist-packages (from csvw>=1.5.6->segments->phonemizer==3.2.1) (7.0.0)\n", + "Requirement already satisfied: requests in /usr/local/lib/python3.10/dist-packages (from csvw>=1.5.6->segments->phonemizer==3.2.1) (2.31.0)\n", + "Requirement already satisfied: rfc3986<2 in /usr/local/lib/python3.10/dist-packages (from csvw>=1.5.6->segments->phonemizer==3.2.1) (1.5.0)\n", + "Requirement already satisfied: uritemplate>=3.0.0 in /usr/local/lib/python3.10/dist-packages (from csvw>=1.5.6->segments->phonemizer==3.2.1) (4.1.1)\n", + "Requirement already satisfied: six in /usr/local/lib/python3.10/dist-packages (from isodate->csvw>=1.5.6->segments->phonemizer==3.2.1) (1.16.0)\n", + "Requirement already satisfied: jsonschema-specifications>=2023.03.6 in /usr/local/lib/python3.10/dist-packages (from jsonschema->csvw>=1.5.6->segments->phonemizer==3.2.1) (2023.7.1)\n", + "Requirement already satisfied: referencing>=0.28.4 in /usr/local/lib/python3.10/dist-packages (from jsonschema->csvw>=1.5.6->segments->phonemizer==3.2.1) (0.30.2)\n", + "Requirement already satisfied: rpds-py>=0.7.1 in /usr/local/lib/python3.10/dist-packages (from jsonschema->csvw>=1.5.6->segments->phonemizer==3.2.1) (0.10.2)\n", + "Requirement already satisfied: pyparsing<4,>=2.1.0 in /usr/local/lib/python3.10/dist-packages (from rdflib->csvw>=1.5.6->segments->phonemizer==3.2.1) (3.1.1)\n", + "Requirement already satisfied: charset-normalizer<4,>=2 in /usr/local/lib/python3.10/dist-packages (from 
requests->csvw>=1.5.6->segments->phonemizer==3.2.1) (3.2.0)\n", + "Requirement already satisfied: idna<4,>=2.5 in /usr/local/lib/python3.10/dist-packages (from requests->csvw>=1.5.6->segments->phonemizer==3.2.1) (3.4)\n", + "Requirement already satisfied: urllib3<3,>=1.21.1 in /usr/local/lib/python3.10/dist-packages (from requests->csvw>=1.5.6->segments->phonemizer==3.2.1) (2.0.4)\n", + "Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.10/dist-packages (from requests->csvw>=1.5.6->segments->phonemizer==3.2.1) (2023.7.22)\n", + "Requirement already satisfied: lhotse in /usr/local/lib/python3.10/dist-packages (1.16.0)\n", + "Requirement already satisfied: audioread>=2.1.9 in /usr/local/lib/python3.10/dist-packages (from lhotse) (3.0.0)\n", + "Requirement already satisfied: SoundFile>=0.10 in /usr/local/lib/python3.10/dist-packages (from lhotse) (0.12.1)\n", + "Requirement already satisfied: click>=7.1.1 in /usr/local/lib/python3.10/dist-packages (from lhotse) (8.1.7)\n", + "Requirement already satisfied: cytoolz>=0.10.1 in /usr/local/lib/python3.10/dist-packages (from lhotse) (0.12.2)\n", + "Requirement already satisfied: dataclasses in /usr/local/lib/python3.10/dist-packages (from lhotse) (0.6)\n", + "Requirement already satisfied: intervaltree>=3.1.0 in /usr/local/lib/python3.10/dist-packages (from lhotse) (3.1.0)\n", + "Requirement already satisfied: numpy>=1.18.1 in /usr/local/lib/python3.10/dist-packages (from lhotse) (1.23.5)\n", + "Requirement already satisfied: packaging in /usr/local/lib/python3.10/dist-packages (from lhotse) (23.1)\n", + "Requirement already satisfied: pyyaml>=5.3.1 in /usr/local/lib/python3.10/dist-packages (from lhotse) (6.0.1)\n", + "Requirement already satisfied: tabulate>=0.8.1 in /usr/local/lib/python3.10/dist-packages (from lhotse) (0.9.0)\n", + "Requirement already satisfied: tqdm in /usr/local/lib/python3.10/dist-packages (from lhotse) (4.66.1)\n", + "Requirement already satisfied: lilcom>=1.1.0 in 
/usr/local/lib/python3.10/dist-packages (from lhotse) (1.7)\n", + "Requirement already satisfied: toolz>=0.8.0 in /usr/local/lib/python3.10/dist-packages (from cytoolz>=0.10.1->lhotse) (0.12.0)\n", + "Requirement already satisfied: sortedcontainers<3.0,>=2.0 in /usr/local/lib/python3.10/dist-packages (from intervaltree>=3.1.0->lhotse) (2.4.0)\n", + "Requirement already satisfied: cffi>=1.0 in /usr/local/lib/python3.10/dist-packages (from SoundFile>=0.10->lhotse) (1.15.1)\n", + "Requirement already satisfied: pycparser in /usr/local/lib/python3.10/dist-packages (from cffi>=1.0->SoundFile>=0.10->lhotse) (2.21)\n", + "Collecting k2==1.23.4.dev20230224+cuda11.6.torch1.13.1\n", + " Downloading https://huggingface.co/csukuangfj/k2/resolve/main/cuda/k2-1.23.4.dev20230224+cuda11.6.torch1.13.1-cp310-cp310-linux_x86_64.whl (102.9 MB)\n", + " ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 102.9/102.9 MB 8.9 MB/s eta 0:00:00\n", + "Requirement already satisfied: torch==1.13.1 in /usr/local/lib/python3.10/dist-packages (from k2==1.23.4.dev20230224+cuda11.6.torch1.13.1) (1.13.1+cu116)\n", + "Requirement already satisfied: graphviz in /usr/local/lib/python3.10/dist-packages (from k2==1.23.4.dev20230224+cuda11.6.torch1.13.1) (0.20.1)\n", + "Requirement already satisfied: typing-extensions in /usr/local/lib/python3.10/dist-packages (from torch==1.13.1->k2==1.23.4.dev20230224+cuda11.6.torch1.13.1) (4.8.0)\n", + "Requirement already satisfied: kaldifst in /usr/local/lib/python3.10/dist-packages (from -r requirements.txt (line 1)) (1.7.5)\n", + "Requirement already satisfied: kaldilm in /usr/local/lib/python3.10/dist-packages (from -r requirements.txt (line 2)) (1.15.1)\n", + "Requirement already satisfied: kaldialign in /usr/local/lib/python3.10/dist-packages (from -r requirements.txt (line 3)) (0.7.2)\n", + "Requirement already satisfied: sentencepiece>=0.1.96 in /usr/local/lib/python3.10/dist-packages (from -r requirements.txt (line 4)) (0.1.99)\n", + "Requirement already satisfied: 
tensorboard in /usr/local/lib/python3.10/dist-packages (from -r requirements.txt (line 5)) (2.13.0)\n", + "Requirement already satisfied: typeguard in /usr/local/lib/python3.10/dist-packages (from -r requirements.txt (line 6)) (4.1.5)\n", + "Requirement already satisfied: dill in /usr/local/lib/python3.10/dist-packages (from -r requirements.txt (line 7)) (0.3.7)\n", + "Requirement already satisfied: absl-py>=0.4 in /usr/local/lib/python3.10/dist-packages (from tensorboard->-r requirements.txt (line 5)) (1.4.0)\n", + "Requirement already satisfied: grpcio>=1.48.2 in /usr/local/lib/python3.10/dist-packages (from tensorboard->-r requirements.txt (line 5)) (1.57.0)\n", + "Requirement already satisfied: google-auth<3,>=1.6.3 in /usr/local/lib/python3.10/dist-packages (from tensorboard->-r requirements.txt (line 5)) (2.17.3)\n", + "Requirement already satisfied: google-auth-oauthlib<1.1,>=0.5 in /usr/local/lib/python3.10/dist-packages (from tensorboard->-r requirements.txt (line 5)) (1.0.0)\n", + "Requirement already satisfied: markdown>=2.6.8 in /usr/local/lib/python3.10/dist-packages (from tensorboard->-r requirements.txt (line 5)) (3.4.4)\n", + "Requirement already satisfied: numpy>=1.12.0 in /usr/local/lib/python3.10/dist-packages (from tensorboard->-r requirements.txt (line 5)) (1.23.5)\n", + "Requirement already satisfied: protobuf>=3.19.6 in /usr/local/lib/python3.10/dist-packages (from tensorboard->-r requirements.txt (line 5)) (3.20.3)\n", + "Requirement already satisfied: requests<3,>=2.21.0 in /usr/local/lib/python3.10/dist-packages (from tensorboard->-r requirements.txt (line 5)) (2.31.0)\n", + "Requirement already satisfied: setuptools>=41.0.0 in /usr/local/lib/python3.10/dist-packages (from tensorboard->-r requirements.txt (line 5)) (67.7.2)\n", + "Requirement already satisfied: tensorboard-data-server<0.8.0,>=0.7.0 in /usr/local/lib/python3.10/dist-packages (from tensorboard->-r requirements.txt (line 5)) (0.7.1)\n", + "Requirement already satisfied: 
werkzeug>=1.0.1 in /usr/local/lib/python3.10/dist-packages (from tensorboard->-r requirements.txt (line 5)) (2.3.7)\n", + "Requirement already satisfied: wheel>=0.26 in /usr/local/lib/python3.10/dist-packages (from tensorboard->-r requirements.txt (line 5)) (0.41.2)\n", + "Requirement already satisfied: typing-extensions>=4.7.0 in /usr/local/lib/python3.10/dist-packages (from typeguard->-r requirements.txt (line 6)) (4.8.0)\n", + "Requirement already satisfied: cachetools<6.0,>=2.0.0 in /usr/local/lib/python3.10/dist-packages (from google-auth<3,>=1.6.3->tensorboard->-r requirements.txt (line 5)) (5.3.1)\n", + "Requirement already satisfied: pyasn1-modules>=0.2.1 in /usr/local/lib/python3.10/dist-packages (from google-auth<3,>=1.6.3->tensorboard->-r requirements.txt (line 5)) (0.3.0)\n", + "Requirement already satisfied: six>=1.9.0 in /usr/local/lib/python3.10/dist-packages (from google-auth<3,>=1.6.3->tensorboard->-r requirements.txt (line 5)) (1.16.0)\n", + "Requirement already satisfied: rsa<5,>=3.1.4 in /usr/local/lib/python3.10/dist-packages (from google-auth<3,>=1.6.3->tensorboard->-r requirements.txt (line 5)) (4.9)\n", + "Requirement already satisfied: requests-oauthlib>=0.7.0 in /usr/local/lib/python3.10/dist-packages (from google-auth-oauthlib<1.1,>=0.5->tensorboard->-r requirements.txt (line 5)) (1.3.1)\n", + "Requirement already satisfied: charset-normalizer<4,>=2 in /usr/local/lib/python3.10/dist-packages (from requests<3,>=2.21.0->tensorboard->-r requirements.txt (line 5)) (3.2.0)\n", + "Requirement already satisfied: idna<4,>=2.5 in /usr/local/lib/python3.10/dist-packages (from requests<3,>=2.21.0->tensorboard->-r requirements.txt (line 5)) (3.4)\n", + "Requirement already satisfied: urllib3<3,>=1.21.1 in /usr/local/lib/python3.10/dist-packages (from requests<3,>=2.21.0->tensorboard->-r requirements.txt (line 5)) (2.0.4)\n", + "Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.10/dist-packages (from 
requests<3,>=2.21.0->tensorboard->-r requirements.txt (line 5)) (2023.7.22)\n", + "Requirement already satisfied: MarkupSafe>=2.1.1 in /usr/local/lib/python3.10/dist-packages (from werkzeug>=1.0.1->tensorboard->-r requirements.txt (line 5)) (2.1.3)\n", + "Requirement already satisfied: pyasn1<0.6.0,>=0.4.6 in /usr/local/lib/python3.10/dist-packages (from pyasn1-modules>=0.2.1->google-auth<3,>=1.6.3->tensorboard->-r requirements.txt (line 5)) (0.5.0)\n", + "Requirement already satisfied: oauthlib>=3.0.0 in /usr/local/lib/python3.10/dist-packages (from requests-oauthlib>=0.7.0->google-auth-oauthlib<1.1,>=0.5->tensorboard->-r requirements.txt (line 5)) (3.2.2)\n", + "Obtaining file:///content/tmp_lib/icefall\n", + " Installing build dependencies: started\n", + " Installing build dependencies: finished with status 'done'\n", + " Checking if build backend supports build_editable: started\n", + " Checking if build backend supports build_editable: finished with status 'done'\n", + " Getting requirements to build editable: started\n", + " Getting requirements to build editable: finished with status 'done'\n", + " Preparing editable metadata (pyproject.toml): started\n", + " Preparing editable metadata (pyproject.toml): finished with status 'done'\n", + "Requirement already satisfied: kaldifst in /usr/local/lib/python3.10/dist-packages (from icefall==1.0) (1.7.5)\n", + "Requirement already satisfied: kaldilm in /usr/local/lib/python3.10/dist-packages (from icefall==1.0) (1.15.1)\n", + "Requirement already satisfied: kaldialign in /usr/local/lib/python3.10/dist-packages (from icefall==1.0) (0.7.2)\n", + "Requirement already satisfied: sentencepiece>=0.1.96 in /usr/local/lib/python3.10/dist-packages (from icefall==1.0) (0.1.99)\n", + "Requirement already satisfied: tensorboard in /usr/local/lib/python3.10/dist-packages (from icefall==1.0) (2.13.0)\n", + "Requirement already satisfied: typeguard in /usr/local/lib/python3.10/dist-packages (from icefall==1.0) (4.1.5)\n", + 
"Requirement already satisfied: dill in /usr/local/lib/python3.10/dist-packages (from icefall==1.0) (0.3.7)\n", + "Requirement already satisfied: absl-py>=0.4 in /usr/local/lib/python3.10/dist-packages (from tensorboard->icefall==1.0) (1.4.0)\n", + "Requirement already satisfied: grpcio>=1.48.2 in /usr/local/lib/python3.10/dist-packages (from tensorboard->icefall==1.0) (1.57.0)\n", + "Requirement already satisfied: google-auth<3,>=1.6.3 in /usr/local/lib/python3.10/dist-packages (from tensorboard->icefall==1.0) (2.17.3)\n", + "Requirement already satisfied: google-auth-oauthlib<1.1,>=0.5 in /usr/local/lib/python3.10/dist-packages (from tensorboard->icefall==1.0) (1.0.0)\n", + "Requirement already satisfied: markdown>=2.6.8 in /usr/local/lib/python3.10/dist-packages (from tensorboard->icefall==1.0) (3.4.4)\n", + "Requirement already satisfied: numpy>=1.12.0 in /usr/local/lib/python3.10/dist-packages (from tensorboard->icefall==1.0) (1.23.5)\n", + "Requirement already satisfied: protobuf>=3.19.6 in /usr/local/lib/python3.10/dist-packages (from tensorboard->icefall==1.0) (3.20.3)\n", + "Requirement already satisfied: requests<3,>=2.21.0 in /usr/local/lib/python3.10/dist-packages (from tensorboard->icefall==1.0) (2.31.0)\n", + "Requirement already satisfied: setuptools>=41.0.0 in /usr/local/lib/python3.10/dist-packages (from tensorboard->icefall==1.0) (67.7.2)\n", + "Requirement already satisfied: tensorboard-data-server<0.8.0,>=0.7.0 in /usr/local/lib/python3.10/dist-packages (from tensorboard->icefall==1.0) (0.7.1)\n", + "Requirement already satisfied: werkzeug>=1.0.1 in /usr/local/lib/python3.10/dist-packages (from tensorboard->icefall==1.0) (2.3.7)\n", + "Requirement already satisfied: wheel>=0.26 in /usr/local/lib/python3.10/dist-packages (from tensorboard->icefall==1.0) (0.41.2)\n", + "Requirement already satisfied: typing-extensions>=4.7.0 in /usr/local/lib/python3.10/dist-packages (from typeguard->icefall==1.0) (4.8.0)\n", + "Requirement already satisfied: 
cachetools<6.0,>=2.0.0 in /usr/local/lib/python3.10/dist-packages (from google-auth<3,>=1.6.3->tensorboard->icefall==1.0) (5.3.1)\n", + "Requirement already satisfied: pyasn1-modules>=0.2.1 in /usr/local/lib/python3.10/dist-packages (from google-auth<3,>=1.6.3->tensorboard->icefall==1.0) (0.3.0)\n", + "Requirement already satisfied: six>=1.9.0 in /usr/local/lib/python3.10/dist-packages (from google-auth<3,>=1.6.3->tensorboard->icefall==1.0) (1.16.0)\n", + "Requirement already satisfied: rsa<5,>=3.1.4 in /usr/local/lib/python3.10/dist-packages (from google-auth<3,>=1.6.3->tensorboard->icefall==1.0) (4.9)\n", + "Requirement already satisfied: requests-oauthlib>=0.7.0 in /usr/local/lib/python3.10/dist-packages (from google-auth-oauthlib<1.1,>=0.5->tensorboard->icefall==1.0) (1.3.1)\n", + "Requirement already satisfied: charset-normalizer<4,>=2 in /usr/local/lib/python3.10/dist-packages (from requests<3,>=2.21.0->tensorboard->icefall==1.0) (3.2.0)\n", + "Requirement already satisfied: idna<4,>=2.5 in /usr/local/lib/python3.10/dist-packages (from requests<3,>=2.21.0->tensorboard->icefall==1.0) (3.4)\n", + "Requirement already satisfied: urllib3<3,>=1.21.1 in /usr/local/lib/python3.10/dist-packages (from requests<3,>=2.21.0->tensorboard->icefall==1.0) (2.0.4)\n", + "Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.10/dist-packages (from requests<3,>=2.21.0->tensorboard->icefall==1.0) (2023.7.22)\n", + "Requirement already satisfied: MarkupSafe>=2.1.1 in /usr/local/lib/python3.10/dist-packages (from werkzeug>=1.0.1->tensorboard->icefall==1.0) (2.1.3)\n", + "Requirement already satisfied: pyasn1<0.6.0,>=0.4.6 in /usr/local/lib/python3.10/dist-packages (from pyasn1-modules>=0.2.1->google-auth<3,>=1.6.3->tensorboard->icefall==1.0) (0.5.0)\n", + "Requirement already satisfied: oauthlib>=3.0.0 in /usr/local/lib/python3.10/dist-packages (from requests-oauthlib>=0.7.0->google-auth-oauthlib<1.1,>=0.5->tensorboard->icefall==1.0) (3.2.2)\n", + "Building 
wheels for collected packages: icefall\n", + " Building editable for icefall (pyproject.toml): started\n", + " Building editable for icefall (pyproject.toml): finished with status 'done'\n", + " Created wheel for icefall: filename=icefall-1.0-0.editable-py3-none-any.whl size=6938 sha256=a82e786befc35808f23d067a3fae3a47f2e3d386cb8f5dc3985a21af73b85c0f\n", + " Stored in directory: /tmp/pip-ephem-wheel-cache-bk20tk10/wheels/8b/61/8c/6ab9252dbb8103b07c7e54134628c2bac869e1cb195484f840\n", + "Successfully built icefall\n", + "Installing collected packages: icefall\n", + " Attempting uninstall: icefall\n", + " Found existing installation: icefall 1.0\n", + " Uninstalling icefall-1.0:\n", + " Successfully uninstalled icefall-1.0\n", + "Successfully installed icefall-1.0\n", + "Obtaining file:///content/tmp_lib/vall-e\n", + " Preparing metadata (setup.py): started\n", + " Preparing metadata (setup.py): finished with status 'done'\n", + "Requirement already satisfied: encodec in /usr/local/lib/python3.10/dist-packages (from valle==1.0.0.dev0+git.d5cf330.clean) (0.1.1)\n", + "Requirement already satisfied: phonemizer in /usr/local/lib/python3.10/dist-packages (from valle==1.0.0.dev0+git.d5cf330.clean) (3.2.1)\n", + "Requirement already satisfied: numpy in /usr/local/lib/python3.10/dist-packages (from encodec->valle==1.0.0.dev0+git.d5cf330.clean) (1.23.5)\n", + "Requirement already satisfied: torch in /usr/local/lib/python3.10/dist-packages (from encodec->valle==1.0.0.dev0+git.d5cf330.clean) (1.13.1+cu116)\n", + "Requirement already satisfied: torchaudio in /usr/local/lib/python3.10/dist-packages (from encodec->valle==1.0.0.dev0+git.d5cf330.clean) (0.13.1+cu116)\n", + "Requirement already satisfied: einops in /usr/local/lib/python3.10/dist-packages (from encodec->valle==1.0.0.dev0+git.d5cf330.clean) (0.6.1)\n", + "Requirement already satisfied: joblib in /usr/local/lib/python3.10/dist-packages (from phonemizer->valle==1.0.0.dev0+git.d5cf330.clean) (1.3.2)\n", + "Requirement 
already satisfied: segments in /usr/local/lib/python3.10/dist-packages (from phonemizer->valle==1.0.0.dev0+git.d5cf330.clean) (2.2.1)\n", + "Requirement already satisfied: attrs>=18.1 in /usr/local/lib/python3.10/dist-packages (from phonemizer->valle==1.0.0.dev0+git.d5cf330.clean) (23.1.0)\n", + "Requirement already satisfied: dlinfo in /usr/local/lib/python3.10/dist-packages (from phonemizer->valle==1.0.0.dev0+git.d5cf330.clean) (1.2.1)\n", + "Requirement already satisfied: typing-extensions in /usr/local/lib/python3.10/dist-packages (from phonemizer->valle==1.0.0.dev0+git.d5cf330.clean) (4.8.0)\n", + "Requirement already satisfied: clldutils>=1.7.3 in /usr/local/lib/python3.10/dist-packages (from segments->phonemizer->valle==1.0.0.dev0+git.d5cf330.clean) (3.20.0)\n", + "Requirement already satisfied: csvw>=1.5.6 in /usr/local/lib/python3.10/dist-packages (from segments->phonemizer->valle==1.0.0.dev0+git.d5cf330.clean) (3.1.3)\n", + "Requirement already satisfied: regex in /usr/local/lib/python3.10/dist-packages (from segments->phonemizer->valle==1.0.0.dev0+git.d5cf330.clean) (2023.6.3)\n", + "Requirement already satisfied: python-dateutil in /usr/local/lib/python3.10/dist-packages (from clldutils>=1.7.3->segments->phonemizer->valle==1.0.0.dev0+git.d5cf330.clean) (2.8.2)\n", + "Requirement already satisfied: tabulate>=0.7.7 in /usr/local/lib/python3.10/dist-packages (from clldutils>=1.7.3->segments->phonemizer->valle==1.0.0.dev0+git.d5cf330.clean) (0.9.0)\n", + "Requirement already satisfied: colorlog in /usr/local/lib/python3.10/dist-packages (from clldutils>=1.7.3->segments->phonemizer->valle==1.0.0.dev0+git.d5cf330.clean) (6.7.0)\n", + "Requirement already satisfied: pylatexenc in /usr/local/lib/python3.10/dist-packages (from clldutils>=1.7.3->segments->phonemizer->valle==1.0.0.dev0+git.d5cf330.clean) (2.10)\n", + "Requirement already satisfied: markdown in /usr/local/lib/python3.10/dist-packages (from 
clldutils>=1.7.3->segments->phonemizer->valle==1.0.0.dev0+git.d5cf330.clean) (3.4.4)\n", + "Requirement already satisfied: lxml in /usr/local/lib/python3.10/dist-packages (from clldutils>=1.7.3->segments->phonemizer->valle==1.0.0.dev0+git.d5cf330.clean) (4.9.3)\n", + "Requirement already satisfied: markupsafe in /usr/local/lib/python3.10/dist-packages (from clldutils>=1.7.3->segments->phonemizer->valle==1.0.0.dev0+git.d5cf330.clean) (2.1.3)\n", + "Requirement already satisfied: babel in /usr/local/lib/python3.10/dist-packages (from csvw>=1.5.6->segments->phonemizer->valle==1.0.0.dev0+git.d5cf330.clean) (2.12.1)\n", + "Requirement already satisfied: colorama in /usr/local/lib/python3.10/dist-packages (from csvw>=1.5.6->segments->phonemizer->valle==1.0.0.dev0+git.d5cf330.clean) (0.4.6)\n", + "Requirement already satisfied: isodate in /usr/local/lib/python3.10/dist-packages (from csvw>=1.5.6->segments->phonemizer->valle==1.0.0.dev0+git.d5cf330.clean) (0.6.1)\n", + "Requirement already satisfied: jsonschema in /usr/local/lib/python3.10/dist-packages (from csvw>=1.5.6->segments->phonemizer->valle==1.0.0.dev0+git.d5cf330.clean) (4.19.0)\n", + "Requirement already satisfied: language-tags in /usr/local/lib/python3.10/dist-packages (from csvw>=1.5.6->segments->phonemizer->valle==1.0.0.dev0+git.d5cf330.clean) (1.2.0)\n", + "Requirement already satisfied: rdflib in /usr/local/lib/python3.10/dist-packages (from csvw>=1.5.6->segments->phonemizer->valle==1.0.0.dev0+git.d5cf330.clean) (7.0.0)\n", + "Requirement already satisfied: requests in /usr/local/lib/python3.10/dist-packages (from csvw>=1.5.6->segments->phonemizer->valle==1.0.0.dev0+git.d5cf330.clean) (2.31.0)\n", + "Requirement already satisfied: rfc3986<2 in /usr/local/lib/python3.10/dist-packages (from csvw>=1.5.6->segments->phonemizer->valle==1.0.0.dev0+git.d5cf330.clean) (1.5.0)\n", + "Requirement already satisfied: uritemplate>=3.0.0 in /usr/local/lib/python3.10/dist-packages (from 
csvw>=1.5.6->segments->phonemizer->valle==1.0.0.dev0+git.d5cf330.clean) (4.1.1)\n", + "Requirement already satisfied: six in /usr/local/lib/python3.10/dist-packages (from isodate->csvw>=1.5.6->segments->phonemizer->valle==1.0.0.dev0+git.d5cf330.clean) (1.16.0)\n", + "Requirement already satisfied: jsonschema-specifications>=2023.03.6 in /usr/local/lib/python3.10/dist-packages (from jsonschema->csvw>=1.5.6->segments->phonemizer->valle==1.0.0.dev0+git.d5cf330.clean) (2023.7.1)\n", + "Requirement already satisfied: referencing>=0.28.4 in /usr/local/lib/python3.10/dist-packages (from jsonschema->csvw>=1.5.6->segments->phonemizer->valle==1.0.0.dev0+git.d5cf330.clean) (0.30.2)\n", + "Requirement already satisfied: rpds-py>=0.7.1 in /usr/local/lib/python3.10/dist-packages (from jsonschema->csvw>=1.5.6->segments->phonemizer->valle==1.0.0.dev0+git.d5cf330.clean) (0.10.2)\n", + "Requirement already satisfied: pyparsing<4,>=2.1.0 in /usr/local/lib/python3.10/dist-packages (from rdflib->csvw>=1.5.6->segments->phonemizer->valle==1.0.0.dev0+git.d5cf330.clean) (3.1.1)\n", + "Requirement already satisfied: charset-normalizer<4,>=2 in /usr/local/lib/python3.10/dist-packages (from requests->csvw>=1.5.6->segments->phonemizer->valle==1.0.0.dev0+git.d5cf330.clean) (3.2.0)\n", + "Requirement already satisfied: idna<4,>=2.5 in /usr/local/lib/python3.10/dist-packages (from requests->csvw>=1.5.6->segments->phonemizer->valle==1.0.0.dev0+git.d5cf330.clean) (3.4)\n", + "Requirement already satisfied: urllib3<3,>=1.21.1 in /usr/local/lib/python3.10/dist-packages (from requests->csvw>=1.5.6->segments->phonemizer->valle==1.0.0.dev0+git.d5cf330.clean) (2.0.4)\n", + "Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.10/dist-packages (from requests->csvw>=1.5.6->segments->phonemizer->valle==1.0.0.dev0+git.d5cf330.clean) (2023.7.22)\n", + "Installing collected packages: valle\n", + " Attempting uninstall: valle\n", + " Found existing installation: valle 
1.0.0.dev0+git.d5cf330.clean\n", + " Uninstalling valle-1.0.0.dev0+git.d5cf330.clean:\n", + " Successfully uninstalled valle-1.0.0.dev0+git.d5cf330.clean\n", + " Running setup.py develop for valle\n", + "Successfully installed valle-1.0.0.dev0+git.d5cf330.clean\n", + "Requirement already satisfied: vocos in /usr/local/lib/python3.10/dist-packages (0.0.3)\n", + "Requirement already satisfied: torch in /usr/local/lib/python3.10/dist-packages (from vocos) (1.13.1+cu116)\n", + "Requirement already satisfied: torchaudio in /usr/local/lib/python3.10/dist-packages (from vocos) (0.13.1+cu116)\n", + "Requirement already satisfied: numpy in /usr/local/lib/python3.10/dist-packages (from vocos) (1.23.5)\n", + "Requirement already satisfied: scipy in /usr/local/lib/python3.10/dist-packages (from vocos) (1.11.2)\n", + "Requirement already satisfied: einops in /usr/local/lib/python3.10/dist-packages (from vocos) (0.6.1)\n", + "Requirement already satisfied: pyyaml in /usr/local/lib/python3.10/dist-packages (from vocos) (6.0.1)\n", + "Requirement already satisfied: huggingface-hub in /usr/local/lib/python3.10/dist-packages (from vocos) (0.17.2)\n", + "Requirement already satisfied: encodec==0.1.1 in /usr/local/lib/python3.10/dist-packages (from vocos) (0.1.1)\n", + "Requirement already satisfied: filelock in /usr/local/lib/python3.10/dist-packages (from huggingface-hub->vocos) (3.12.2)\n", + "Requirement already satisfied: fsspec in /usr/local/lib/python3.10/dist-packages (from huggingface-hub->vocos) (2023.6.0)\n", + "Requirement already satisfied: requests in /usr/local/lib/python3.10/dist-packages (from huggingface-hub->vocos) (2.31.0)\n", + "Requirement already satisfied: tqdm>=4.42.1 in /usr/local/lib/python3.10/dist-packages (from huggingface-hub->vocos) (4.66.1)\n", + "Requirement already satisfied: typing-extensions>=3.7.4.3 in /usr/local/lib/python3.10/dist-packages (from huggingface-hub->vocos) (4.8.0)\n", + "Requirement already satisfied: packaging>=20.9 in 
/usr/local/lib/python3.10/dist-packages (from huggingface-hub->vocos) (23.1)\n", + "Requirement already satisfied: charset-normalizer<4,>=2 in /usr/local/lib/python3.10/dist-packages (from requests->huggingface-hub->vocos) (3.2.0)\n", + "Requirement already satisfied: idna<4,>=2.5 in /usr/local/lib/python3.10/dist-packages (from requests->huggingface-hub->vocos) (3.4)\n", + "Requirement already satisfied: urllib3<3,>=1.21.1 in /usr/local/lib/python3.10/dist-packages (from requests->huggingface-hub->vocos) (2.0.4)\n", + "Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.10/dist-packages (from requests->huggingface-hub->vocos) (2023.7.22)\n", + "Collecting gradio\n", + " Downloading gradio-3.44.4-py3-none-any.whl (20.2 MB)\n", + " ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 20.2/20.2 MB 59.7 MB/s eta 0:00:00\n", + "Collecting aiofiles<24.0,>=22.0 (from gradio)\n", + " Downloading aiofiles-23.2.1-py3-none-any.whl (15 kB)\n", + "Requirement already satisfied: altair<6.0,>=4.2.0 in /usr/local/lib/python3.10/dist-packages (from gradio) (4.2.2)\n", + "Collecting fastapi (from gradio)\n", + " Downloading fastapi-0.103.1-py3-none-any.whl (66 kB)\n", + " ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 66.2/66.2 kB 6.9 MB/s eta 0:00:00\n", + "Collecting ffmpy (from gradio)\n", + " Downloading ffmpy-0.3.1.tar.gz (5.5 kB)\n", + " Preparing metadata (setup.py): started\n", + " Preparing metadata (setup.py): finished with status 'done'\n", + "Collecting gradio-client==0.5.1 (from gradio)\n", + " Downloading gradio_client-0.5.1-py3-none-any.whl (298 kB)\n", + " ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 298.2/298.2 kB 21.5 MB/s eta 0:00:00\n", + "Collecting httpx (from gradio)\n", + " Downloading httpx-0.25.0-py3-none-any.whl (75 kB)\n", + " ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 75.7/75.7 kB 7.9 MB/s eta 0:00:00\n", + "Requirement already satisfied: huggingface-hub>=0.14.0 in /usr/local/lib/python3.10/dist-packages (from gradio) (0.17.2)\n", + "Requirement already 
satisfied: importlib-resources<7.0,>=1.3 in /usr/local/lib/python3.10/dist-packages (from gradio) (6.0.1)\n", + "Requirement already satisfied: jinja2<4.0 in /usr/local/lib/python3.10/dist-packages (from gradio) (3.1.2)\n", + "Requirement already satisfied: markupsafe~=2.0 in /usr/local/lib/python3.10/dist-packages (from gradio) (2.1.3)\n", + "Requirement already satisfied: matplotlib~=3.0 in /usr/local/lib/python3.10/dist-packages (from gradio) (3.7.1)\n", + "Requirement already satisfied: numpy~=1.0 in /usr/local/lib/python3.10/dist-packages (from gradio) (1.23.5)\n", + "Collecting orjson~=3.0 (from gradio)\n", + " Downloading orjson-3.9.7-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (138 kB)\n", + " ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 138.7/138.7 kB 15.4 MB/s eta 0:00:00\n", + "Requirement already satisfied: packaging in /usr/local/lib/python3.10/dist-packages (from gradio) (23.1)\n", + "Requirement already satisfied: pandas<3.0,>=1.0 in /usr/local/lib/python3.10/dist-packages (from gradio) (1.5.3)\n", + "Requirement already satisfied: pillow<11.0,>=8.0 in /usr/local/lib/python3.10/dist-packages (from gradio) (9.4.0)\n", + "Requirement already satisfied: pydantic!=1.8,!=1.8.1,!=2.0.0,!=2.0.1,<3.0.0,>=1.7.4 in /usr/local/lib/python3.10/dist-packages (from gradio) (1.10.12)\n", + "Collecting pydub (from gradio)\n", + " Downloading pydub-0.25.1-py2.py3-none-any.whl (32 kB)\n", + "Collecting python-multipart (from gradio)\n", + " Downloading python_multipart-0.0.6-py3-none-any.whl (45 kB)\n", + " ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 45.7/45.7 kB 4.6 MB/s eta 0:00:00\n", + "Requirement already satisfied: pyyaml<7.0,>=5.0 in /usr/local/lib/python3.10/dist-packages (from gradio) (6.0.1)\n", + "Requirement already satisfied: requests~=2.0 in /usr/local/lib/python3.10/dist-packages (from gradio) (2.31.0)\n", + "Collecting semantic-version~=2.0 (from gradio)\n", + " Downloading semantic_version-2.10.0-py2.py3-none-any.whl (15 kB)\n", + "Requirement 
already satisfied: typing-extensions~=4.0 in /usr/local/lib/python3.10/dist-packages (from gradio) (4.8.0)\n", + "Collecting uvicorn>=0.14.0 (from gradio)\n", + " Downloading uvicorn-0.23.2-py3-none-any.whl (59 kB)\n", + " ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 59.5/59.5 kB 6.4 MB/s eta 0:00:00\n", + "Collecting websockets<12.0,>=10.0 (from gradio)\n", + " Downloading websockets-11.0.3-cp310-cp310-manylinux_2_5_x86_64.manylinux1_x86_64.manylinux_2_17_x86_64.manylinux2014_x86_64.whl (129 kB)\n", + " ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 129.9/129.9 kB 13.7 MB/s eta 0:00:00\n", + "Requirement already satisfied: fsspec in /usr/local/lib/python3.10/dist-packages (from gradio-client==0.5.1->gradio) (2023.6.0)\n", + "Requirement already satisfied: entrypoints in /usr/local/lib/python3.10/dist-packages (from altair<6.0,>=4.2.0->gradio) (0.4)\n", + "Requirement already satisfied: jsonschema>=3.0 in /usr/local/lib/python3.10/dist-packages (from altair<6.0,>=4.2.0->gradio) (4.19.0)\n", + "Requirement already satisfied: toolz in /usr/local/lib/python3.10/dist-packages (from altair<6.0,>=4.2.0->gradio) (0.12.0)\n", + "Requirement already satisfied: filelock in /usr/local/lib/python3.10/dist-packages (from huggingface-hub>=0.14.0->gradio) (3.12.2)\n", + "Requirement already satisfied: tqdm>=4.42.1 in /usr/local/lib/python3.10/dist-packages (from huggingface-hub>=0.14.0->gradio) (4.66.1)\n", + "Requirement already satisfied: contourpy>=1.0.1 in /usr/local/lib/python3.10/dist-packages (from matplotlib~=3.0->gradio) (1.1.0)\n", + "Requirement already satisfied: cycler>=0.10 in /usr/local/lib/python3.10/dist-packages (from matplotlib~=3.0->gradio) (0.11.0)\n", + "Requirement already satisfied: fonttools>=4.22.0 in /usr/local/lib/python3.10/dist-packages (from matplotlib~=3.0->gradio) (4.42.1)\n", + "Requirement already satisfied: kiwisolver>=1.0.1 in /usr/local/lib/python3.10/dist-packages (from matplotlib~=3.0->gradio) (1.4.5)\n", + "Requirement already satisfied: 
pyparsing>=2.3.1 in /usr/local/lib/python3.10/dist-packages (from matplotlib~=3.0->gradio) (3.1.1)\n", + "Requirement already satisfied: python-dateutil>=2.7 in /usr/local/lib/python3.10/dist-packages (from matplotlib~=3.0->gradio) (2.8.2)\n", + "Requirement already satisfied: pytz>=2020.1 in /usr/local/lib/python3.10/dist-packages (from pandas<3.0,>=1.0->gradio) (2023.3.post1)\n", + "Requirement already satisfied: charset-normalizer<4,>=2 in /usr/local/lib/python3.10/dist-packages (from requests~=2.0->gradio) (3.2.0)\n", + "Requirement already satisfied: idna<4,>=2.5 in /usr/local/lib/python3.10/dist-packages (from requests~=2.0->gradio) (3.4)\n", + "Requirement already satisfied: urllib3<3,>=1.21.1 in /usr/local/lib/python3.10/dist-packages (from requests~=2.0->gradio) (2.0.4)\n", + "Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.10/dist-packages (from requests~=2.0->gradio) (2023.7.22)\n", + "Requirement already satisfied: click>=7.0 in /usr/local/lib/python3.10/dist-packages (from uvicorn>=0.14.0->gradio) (8.1.7)\n", + "Collecting h11>=0.8 (from uvicorn>=0.14.0->gradio)\n", + " Downloading h11-0.14.0-py3-none-any.whl (58 kB)\n", + " ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 58.3/58.3 kB 6.1 MB/s eta 0:00:00\n", + "Requirement already satisfied: anyio<4.0.0,>=3.7.1 in /usr/local/lib/python3.10/dist-packages (from fastapi->gradio) (3.7.1)\n", + "Collecting starlette<0.28.0,>=0.27.0 (from fastapi->gradio)\n", + " Downloading starlette-0.27.0-py3-none-any.whl (66 kB)\n", + " ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 67.0/67.0 kB 7.8 MB/s eta 0:00:00\n", + "Collecting httpcore<0.19.0,>=0.18.0 (from httpx->gradio)\n", + " Downloading httpcore-0.18.0-py3-none-any.whl (76 kB)\n", + " ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 76.0/76.0 kB 8.1 MB/s eta 0:00:00\n", + "Requirement already satisfied: sniffio in /usr/local/lib/python3.10/dist-packages (from httpx->gradio) (1.3.0)\n", + "Requirement already satisfied: exceptiongroup in 
/usr/local/lib/python3.10/dist-packages (from anyio<4.0.0,>=3.7.1->fastapi->gradio) (1.1.3)\n", + "Requirement already satisfied: attrs>=22.2.0 in /usr/local/lib/python3.10/dist-packages (from jsonschema>=3.0->altair<6.0,>=4.2.0->gradio) (23.1.0)\n", + "Requirement already satisfied: jsonschema-specifications>=2023.03.6 in /usr/local/lib/python3.10/dist-packages (from jsonschema>=3.0->altair<6.0,>=4.2.0->gradio) (2023.7.1)\n", + "Requirement already satisfied: referencing>=0.28.4 in /usr/local/lib/python3.10/dist-packages (from jsonschema>=3.0->altair<6.0,>=4.2.0->gradio) (0.30.2)\n", + "Requirement already satisfied: rpds-py>=0.7.1 in /usr/local/lib/python3.10/dist-packages (from jsonschema>=3.0->altair<6.0,>=4.2.0->gradio) (0.10.2)\n", + "Requirement already satisfied: six>=1.5 in /usr/local/lib/python3.10/dist-packages (from python-dateutil>=2.7->matplotlib~=3.0->gradio) (1.16.0)\n", + "Building wheels for collected packages: ffmpy\n", + " Building wheel for ffmpy (setup.py): started\n", + " Building wheel for ffmpy (setup.py): finished with status 'done'\n", + " Created wheel for ffmpy: filename=ffmpy-0.3.1-py3-none-any.whl size=5579 sha256=b36d159f82a22c76b9424d2bbbed3b8d1a99772b68f92f6a9a71bf6f935bd3b6\n", + " Stored in directory: /root/.cache/pip/wheels/01/a6/d1/1c0828c304a4283b2c1639a09ad86f83d7c487ef34c6b4a1bf\n", + "Successfully built ffmpy\n", + "Installing collected packages: pydub, ffmpy, websockets, semantic-version, python-multipart, orjson, h11, aiofiles, uvicorn, starlette, httpcore, httpx, fastapi, gradio-client, gradio\n", + "Successfully installed aiofiles-23.2.1 fastapi-0.103.1 ffmpy-0.3.1 gradio-3.44.4 gradio-client-0.5.1 h11-0.14.0 httpcore-0.18.0 httpx-0.25.0 orjson-3.9.7 pydub-0.25.1 python-multipart-0.0.6 semantic-version-2.10.0 starlette-0.27.0 uvicorn-0.23.2 websockets-11.0.3\n" + ] + }, + { + "output_type": "stream", + "name": "stderr", + "text": [ + "mkdir: cannot create directory ‘tmp_lib’: File exists\n", + "Cloning into 
'icefall'...\n", + "mv: cannot move 'icefall' to 'tmp_lib/icefall': Directory not empty\n", + "Cloning into 'vall-e'...\n" + ] + } + ] + }, + { + "cell_type": "code", + "source": [ + "!wget https://huggingface.co/LearnItAnyway/vall-e_korean/resolve/main/vall-e_ko_v0.pt\n", + "!wget https://huggingface.co/LearnItAnyway/vall-e_korean/resolve/main/unique_text_tokens.k2symbols" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/" + }, + "id": "PMNAqnktVw1f", + "outputId": "e9b623e1-c430-4125-976d-b175af09c194" + }, + "execution_count": 2, + "outputs": [ + { + "output_type": "stream", + "name": "stdout", + "text": [ + "--2023-09-21 06:51:42-- https://huggingface.co/LearnItAnyway/vall-e_korean/resolve/main/vall-e_ko_v0.pt\n", + "Resolving huggingface.co (huggingface.co)... 65.8.178.93, 65.8.178.27, 65.8.178.118, ...\n", + "Connecting to huggingface.co (huggingface.co)|65.8.178.93|:443... connected.\n", + "HTTP request sent, awaiting response... 302 Found\n", + "Location: https://cdn-lfs.huggingface.co/repos/f8/b9/f8b90061950052a23944dd83f71a6f031a5d39c73dbb799693620ca8a4186a97/e2894775b160c24132f8f6d6d7df6cc8bf59a9b465778d08989e200859610560?response-content-disposition=attachment%3B+filename*%3DUTF-8%27%27vall-e_ko_v0.pt%3B+filename%3D%22vall-e_ko_v0.pt%22%3B&Expires=1695538302&Policy=eyJTdGF0ZW1lbnQiOlt7IkNvbmRpdGlvbiI6eyJEYXRlTGVzc1RoYW4iOnsiQVdTOkVwb2NoVGltZSI6MTY5NTUzODMwMn19LCJSZXNvdXJjZSI6Imh0dHBzOi8vY2RuLWxmcy5odWdnaW5nZmFjZS5jby9yZXBvcy9mOC9iOS9mOGI5MDA2MTk1MDA1MmEyMzk0NGRkODNmNzFhNmYwMzFhNWQzOWM3M2RiYjc5OTY5MzYyMGNhOGE0MTg2YTk3L2UyODk0Nzc1YjE2MGMyNDEzMmY4ZjZkNmQ3ZGY2Y2M4YmY1OWE5YjQ2NTc3OGQwODk4OWUyMDA4NTk2MTA1NjA%7EcmVzcG9uc2UtY29udGVudC1kaXNwb3NpdGlvbj0qIn1dfQ__&Signature=TdG-TKfzyMK3IjFKx5xrIImhwDNTjgbtm0rYqIvCBWvGm%7EHC1ymtwN3WlhNNc0FSZ-QDR2wnmplNbK33mO9MHPtYqgzWRfiXZsHxUkWuU67eAVyRRgrxqMWrUA69Zc%7E0IBQOxSnU3yVDwKoP-Up7s1gIElgTODwK-hjVFKDc9gdEnQEBMQBYlPey7g2lFUcFdstKl6KEop%7EbyPL%7EHO6qUknp7iWdkwXEy7WCEdu1qjqmrCjysep2QDtlwoLLTdol-YOY8Qko4B
n-esR4pu3Qx5%7EHfx3hn3bCHjyTBykRyuigdIBuUcxbi5ULUU8xjSacReY-on9b%7EH-FQu5WnKGCeQ__&Key-Pair-Id=KVTP0A1DKRTAX [following]\n", + "--2023-09-21 06:51:42-- https://cdn-lfs.huggingface.co/repos/f8/b9/f8b90061950052a23944dd83f71a6f031a5d39c73dbb799693620ca8a4186a97/e2894775b160c24132f8f6d6d7df6cc8bf59a9b465778d08989e200859610560?response-content-disposition=attachment%3B+filename*%3DUTF-8%27%27vall-e_ko_v0.pt%3B+filename%3D%22vall-e_ko_v0.pt%22%3B&Expires=1695538302&Policy=eyJTdGF0ZW1lbnQiOlt7IkNvbmRpdGlvbiI6eyJEYXRlTGVzc1RoYW4iOnsiQVdTOkVwb2NoVGltZSI6MTY5NTUzODMwMn19LCJSZXNvdXJjZSI6Imh0dHBzOi8vY2RuLWxmcy5odWdnaW5nZmFjZS5jby9yZXBvcy9mOC9iOS9mOGI5MDA2MTk1MDA1MmEyMzk0NGRkODNmNzFhNmYwMzFhNWQzOWM3M2RiYjc5OTY5MzYyMGNhOGE0MTg2YTk3L2UyODk0Nzc1YjE2MGMyNDEzMmY4ZjZkNmQ3ZGY2Y2M4YmY1OWE5YjQ2NTc3OGQwODk4OWUyMDA4NTk2MTA1NjA%7EcmVzcG9uc2UtY29udGVudC1kaXNwb3NpdGlvbj0qIn1dfQ__&Signature=TdG-TKfzyMK3IjFKx5xrIImhwDNTjgbtm0rYqIvCBWvGm%7EHC1ymtwN3WlhNNc0FSZ-QDR2wnmplNbK33mO9MHPtYqgzWRfiXZsHxUkWuU67eAVyRRgrxqMWrUA69Zc%7E0IBQOxSnU3yVDwKoP-Up7s1gIElgTODwK-hjVFKDc9gdEnQEBMQBYlPey7g2lFUcFdstKl6KEop%7EbyPL%7EHO6qUknp7iWdkwXEy7WCEdu1qjqmrCjysep2QDtlwoLLTdol-YOY8Qko4Bn-esR4pu3Qx5%7EHfx3hn3bCHjyTBykRyuigdIBuUcxbi5ULUU8xjSacReY-on9b%7EH-FQu5WnKGCeQ__&Key-Pair-Id=KVTP0A1DKRTAX\n", + "Resolving cdn-lfs.huggingface.co (cdn-lfs.huggingface.co)... 108.157.162.95, 108.157.162.27, 108.157.162.99, ...\n", + "Connecting to cdn-lfs.huggingface.co (cdn-lfs.huggingface.co)|108.157.162.95|:443... connected.\n", + "HTTP request sent, awaiting response... 200 OK\n", + "Length: 2699959616 (2.5G) [binary/octet-stream]\n", + "Saving to: ‘vall-e_ko_v0.pt.2’\n", + "\n", + "vall-e_ko_v0.pt.2 8%[> ] 230.57M 34.9MB/s eta 69s ^C\n", + "--2023-09-21 06:51:49-- https://huggingface.co/LearnItAnyway/vall-e_korean/resolve/main/unique_text_tokens.k2symbols\n", + "Resolving huggingface.co (huggingface.co)... 65.8.178.93, 65.8.178.27, 65.8.178.118, ...\n", + "Connecting to huggingface.co (huggingface.co)|65.8.178.93|:443... 
connected.\n", + "HTTP request sent, awaiting response... 200 OK\n", + "Length: 3238 (3.2K) [text/plain]\n", + "Saving to: ‘unique_text_tokens.k2symbols.2’\n", + "\n", + "unique_text_tokens. 100%[===================>] 3.16K --.-KB/s in 0s \n", + "\n", + "2023-09-21 06:51:50 (659 MB/s) - ‘unique_text_tokens.k2symbols.2’ saved [3238/3238]\n", + "\n" + ] + } + ] + }, + { + "cell_type": "code", + "source": [ + "from IPython.core.display import HTML\n", + "HTML(\"\")" + ], + "metadata": { + "id": "LeYX_9zQfBUH" + }, + "execution_count": null, + "outputs": [] + }, + { + "cell_type": "code", + "source": [ + "import argparse\n", + "import logging\n", + "import os\n", + "import pathlib\n", + "import time\n", + "import tempfile\n", + "import platform\n", + "import webbrowser\n", + "import sys\n", + "import torch, torchaudio\n", + "import random\n", + "\n", + "import numpy as np\n", + "\n", + "from valle.data import (\n", + " AudioTokenizer,\n", + " TextTokenizer,\n", + " tokenize_audio,\n", + " tokenize_text,\n", + ")\n", + "from icefall.utils import AttributeDict\n", + "from valle.data.collation import get_text_token_collater\n", + "from valle.models import get_model\n", + "\n", + "from vocos import Vocos\n", + "from encodec.utils import convert_audio\n", + "import multiprocessing\n", + "\n", + "thread_count = multiprocessing.cpu_count()\n", + "\n", + "print(\"Use\",thread_count,\"cpu cores for computing\")\n", + "\n", + "torch.set_num_threads(thread_count)\n", + "torch.set_num_interop_threads(thread_count)\n", + "torch._C._jit_set_profiling_executor(False)\n", + "torch._C._jit_set_profiling_mode(False)\n", + "torch._C._set_graph_executor_optimize(False)\n", + "\n", + "text_tokenizer = TextTokenizer(language='ko')\n", + "\n", + "device = torch.device(\"cpu\")\n", + "if torch.cuda.is_available():\n", + " device = torch.device(\"cuda\", 0)\n", + "\n", + "checkpoint = torch.load(\"./vall-e_ko_v0.pt\", map_location='cpu')\n", + "model = get_model(AttributeDict(checkpoint))\n", 
+ "missing_keys, unexpected_keys = model.load_state_dict(\n", + " checkpoint[\"model\"], strict=True\n", + ")\n", + "assert not missing_keys\n", + "model.eval()\n", + "model.to(device)\n", + "text_collater = get_text_token_collater('./unique_text_tokens.k2symbols')\n", + "\n", + "# Encodec model\n", + "audio_tokenizer = AudioTokenizer(device)\n", + "\n", + "# Vocos decoder\n", + "vocos = Vocos.from_pretrained('charactr/vocos-encodec-24khz').to(device)\n", + "\n", + "model.to(device)\n", + "@torch.no_grad()\n", + "def infer_from_prompt(text_prompt, audio_prompt, text):\n", + " ## text to token\n", + " text_tokens, text_tokens_lens = text_collater(\n", + " [\n", + " tokenize_text(\n", + " text_tokenizer, text=f\"{text_prompt} {text}\".strip()\n", + " )\n", + " ]\n", + " )\n", + " _, enroll_x_lens = text_collater(\n", + " [\n", + " tokenize_text(\n", + " text_tokenizer, text=f\"{text_prompt}\".strip()\n", + " )\n", + " ]\n", + " )\n", + " print('text_loaded')\n", + "\n", + " # text to synthesize\n", + " wav_pr, sr = torchaudio.load(audio_prompt)\n", + " wav_pr = convert_audio(wav_pr, sr, audio_tokenizer.sample_rate, audio_tokenizer.channels)\n", + " audio_prompts = audio_tokenizer.encode(wav_pr.unsqueeze(0))[0][0].transpose(2, 1).to(device)\n", + " print('Audio encoded')\n", + "\n", + " encoded_frames = model.inference(\n", + " text_tokens.to(device), text_tokens_lens.to(device),\n", + " audio_prompts, enroll_x_lens=enroll_x_lens,\n", + " top_k=-100, temperature=1)\n", + " vocos_features = vocos.codes_to_features(encoded_frames.permute(2, 0, 1))\n", + " samples = vocos.decode(vocos_features, bandwidth_id=torch.tensor([2], device=device))\n", + " message = f\"sythesized text: {text}\"\n", + " return message, (24000, samples.squeeze(0).cpu().numpy())\n", + "\n", + "import gradio as gr\n", + "app = gr.Blocks(title=\"VALL-E Korean\")\n", + "with app:\n", + " #gr.Markdown(top_md)\n", + " with gr.Tab(\"VALL-E Korean Demo\"):\n", + " #gr.Markdown(infer_from_prompt_md)\n", + 
" with gr.Row():\n", + " with gr.Column():\n", + " text_prompt = gr.TextArea(label=\"Input Text\",\n", + " placeholder=\"Type text in the audio file (Korean)\",)\n", + " audio_prompt= gr.Audio(label=\"Input Audio\", source='upload', interactive=True, type=\"filepath\")\n", + " text_input = gr.TextArea(label=\"Output Text\",\n", + " placeholder=\"Type text you want to generate (Korean)\",)\n", + " with gr.Column():\n", + " text_output = gr.Textbox(label=\"Message\")\n", + " audio_output= gr.Audio(label=\"Output Audio\")\n", + " btn = gr.Button(\"Generate!\")\n", + " btn.click(infer_from_prompt,\n", + " inputs=[text_prompt, audio_prompt, text_input],\n", + " outputs=[text_output, audio_output])\n", + "webbrowser.open(\"http://127.0.0.1:7860\")\n", + "app.launch(share=True)" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/", + "height": 784, + "referenced_widgets": [ + "65c70bc500eb48f5a3f664634c9abcb8", + "e03b82ed14aa4f72a98fb62f1b9c1772", + "53daa6d66f3644a2836c1f6e5fefbec2", + "4dd5a724ed7d4fa4ba53723176e008b3", + "7452489dd0df4407b70ab4e00f5a3647", + "29229fdd1a7840099d95a7d0f9164a37", + "917f0a55fb974d3dae0b6ce1cf9cf431", + "4f2dde1811344bf8b6a2c5630107b27c", + "d8cf02c364984d77a6d0f104468493fe", + "283cb331d5be41a6a2804804ab4157f8", + "8dea68cdeab940c6a8848b29fb0acc15", + "3c22fa692f674ef4b278928f18cb2e25", + "c8ccf1019747488b81f89037eca5fbc8", + "2b0b5807a9ef4469b1743900110a66d6", + "adddef9c7f69491894a6449cb568e1c5", + "53fa963136ee49e9b29a7ec9355dd68b", + "ba8fba46da4646c99abd88eb4060e10d", + "b35da4e51cca44ab873c63670744d70c", + "8f8ee8e8131c454d926827ca952a7a32", + "f0dc52160c87446ea60b76e1d7c7decf", + "9099eec49e5a40e09956e32fff04f01e", + "21c102c08fab49acb2b0b9a3f62f1a43", + "c1dd8f5b533d4f018a47eb72bc12bab9", + "0e0384525e8d48b290250099ee19c673", + "f5e0db29e9654975b32c82598a7e0b7e", + "ddaa862b183f46a5947e552ed765206c", + "9634a4f60ff14e7a8c1a8cff38ef9954", + "f7ca8116da184a6c89faa834e1d50b1b", + 
"535675fafe0644c7ace668fe263f8e03", + "5c8f17eec77b425f8f14a1ac9a8407ed", + "85b19f90c93748b0ba2ef5e936912456", + "309077bf93fe469f96bfc657ea5dd520", + "e0191f86888d4331a71009c62777dd87" + ] + }, + "id": "hZe6v82nW5wb", + "outputId": "9d532f04-4b0f-48a8-b544-9b62e1f5249b" + }, + "execution_count": 4, + "outputs": [ + { + "output_type": "stream", + "name": "stderr", + "text": [ + "/usr/local/lib/python3.10/dist-packages/torchvision/io/image.py:13: UserWarning: Failed to load image Python extension: '/usr/local/lib/python3.10/dist-packages/torchvision/image.so: undefined symbol: _ZN3c104cuda20CUDACachingAllocator9allocatorE'If you don't plan on using image functionality from `torchvision.io`, you can ignore this warning. Otherwise, there might be something wrong with your environment. Did you have `libjpeg` or `libpng` installed before building `torchvision` from source?\n", + " warn(\n" + ] + }, + { + "output_type": "stream", + "name": "stdout", + "text": [ + "Use 2 cpu cores for computing\n" + ] + }, + { + "output_type": "stream", + "name": "stderr", + "text": [ + "Downloading: \"https://dl.fbaipublicfiles.com/encodec/v0/encodec_24khz-d7cc33bc.th\" to /root/.cache/torch/hub/checkpoints/encodec_24khz-d7cc33bc.th\n" + ] + }, + { + "output_type": "display_data", + "data": { + "text/plain": [ + " 0%| | 0.00/88.9M [00:00" + ], + "text/html": [ + "
" + ] + }, + "metadata": {} + }, + { + "output_type": "execute_result", + "data": { + "text/plain": [] + }, + "metadata": {}, + "execution_count": 4 + } + ] + }, + { + "cell_type": "code", + "source": [], + "metadata": { + "id": "ozaZVeomaJAg" + }, + "execution_count": 4, + "outputs": [] + } + ] +} \ No newline at end of file