diff --git a/week1_06_question_answering_and_tts/practice_question_answering_and_tts.ipynb b/week1_06_question_answering_and_tts/practice_question_answering_and_tts.ipynb index 8ef668548..df3c322db 100644 --- a/week1_06_question_answering_and_tts/practice_question_answering_and_tts.ipynb +++ b/week1_06_question_answering_and_tts/practice_question_answering_and_tts.ipynb @@ -4,15 +4,14 @@ "metadata": { "accelerator": "GPU", "colab": { - "name": "Question Answering with a Fine-Tuned BERT.ipynb", + "name": "practice_question_answering_and_tts.ipynb", "provenance": [], - "collapsed_sections": [], - "toc_visible": true + "collapsed_sections": [] }, "kernelspec": { - "display_name": "Py3 bot", + "display_name": "Python 3 (ipykernel)", "language": "python", - "name": "py3_bot" + "name": "python3" }, "language_info": { "codemirror_mode": { @@ -24,363 +23,18 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.7.9" - }, - "widgets": { - "application/vnd.jupyter.widget-state+json": { - "019b4f79cede42e89bdf3b2f5047a3bf": { - "model_module": "@jupyter-widgets/controls", - "model_name": "HBoxModel", - "model_module_version": "1.5.0", - "state": { - "_view_name": "HBoxView", - "_dom_classes": [], - "_model_name": "HBoxModel", - "_view_module": "@jupyter-widgets/controls", - "_model_module_version": "1.5.0", - "_view_count": null, - "_view_module_version": "1.5.0", - "box_style": "", - "layout": "IPY_MODEL_934f348be42346bca1e374cec6f7acac", - "_model_module": "@jupyter-widgets/controls", - "children": [ - "IPY_MODEL_14686b543b9349119fc7cec9c0f60963", - "IPY_MODEL_bc8fb4da9de84df6ab7605b2b7d2d32f", - "IPY_MODEL_f25f21412946491ab11381dbe23cccd1" - ] - } - }, - "934f348be42346bca1e374cec6f7acac": { - "model_module": "@jupyter-widgets/base", - "model_name": "LayoutModel", - "model_module_version": "1.2.0", - "state": { - "_view_name": "LayoutView", - "grid_template_rows": null, - "right": null, - "justify_content": null, - 
"_view_module": "@jupyter-widgets/base", - "overflow": null, - "_model_module_version": "1.2.0", - "_view_count": null, - "flex_flow": null, - "width": null, - "min_width": null, - "border": null, - "align_items": null, - "bottom": null, - "_model_module": "@jupyter-widgets/base", - "top": null, - "grid_column": null, - "overflow_y": null, - "overflow_x": null, - "grid_auto_flow": null, - "grid_area": null, - "grid_template_columns": null, - "flex": null, - "_model_name": "LayoutModel", - "justify_items": null, - "grid_row": null, - "max_height": null, - "align_content": null, - "visibility": null, - "align_self": null, - "height": null, - "min_height": null, - "padding": null, - "grid_auto_rows": null, - "grid_gap": null, - "max_width": null, - "order": null, - "_view_module_version": "1.2.0", - "grid_template_areas": null, - "object_position": null, - "object_fit": null, - "grid_auto_columns": null, - "margin": null, - "display": null, - "left": null - } - }, - "14686b543b9349119fc7cec9c0f60963": { - "model_module": "@jupyter-widgets/controls", - "model_name": "HTMLModel", - "model_module_version": "1.5.0", - "state": { - "_view_name": "HTMLView", - "style": "IPY_MODEL_0fedb09e3c9d4a6eb47d08e4bc013e54", - "_dom_classes": [], - "description": "", - "_model_name": "HTMLModel", - "placeholder": "​", - "_view_module": "@jupyter-widgets/controls", - "_model_module_version": "1.5.0", - "value": "100%", - "_view_count": null, - "_view_module_version": "1.5.0", - "description_tooltip": null, - "_model_module": "@jupyter-widgets/controls", - "layout": "IPY_MODEL_ad07800df53e4feba295d0202e17bba9" - } - }, - "bc8fb4da9de84df6ab7605b2b7d2d32f": { - "model_module": "@jupyter-widgets/controls", - "model_name": "FloatProgressModel", - "model_module_version": "1.5.0", - "state": { - "_view_name": "ProgressView", - "style": "IPY_MODEL_87c33c91fc584bfbbfe6ea9a61e8b1b2", - "_dom_classes": [], - "description": "", - "_model_name": "FloatProgressModel", - "bar_style": "success", - 
"max": 142264026, - "_view_module": "@jupyter-widgets/controls", - "_model_module_version": "1.5.0", - "value": 142264026, - "_view_count": null, - "_view_module_version": "1.5.0", - "orientation": "horizontal", - "min": 0, - "description_tooltip": null, - "_model_module": "@jupyter-widgets/controls", - "layout": "IPY_MODEL_ad8a0ff477c94faa9a9d3ed4ca8fddf3" - } - }, - "f25f21412946491ab11381dbe23cccd1": { - "model_module": "@jupyter-widgets/controls", - "model_name": "HTMLModel", - "model_module_version": "1.5.0", - "state": { - "_view_name": "HTMLView", - "style": "IPY_MODEL_7b11de7d759d490791097ef1019848f3", - "_dom_classes": [], - "description": "", - "_model_name": "HTMLModel", - "placeholder": "​", - "_view_module": "@jupyter-widgets/controls", - "_model_module_version": "1.5.0", - "value": " 136M/136M [00:01<00:00, 83.3MB/s]", - "_view_count": null, - "_view_module_version": "1.5.0", - "description_tooltip": null, - "_model_module": "@jupyter-widgets/controls", - "layout": "IPY_MODEL_ad6595b0760144d8899f6a2e1d41ed24" - } - }, - "0fedb09e3c9d4a6eb47d08e4bc013e54": { - "model_module": "@jupyter-widgets/controls", - "model_name": "DescriptionStyleModel", - "model_module_version": "1.5.0", - "state": { - "_view_name": "StyleView", - "_model_name": "DescriptionStyleModel", - "description_width": "", - "_view_module": "@jupyter-widgets/base", - "_model_module_version": "1.5.0", - "_view_count": null, - "_view_module_version": "1.2.0", - "_model_module": "@jupyter-widgets/controls" - } - }, - "ad07800df53e4feba295d0202e17bba9": { - "model_module": "@jupyter-widgets/base", - "model_name": "LayoutModel", - "model_module_version": "1.2.0", - "state": { - "_view_name": "LayoutView", - "grid_template_rows": null, - "right": null, - "justify_content": null, - "_view_module": "@jupyter-widgets/base", - "overflow": null, - "_model_module_version": "1.2.0", - "_view_count": null, - "flex_flow": null, - "width": null, - "min_width": null, - "border": null, - "align_items": 
null, - "bottom": null, - "_model_module": "@jupyter-widgets/base", - "top": null, - "grid_column": null, - "overflow_y": null, - "overflow_x": null, - "grid_auto_flow": null, - "grid_area": null, - "grid_template_columns": null, - "flex": null, - "_model_name": "LayoutModel", - "justify_items": null, - "grid_row": null, - "max_height": null, - "align_content": null, - "visibility": null, - "align_self": null, - "height": null, - "min_height": null, - "padding": null, - "grid_auto_rows": null, - "grid_gap": null, - "max_width": null, - "order": null, - "_view_module_version": "1.2.0", - "grid_template_areas": null, - "object_position": null, - "object_fit": null, - "grid_auto_columns": null, - "margin": null, - "display": null, - "left": null - } - }, - "87c33c91fc584bfbbfe6ea9a61e8b1b2": { - "model_module": "@jupyter-widgets/controls", - "model_name": "ProgressStyleModel", - "model_module_version": "1.5.0", - "state": { - "_view_name": "StyleView", - "_model_name": "ProgressStyleModel", - "description_width": "", - "_view_module": "@jupyter-widgets/base", - "_model_module_version": "1.5.0", - "_view_count": null, - "_view_module_version": "1.2.0", - "bar_color": null, - "_model_module": "@jupyter-widgets/controls" - } - }, - "ad8a0ff477c94faa9a9d3ed4ca8fddf3": { - "model_module": "@jupyter-widgets/base", - "model_name": "LayoutModel", - "model_module_version": "1.2.0", - "state": { - "_view_name": "LayoutView", - "grid_template_rows": null, - "right": null, - "justify_content": null, - "_view_module": "@jupyter-widgets/base", - "overflow": null, - "_model_module_version": "1.2.0", - "_view_count": null, - "flex_flow": null, - "width": null, - "min_width": null, - "border": null, - "align_items": null, - "bottom": null, - "_model_module": "@jupyter-widgets/base", - "top": null, - "grid_column": null, - "overflow_y": null, - "overflow_x": null, - "grid_auto_flow": null, - "grid_area": null, - "grid_template_columns": null, - "flex": null, - "_model_name": 
"LayoutModel", - "justify_items": null, - "grid_row": null, - "max_height": null, - "align_content": null, - "visibility": null, - "align_self": null, - "height": null, - "min_height": null, - "padding": null, - "grid_auto_rows": null, - "grid_gap": null, - "max_width": null, - "order": null, - "_view_module_version": "1.2.0", - "grid_template_areas": null, - "object_position": null, - "object_fit": null, - "grid_auto_columns": null, - "margin": null, - "display": null, - "left": null - } - }, - "7b11de7d759d490791097ef1019848f3": { - "model_module": "@jupyter-widgets/controls", - "model_name": "DescriptionStyleModel", - "model_module_version": "1.5.0", - "state": { - "_view_name": "StyleView", - "_model_name": "DescriptionStyleModel", - "description_width": "", - "_view_module": "@jupyter-widgets/base", - "_model_module_version": "1.5.0", - "_view_count": null, - "_view_module_version": "1.2.0", - "_model_module": "@jupyter-widgets/controls" - } - }, - "ad6595b0760144d8899f6a2e1d41ed24": { - "model_module": "@jupyter-widgets/base", - "model_name": "LayoutModel", - "model_module_version": "1.2.0", - "state": { - "_view_name": "LayoutView", - "grid_template_rows": null, - "right": null, - "justify_content": null, - "_view_module": "@jupyter-widgets/base", - "overflow": null, - "_model_module_version": "1.2.0", - "_view_count": null, - "flex_flow": null, - "width": null, - "min_width": null, - "border": null, - "align_items": null, - "bottom": null, - "_model_module": "@jupyter-widgets/base", - "top": null, - "grid_column": null, - "overflow_y": null, - "overflow_x": null, - "grid_auto_flow": null, - "grid_area": null, - "grid_template_columns": null, - "flex": null, - "_model_name": "LayoutModel", - "justify_items": null, - "grid_row": null, - "max_height": null, - "align_content": null, - "visibility": null, - "align_self": null, - "height": null, - "min_height": null, - "padding": null, - "grid_auto_rows": null, - "grid_gap": null, - "max_width": null, - "order": 
null, - "_view_module_version": "1.2.0", - "grid_template_areas": null, - "object_position": null, - "object_fit": null, - "grid_auto_columns": null, - "margin": null, - "display": null, - "left": null - } - } - } + "version": "3.9.7" } }, "cells": [ { "cell_type": "markdown", "metadata": { - "id": "W-1zl5XdYInf" + "id": "DphyQXreodzp" }, "source": [ - "## Practice: Question Answering with a Fine-Tuned BERT (and TTS example)\n", + "# Practice: Question Answering with a Fine-Tuned BERT (and TTS example)\n", + "\n", "This notebook is based on great [post and corresponding notebook](https://mccormickml.com/2020/03/10/question-answering-with-a-fine-tuned-BERT/) *by Chris McCormick*. It contains some minor changes and additions (especially parts 3 and 4)." ] }, @@ -396,11 +50,9 @@ "\n", "**Part 2** contains example code--we'll be downloading a model that's *already been fine-tuned* for question answering, and try it out on our own text! \n", "\n", - "For something like text classification, you definitely want to fine-tune BERT on your own dataset. For question answering, however, it seems like you may be able to get decent results using a model that's already been fine-tuned on the SQuAD benchmark. In this Notebook, we'll do exactly that, and see that it performs well on text that wasn't in the SQuAD dataset.\n", - "\n", "In **Part 3** we will apply the same approach to Russian language using the model pre-trained on SberQuAD dataset.\n", "\n", - "And in **Part 4** we will generate question and answer as audio (for now in English).\n", + "And in **Part 4** and **Part 5** we will generate the question and answer as audio in English and Russian.\n", "\n", "**Links**\n", "\n", @@ -409,632 +61,51 @@ "* The [original Colab Notebook](https://colab.research.google.com/drive/1uSlWtJdZmLrI3FCNIlUHFxwAJiSu2J0-)." 
] }, - { - "cell_type": "markdown", - "metadata": { - "id": "EQ4-_Rsy7rRJ" - }, - "source": [ - "*If running on colab, uncomment the following cell*" - ] - }, - { - "cell_type": "code", - "metadata": { - "id": "-5uC3kgC7rRK", - "outputId": "7560e890-ffea-4b91-96ed-4e13f5584c0b", - "colab": { - "base_uri": "https://localhost:8080/", - "height": 1000 - } - }, - "source": [ - "!pip uninstall -y tensorflow tensorflow-gpu\n", - "!pip install numpy scipy librosa unidecode inflect librosa transformers\n", - "!pip install deeppavlov" - ], - "execution_count": 1, - "outputs": [ - { - "output_type": "stream", - "name": "stdout", - "text": [ - "Found existing installation: tensorflow 2.6.0\n", - "Uninstalling tensorflow-2.6.0:\n", - " Successfully uninstalled tensorflow-2.6.0\n", - "\u001b[33mWARNING: Skipping tensorflow-gpu as it is not installed.\u001b[0m\n", - "Requirement already satisfied: numpy in /usr/local/lib/python3.7/dist-packages (1.19.5)\n", - "Requirement already satisfied: scipy in /usr/local/lib/python3.7/dist-packages (1.4.1)\n", - "Requirement already satisfied: librosa in /usr/local/lib/python3.7/dist-packages (0.8.1)\n", - "Collecting unidecode\n", - " Downloading Unidecode-1.3.2-py3-none-any.whl (235 kB)\n", - "\u001b[K |████████████████████████████████| 235 kB 11.2 MB/s \n", - "\u001b[?25hRequirement already satisfied: inflect in /usr/local/lib/python3.7/dist-packages (2.1.0)\n", - "Collecting transformers\n", - " Downloading transformers-4.11.3-py3-none-any.whl (2.9 MB)\n", - "\u001b[K |████████████████████████████████| 2.9 MB 45.6 MB/s \n", - "\u001b[?25hRequirement already satisfied: pooch>=1.0 in /usr/local/lib/python3.7/dist-packages (from librosa) (1.5.1)\n", - "Requirement already satisfied: scikit-learn!=0.19.0,>=0.14.0 in /usr/local/lib/python3.7/dist-packages (from librosa) (0.22.2.post1)\n", - "Requirement already satisfied: audioread>=2.0.0 in /usr/local/lib/python3.7/dist-packages (from librosa) (2.1.9)\n", - "Requirement already satisfied: 
packaging>=20.0 in /usr/local/lib/python3.7/dist-packages (from librosa) (21.0)\n", - "Requirement already satisfied: decorator>=3.0.0 in /usr/local/lib/python3.7/dist-packages (from librosa) (4.4.2)\n", - "Requirement already satisfied: soundfile>=0.10.2 in /usr/local/lib/python3.7/dist-packages (from librosa) (0.10.3.post1)\n", - "Requirement already satisfied: joblib>=0.14 in /usr/local/lib/python3.7/dist-packages (from librosa) (1.0.1)\n", - "Requirement already satisfied: resampy>=0.2.2 in /usr/local/lib/python3.7/dist-packages (from librosa) (0.2.2)\n", - "Requirement already satisfied: numba>=0.43.0 in /usr/local/lib/python3.7/dist-packages (from librosa) (0.51.2)\n", - "Requirement already satisfied: setuptools in /usr/local/lib/python3.7/dist-packages (from numba>=0.43.0->librosa) (57.4.0)\n", - "Requirement already satisfied: llvmlite<0.35,>=0.34.0.dev0 in /usr/local/lib/python3.7/dist-packages (from numba>=0.43.0->librosa) (0.34.0)\n", - "Requirement already satisfied: pyparsing>=2.0.2 in /usr/local/lib/python3.7/dist-packages (from packaging>=20.0->librosa) (2.4.7)\n", - "Requirement already satisfied: requests in /usr/local/lib/python3.7/dist-packages (from pooch>=1.0->librosa) (2.23.0)\n", - "Requirement already satisfied: appdirs in /usr/local/lib/python3.7/dist-packages (from pooch>=1.0->librosa) (1.4.4)\n", - "Requirement already satisfied: six>=1.3 in /usr/local/lib/python3.7/dist-packages (from resampy>=0.2.2->librosa) (1.15.0)\n", - "Requirement already satisfied: cffi>=1.0 in /usr/local/lib/python3.7/dist-packages (from soundfile>=0.10.2->librosa) (1.14.6)\n", - "Requirement already satisfied: pycparser in /usr/local/lib/python3.7/dist-packages (from cffi>=1.0->soundfile>=0.10.2->librosa) (2.20)\n", - "Collecting huggingface-hub>=0.0.17\n", - " Downloading huggingface_hub-0.0.19-py3-none-any.whl (56 kB)\n", - "\u001b[K |████████████████████████████████| 56 kB 4.1 MB/s \n", - "\u001b[?25hCollecting tokenizers<0.11,>=0.10.1\n", - " Downloading 
tokenizers-0.10.3-cp37-cp37m-manylinux_2_5_x86_64.manylinux1_x86_64.manylinux_2_12_x86_64.manylinux2010_x86_64.whl (3.3 MB)\n", - "\u001b[K |████████████████████████████████| 3.3 MB 37.3 MB/s \n", - "\u001b[?25hRequirement already satisfied: tqdm>=4.27 in /usr/local/lib/python3.7/dist-packages (from transformers) (4.62.3)\n", - "Collecting pyyaml>=5.1\n", - " Downloading PyYAML-6.0-cp37-cp37m-manylinux_2_5_x86_64.manylinux1_x86_64.manylinux_2_12_x86_64.manylinux2010_x86_64.whl (596 kB)\n", - "\u001b[K |████████████████████████████████| 596 kB 46.1 MB/s \n", - "\u001b[?25hRequirement already satisfied: regex!=2019.12.17 in /usr/local/lib/python3.7/dist-packages (from transformers) (2019.12.20)\n", - "Collecting sacremoses\n", - " Downloading sacremoses-0.0.46-py3-none-any.whl (895 kB)\n", - "\u001b[K |████████████████████████████████| 895 kB 46.2 MB/s \n", - "\u001b[?25hRequirement already satisfied: filelock in /usr/local/lib/python3.7/dist-packages (from transformers) (3.3.0)\n", - "Requirement already satisfied: importlib-metadata in /usr/local/lib/python3.7/dist-packages (from transformers) (4.8.1)\n", - "Requirement already satisfied: typing-extensions in /usr/local/lib/python3.7/dist-packages (from huggingface-hub>=0.0.17->transformers) (3.7.4.3)\n", - "Requirement already satisfied: zipp>=0.5 in /usr/local/lib/python3.7/dist-packages (from importlib-metadata->transformers) (3.6.0)\n", - "Requirement already satisfied: chardet<4,>=3.0.2 in /usr/local/lib/python3.7/dist-packages (from requests->pooch>=1.0->librosa) (3.0.4)\n", - "Requirement already satisfied: urllib3!=1.25.0,!=1.25.1,<1.26,>=1.21.1 in /usr/local/lib/python3.7/dist-packages (from requests->pooch>=1.0->librosa) (1.24.3)\n", - "Requirement already satisfied: idna<3,>=2.5 in /usr/local/lib/python3.7/dist-packages (from requests->pooch>=1.0->librosa) (2.10)\n", - "Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.7/dist-packages (from requests->pooch>=1.0->librosa) 
(2021.5.30)\n", - "Requirement already satisfied: click in /usr/local/lib/python3.7/dist-packages (from sacremoses->transformers) (7.1.2)\n", - "Installing collected packages: pyyaml, tokenizers, sacremoses, huggingface-hub, unidecode, transformers\n", - " Attempting uninstall: pyyaml\n", - " Found existing installation: PyYAML 3.13\n", - " Uninstalling PyYAML-3.13:\n", - " Successfully uninstalled PyYAML-3.13\n", - "Successfully installed huggingface-hub-0.0.19 pyyaml-6.0 sacremoses-0.0.46 tokenizers-0.10.3 transformers-4.11.3 unidecode-1.3.2\n", - "Collecting deeppavlov\n", - " Downloading deeppavlov-0.17.1-py3-none-any.whl (929 kB)\n", - "\u001b[K |████████████████████████████████| 929 kB 12.4 MB/s \n", - "\u001b[?25hCollecting fastapi==0.47.1\n", - " Downloading fastapi-0.47.1-py3-none-any.whl (43 kB)\n", - "\u001b[K |████████████████████████████████| 43 kB 1.8 MB/s \n", - "\u001b[?25hCollecting pytelegrambotapi==3.6.7\n", - " Downloading pyTelegramBotAPI-3.6.7.tar.gz (65 kB)\n", - "\u001b[K |████████████████████████████████| 65 kB 4.3 MB/s \n", - "\u001b[?25hCollecting uvicorn==0.11.7\n", - " Downloading uvicorn-0.11.7-py3-none-any.whl (43 kB)\n", - "\u001b[K |████████████████████████████████| 43 kB 1.9 MB/s \n", - "\u001b[?25hCollecting overrides==2.7.0\n", - " Downloading overrides-2.7.0.tar.gz (4.5 kB)\n", - "Collecting uvloop==0.14.0\n", - " Downloading uvloop-0.14.0-cp37-cp37m-manylinux2010_x86_64.whl (3.8 MB)\n", - "\u001b[K |████████████████████████████████| 3.8 MB 33.7 MB/s \n", - "\u001b[?25hCollecting pandas==0.25.3\n", - " Downloading pandas-0.25.3-cp37-cp37m-manylinux1_x86_64.whl (10.4 MB)\n", - "\u001b[K |████████████████████████████████| 10.4 MB 47.3 MB/s \n", - "\u001b[?25hCollecting requests==2.22.0\n", - " Downloading requests-2.22.0-py2.py3-none-any.whl (57 kB)\n", - "\u001b[K |████████████████████████████████| 57 kB 5.1 MB/s \n", - "\u001b[?25hCollecting sacremoses==0.0.35\n", - " Downloading sacremoses-0.0.35.tar.gz (859 kB)\n", - "\u001b[K 
|████████████████████████████████| 859 kB 54.4 MB/s \n", - "\u001b[?25hCollecting pydantic==1.3\n", - " Downloading pydantic-1.3-cp37-cp37m-manylinux2010_x86_64.whl (7.3 MB)\n", - "\u001b[K |████████████████████████████████| 7.3 MB 24.8 MB/s \n", - "\u001b[?25hCollecting scikit-learn==0.21.2\n", - " Downloading scikit_learn-0.21.2-cp37-cp37m-manylinux1_x86_64.whl (6.7 MB)\n", - "\u001b[K |████████████████████████████████| 6.7 MB 17.7 MB/s \n", - "\u001b[?25hCollecting pytz==2019.1\n", - " Downloading pytz-2019.1-py2.py3-none-any.whl (510 kB)\n", - "\u001b[K |████████████████████████████████| 510 kB 50.0 MB/s \n", - "\u001b[?25hCollecting h5py==2.10.0\n", - " Downloading h5py-2.10.0-cp37-cp37m-manylinux1_x86_64.whl (2.9 MB)\n", - "\u001b[K |████████████████████████████████| 2.9 MB 47.0 MB/s \n", - "\u001b[?25hRequirement already satisfied: scipy==1.4.1 in /usr/local/lib/python3.7/dist-packages (from deeppavlov) (1.4.1)\n", - "Collecting tqdm==4.62.0\n", - " Downloading tqdm-4.62.0-py2.py3-none-any.whl (76 kB)\n", - "\u001b[K |████████████████████████████████| 76 kB 4.1 MB/s \n", - "\u001b[?25hCollecting filelock==3.0.12\n", - " Downloading filelock-3.0.12-py3-none-any.whl (7.6 kB)\n", - "Collecting pyopenssl==19.1.0\n", - " Downloading pyOpenSSL-19.1.0-py2.py3-none-any.whl (53 kB)\n", - "\u001b[K |████████████████████████████████| 53 kB 2.2 MB/s \n", - "\u001b[?25hCollecting nltk==3.4.5\n", - " Downloading nltk-3.4.5.zip (1.5 MB)\n", - "\u001b[K |████████████████████████████████| 1.5 MB 41.5 MB/s \n", - "\u001b[?25hCollecting aio-pika==6.4.1\n", - " Downloading aio_pika-6.4.1-py3-none-any.whl (40 kB)\n", - "\u001b[K |████████████████████████████████| 40 kB 18 kB/s \n", - "\u001b[?25hCollecting ruamel.yaml==0.15.100\n", - " Downloading ruamel.yaml-0.15.100-cp37-cp37m-manylinux1_x86_64.whl (654 kB)\n", - "\u001b[K |████████████████████████████████| 654 kB 39.6 MB/s \n", - "\u001b[?25hCollecting prometheus-client==0.7.1\n", - " Downloading 
prometheus_client-0.7.1.tar.gz (38 kB)\n", - "Requirement already satisfied: click==7.1.2 in /usr/local/lib/python3.7/dist-packages (from deeppavlov) (7.1.2)\n", - "Collecting pymorphy2-dicts-ru\n", - " Downloading pymorphy2_dicts_ru-2.4.417127.4579844-py2.py3-none-any.whl (8.2 MB)\n", - "\u001b[K |████████████████████████████████| 8.2 MB 22.3 MB/s \n", - "\u001b[?25hCollecting Cython==0.29.14\n", - " Downloading Cython-0.29.14-cp37-cp37m-manylinux1_x86_64.whl (2.1 MB)\n", - "\u001b[K |████████████████████████████████| 2.1 MB 42.2 MB/s \n", - "\u001b[?25hCollecting rusenttokenize==0.0.5\n", - " Downloading rusenttokenize-0.0.5-py3-none-any.whl (10 kB)\n", - "Collecting pymorphy2==0.8\n", - " Downloading pymorphy2-0.8-py2.py3-none-any.whl (46 kB)\n", - "\u001b[K |████████████████████████████████| 46 kB 3.4 MB/s \n", - "\u001b[?25hCollecting numpy==1.18.0\n", - " Downloading numpy-1.18.0-cp37-cp37m-manylinux1_x86_64.whl (20.1 MB)\n", - "\u001b[K |████████████████████████████████| 20.1 MB 53.8 MB/s \n", - "\u001b[?25hCollecting yarl\n", - " Downloading yarl-1.7.0-cp37-cp37m-manylinux_2_5_x86_64.manylinux1_x86_64.manylinux_2_12_x86_64.manylinux2010_x86_64.whl (271 kB)\n", - "\u001b[K |████████████████████████████████| 271 kB 51.7 MB/s \n", - "\u001b[?25hCollecting aiormq<4,>=3.2.0\n", - " Downloading aiormq-3.3.1-py3-none-any.whl (28 kB)\n", - "Collecting starlette<=0.12.9,>=0.12.9\n", - " Downloading starlette-0.12.9.tar.gz (46 kB)\n", - "\u001b[K |████████████████████████████████| 46 kB 3.2 MB/s \n", - "\u001b[?25hRequirement already satisfied: six in /usr/local/lib/python3.7/dist-packages (from h5py==2.10.0->deeppavlov) (1.15.0)\n", - "Requirement already satisfied: python-dateutil>=2.6.1 in /usr/local/lib/python3.7/dist-packages (from pandas==0.25.3->deeppavlov) (2.8.2)\n", - "Collecting dawg-python>=0.7\n", - " Downloading DAWG_Python-0.7.2-py2.py3-none-any.whl (11 kB)\n", - "Requirement already satisfied: docopt>=0.6 in /usr/local/lib/python3.7/dist-packages 
(from pymorphy2==0.8->deeppavlov) (0.6.2)\n", - "Collecting pymorphy2-dicts<3.0,>=2.4\n", - " Downloading pymorphy2_dicts-2.4.393442.3710985-py2.py3-none-any.whl (7.1 MB)\n", - "\u001b[K |████████████████████████████████| 7.1 MB 24.1 MB/s \n", - "\u001b[?25hCollecting cryptography>=2.8\n", - " Downloading cryptography-35.0.0-cp36-abi3-manylinux_2_24_x86_64.whl (3.5 MB)\n", - "\u001b[K |████████████████████████████████| 3.5 MB 41.5 MB/s \n", - "\u001b[?25hCollecting idna<2.9,>=2.5\n", - " Downloading idna-2.8-py2.py3-none-any.whl (58 kB)\n", - "\u001b[K |████████████████████████████████| 58 kB 6.1 MB/s \n", - "\u001b[?25hRequirement already satisfied: urllib3!=1.25.0,!=1.25.1,<1.26,>=1.21.1 in /usr/local/lib/python3.7/dist-packages (from requests==2.22.0->deeppavlov) (1.24.3)\n", - "Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.7/dist-packages (from requests==2.22.0->deeppavlov) (2021.5.30)\n", - "Requirement already satisfied: chardet<3.1.0,>=3.0.2 in /usr/local/lib/python3.7/dist-packages (from requests==2.22.0->deeppavlov) (3.0.4)\n", - "Requirement already satisfied: joblib in /usr/local/lib/python3.7/dist-packages (from sacremoses==0.0.35->deeppavlov) (1.0.1)\n", - "Collecting httptools==0.1.*\n", - " Downloading httptools-0.1.2-cp37-cp37m-manylinux1_x86_64.whl (219 kB)\n", - "\u001b[K |████████████████████████████████| 219 kB 32.7 MB/s \n", - "\u001b[?25hCollecting h11<0.10,>=0.8\n", - " Downloading h11-0.9.0-py2.py3-none-any.whl (53 kB)\n", - "\u001b[K |████████████████████████████████| 53 kB 2.2 MB/s \n", - "\u001b[?25hCollecting websockets==8.*\n", - " Downloading websockets-8.1-cp37-cp37m-manylinux2010_x86_64.whl (79 kB)\n", - "\u001b[K |████████████████████████████████| 79 kB 7.8 MB/s \n", - "\u001b[?25hCollecting pamqp==2.3.0\n", - " Downloading pamqp-2.3.0-py2.py3-none-any.whl (28 kB)\n", - "Requirement already satisfied: cffi>=1.12 in /usr/local/lib/python3.7/dist-packages (from 
cryptography>=2.8->pyopenssl==19.1.0->deeppavlov) (1.14.6)\n", - "Requirement already satisfied: pycparser in /usr/local/lib/python3.7/dist-packages (from cffi>=1.12->cryptography>=2.8->pyopenssl==19.1.0->deeppavlov) (2.20)\n", - "Requirement already satisfied: typing-extensions>=3.7.4 in /usr/local/lib/python3.7/dist-packages (from yarl->aio-pika==6.4.1->deeppavlov) (3.7.4.3)\n", - "Collecting multidict>=4.0\n", - " Downloading multidict-5.2.0-cp37-cp37m-manylinux_2_5_x86_64.manylinux1_x86_64.manylinux_2_12_x86_64.manylinux2010_x86_64.whl (160 kB)\n", - "\u001b[K |████████████████████████████████| 160 kB 49.6 MB/s \n", - "\u001b[?25hBuilding wheels for collected packages: nltk, overrides, prometheus-client, pytelegrambotapi, sacremoses, starlette\n", - " Building wheel for nltk (setup.py) ... \u001b[?25l\u001b[?25hdone\n", - " Created wheel for nltk: filename=nltk-3.4.5-py3-none-any.whl size=1449922 sha256=b535ba891e5af09414ccded1641b6e86ca64e8d3e8219d9cb8f0ba15872f83af\n", - " Stored in directory: /root/.cache/pip/wheels/48/8b/7f/473521e0c731c6566d631b281f323842bbda9bd819eb9a3ead\n", - " Building wheel for overrides (setup.py) ... \u001b[?25l\u001b[?25hdone\n", - " Created wheel for overrides: filename=overrides-2.7.0-py3-none-any.whl size=5605 sha256=f35d81cf19d4ea2d5df0e1979e861ab029240bf285e1fff1e58b2e04d356cca9\n", - " Stored in directory: /root/.cache/pip/wheels/c9/87/45/bfdacf6c3b8233b6e8d519edcbd1cf297ad5ff5f0bf84bb9c1\n", - " Building wheel for prometheus-client (setup.py) ... \u001b[?25l\u001b[?25hdone\n", - " Created wheel for prometheus-client: filename=prometheus_client-0.7.1-py3-none-any.whl size=41404 sha256=78963bdfe71b742101d3fc6aade52c3de5465dbc90d2ae272f728e1e56ca010c\n", - " Stored in directory: /root/.cache/pip/wheels/30/0c/26/59ba285bf65dc79d195e9b25e2ddde4c61070422729b0cd914\n", - " Building wheel for pytelegrambotapi (setup.py) ... 
\u001b[?25l\u001b[?25hdone\n", - " Created wheel for pytelegrambotapi: filename=pyTelegramBotAPI-3.6.7-py3-none-any.whl size=47176 sha256=8067d09e771447680123cd23fdded8909a014c3b8aa5c9e4a569f7d5e9e62eb1\n", - " Stored in directory: /root/.cache/pip/wheels/7f/7c/54/8eddf2369ef1b9190e2ee6dc2b40df54b6c65529a38790fdd4\n", - " Building wheel for sacremoses (setup.py) ... \u001b[?25l\u001b[?25hdone\n", - " Created wheel for sacremoses: filename=sacremoses-0.0.35-py3-none-any.whl size=883989 sha256=1a5b249c82615565091d0ec58a31c47612d7a54454a17a7ee640ce35ba93cbc9\n", - " Stored in directory: /root/.cache/pip/wheels/d1/ff/0e/e00ff1e22100702ac8b24e709551ae0fb29db9ffc843510a64\n", - " Building wheel for starlette (setup.py) ... \u001b[?25l\u001b[?25hdone\n", - " Created wheel for starlette: filename=starlette-0.12.9-py3-none-any.whl size=57251 sha256=bfa1618898c82f0be44db86e36f0a0e360ac6dcc41818d9bb614c8f46526f307\n", - " Stored in directory: /root/.cache/pip/wheels/e8/78/be/f57ed5aed7cd222abdb24e3186b5c9f1074184fcc0a295102b\n", - "Successfully built nltk overrides prometheus-client pytelegrambotapi sacremoses starlette\n", - "Installing collected packages: multidict, idna, yarl, pamqp, numpy, websockets, uvloop, tqdm, starlette, requests, pytz, pymorphy2-dicts, pydantic, httptools, h11, dawg-python, cryptography, aiormq, uvicorn, scikit-learn, sacremoses, rusenttokenize, ruamel.yaml, pytelegrambotapi, pyopenssl, pymorphy2-dicts-ru, pymorphy2, prometheus-client, pandas, overrides, nltk, h5py, filelock, fastapi, Cython, aio-pika, deeppavlov\n", - " Attempting uninstall: idna\n", - " Found existing installation: idna 2.10\n", - " Uninstalling idna-2.10:\n", - " Successfully uninstalled idna-2.10\n", - " Attempting uninstall: numpy\n", - " Found existing installation: numpy 1.19.5\n", - " Uninstalling numpy-1.19.5:\n", - " Successfully uninstalled numpy-1.19.5\n", - " Attempting uninstall: tqdm\n", - " Found existing installation: tqdm 4.62.3\n", - " Uninstalling 
tqdm-4.62.3:\n", - " Successfully uninstalled tqdm-4.62.3\n", - " Attempting uninstall: requests\n", - " Found existing installation: requests 2.23.0\n", - " Uninstalling requests-2.23.0:\n", - " Successfully uninstalled requests-2.23.0\n", - " Attempting uninstall: pytz\n", - " Found existing installation: pytz 2018.9\n", - " Uninstalling pytz-2018.9:\n", - " Successfully uninstalled pytz-2018.9\n", - " Attempting uninstall: scikit-learn\n", - " Found existing installation: scikit-learn 0.22.2.post1\n", - " Uninstalling scikit-learn-0.22.2.post1:\n", - " Successfully uninstalled scikit-learn-0.22.2.post1\n", - " Attempting uninstall: sacremoses\n", - " Found existing installation: sacremoses 0.0.46\n", - " Uninstalling sacremoses-0.0.46:\n", - " Successfully uninstalled sacremoses-0.0.46\n", - " Attempting uninstall: prometheus-client\n", - " Found existing installation: prometheus-client 0.11.0\n", - " Uninstalling prometheus-client-0.11.0:\n", - " Successfully uninstalled prometheus-client-0.11.0\n", - " Attempting uninstall: pandas\n", - " Found existing installation: pandas 1.1.5\n", - " Uninstalling pandas-1.1.5:\n", - " Successfully uninstalled pandas-1.1.5\n", - " Attempting uninstall: nltk\n", - " Found existing installation: nltk 3.2.5\n", - " Uninstalling nltk-3.2.5:\n", - " Successfully uninstalled nltk-3.2.5\n", - " Attempting uninstall: h5py\n", - " Found existing installation: h5py 3.1.0\n", - " Uninstalling h5py-3.1.0:\n", - " Successfully uninstalled h5py-3.1.0\n", - " Attempting uninstall: filelock\n", - " Found existing installation: filelock 3.3.0\n", - " Uninstalling filelock-3.3.0:\n", - " Successfully uninstalled filelock-3.3.0\n", - " Attempting uninstall: Cython\n", - " Found existing installation: Cython 0.29.24\n", - " Uninstalling Cython-0.29.24:\n", - " Successfully uninstalled Cython-0.29.24\n", - "\u001b[31mERROR: pip's dependency resolver does not currently take into account all the packages that are installed. 
This behaviour is the source of the following dependency conflicts.\n", - "kapre 0.3.5 requires tensorflow>=2.0.0, which is not installed.\n", - "xarray 0.18.2 requires pandas>=1.0, but you have pandas 0.25.3 which is incompatible.\n", - "kapre 0.3.5 requires numpy>=1.18.5, but you have numpy 1.18.0 which is incompatible.\n", - "google-colab 1.0.0 requires pandas~=1.1.0; python_version >= \"3.0\", but you have pandas 0.25.3 which is incompatible.\n", - "google-colab 1.0.0 requires requests~=2.23.0, but you have requests 2.22.0 which is incompatible.\n", - "fbprophet 0.7.1 requires pandas>=1.0.4, but you have pandas 0.25.3 which is incompatible.\n", - "datascience 0.10.6 requires folium==0.2.1, but you have folium 0.8.3 which is incompatible.\n", - "albumentations 0.1.12 requires imgaug<0.2.7,>=0.2.5, but you have imgaug 0.2.9 which is incompatible.\u001b[0m\n", - "Successfully installed Cython-0.29.14 aio-pika-6.4.1 aiormq-3.3.1 cryptography-35.0.0 dawg-python-0.7.2 deeppavlov-0.17.1 fastapi-0.47.1 filelock-3.0.12 h11-0.9.0 h5py-2.10.0 httptools-0.1.2 idna-2.8 multidict-5.2.0 nltk-3.4.5 numpy-1.18.0 overrides-2.7.0 pamqp-2.3.0 pandas-0.25.3 prometheus-client-0.7.1 pydantic-1.3 pymorphy2-0.8 pymorphy2-dicts-2.4.393442.3710985 pymorphy2-dicts-ru-2.4.417127.4579844 pyopenssl-19.1.0 pytelegrambotapi-3.6.7 pytz-2019.1 requests-2.22.0 ruamel.yaml-0.15.100 rusenttokenize-0.0.5 sacremoses-0.0.35 scikit-learn-0.21.2 starlette-0.12.9 tqdm-4.62.0 uvicorn-0.11.7 uvloop-0.14.0 websockets-8.1 yarl-1.7.0\n" - ] - }, - { - "output_type": "display_data", - "data": { - "application/vnd.colab-display-data+json": { - "pip_warning": { - "packages": [ - "numpy", - "pandas", - "pytz" - ] - } - } - }, - "metadata": {} - } - ] - }, - { - "cell_type": "code", - "metadata": { - "id": "8u4iQePy7rRL", - "outputId": "ef608de1-efd4-46d5-eb90-081a44c53fde", - "colab": { - "base_uri": "https://localhost:8080/" - } - }, - "source": [ - "!python -m deeppavlov install squad_ru_rubert" - ], - 
"execution_count": 2, - "outputs": [ - { - "output_type": "stream", - "name": "stdout", - "text": [ - "2021-10-14 22:33:40.165 INFO in 'deeppavlov.core.common.file'['file'] at line 32: Interpreting 'squad_ru_rubert' as '/usr/local/lib/python3.7/dist-packages/deeppavlov/configs/squad/squad_ru_rubert.json'\n", - "Collecting git+https://github.com/deepmipt/bert.git@feat/multi_gpu\n", - " Cloning https://github.com/deepmipt/bert.git (to revision feat/multi_gpu) to /tmp/pip-req-build-ftxsdnuo\n", - " Running command git clone -q https://github.com/deepmipt/bert.git /tmp/pip-req-build-ftxsdnuo\n", - "Building wheels for collected packages: bert-dp\n", - " Building wheel for bert-dp (setup.py) ... \u001b[?25l\u001b[?25hdone\n", - " Created wheel for bert-dp: filename=bert_dp-1.0-py3-none-any.whl size=23591 sha256=13ea88229fd57bab42fb565a3b7f876500637c40b390c4ee78bb0bcf23a25756\n", - " Stored in directory: /tmp/pip-ephem-wheel-cache-x4j2jdpe/wheels/44/29/b2/ee614cb7f97ba5c2d220029eaede3af4b74331ad31d6e2f4eb\n", - "Successfully built bert-dp\n", - "Installing collected packages: bert-dp\n", - "Successfully installed bert-dp-1.0\n", - "Collecting tensorflow==1.15.5\n", - " Downloading tensorflow-1.15.5-cp37-cp37m-manylinux2010_x86_64.whl (110.5 MB)\n", - "\u001b[K |████████████████████████████████| 110.5 MB 753 bytes/s \n", - "\u001b[?25hRequirement already satisfied: wheel>=0.26 in /usr/local/lib/python3.7/dist-packages (from tensorflow==1.15.5) (0.37.0)\n", - "Requirement already satisfied: absl-py>=0.7.0 in /usr/local/lib/python3.7/dist-packages (from tensorflow==1.15.5) (0.12.0)\n", - "Requirement already satisfied: protobuf>=3.6.1 in /usr/local/lib/python3.7/dist-packages (from tensorflow==1.15.5) (3.17.3)\n", - "Collecting keras-applications>=1.0.8\n", - " Downloading Keras_Applications-1.0.8-py3-none-any.whl (50 kB)\n", - "\u001b[K |████████████████████████████████| 50 kB 6.3 MB/s \n", - "\u001b[?25hRequirement already satisfied: opt-einsum>=2.3.2 in 
/usr/local/lib/python3.7/dist-packages (from tensorflow==1.15.5) (3.3.0)\n", - "Requirement already satisfied: h5py<=2.10.0 in /usr/local/lib/python3.7/dist-packages (from tensorflow==1.15.5) (2.10.0)\n", - "Requirement already satisfied: six>=1.10.0 in /usr/local/lib/python3.7/dist-packages (from tensorflow==1.15.5) (1.15.0)\n", - "Collecting tensorflow-estimator==1.15.1\n", - " Downloading tensorflow_estimator-1.15.1-py2.py3-none-any.whl (503 kB)\n", - "\u001b[K |████████████████████████████████| 503 kB 43.5 MB/s \n", - "\u001b[?25hCollecting tensorboard<1.16.0,>=1.15.0\n", - " Downloading tensorboard-1.15.0-py3-none-any.whl (3.8 MB)\n", - "\u001b[K |████████████████████████████████| 3.8 MB 40.9 MB/s \n", - "\u001b[?25hRequirement already satisfied: google-pasta>=0.1.6 in /usr/local/lib/python3.7/dist-packages (from tensorflow==1.15.5) (0.2.0)\n", - "Requirement already satisfied: grpcio>=1.8.6 in /usr/local/lib/python3.7/dist-packages (from tensorflow==1.15.5) (1.41.0)\n", - "Requirement already satisfied: wrapt>=1.11.1 in /usr/local/lib/python3.7/dist-packages (from tensorflow==1.15.5) (1.12.1)\n", - "Requirement already satisfied: termcolor>=1.1.0 in /usr/local/lib/python3.7/dist-packages (from tensorflow==1.15.5) (1.1.0)\n", - "Requirement already satisfied: keras-preprocessing>=1.0.5 in /usr/local/lib/python3.7/dist-packages (from tensorflow==1.15.5) (1.1.2)\n", - "Requirement already satisfied: astor>=0.6.0 in /usr/local/lib/python3.7/dist-packages (from tensorflow==1.15.5) (0.8.1)\n", - "Collecting gast==0.2.2\n", - " Downloading gast-0.2.2.tar.gz (10 kB)\n", - "Requirement already satisfied: numpy<1.19.0,>=1.16.0 in /usr/local/lib/python3.7/dist-packages (from tensorflow==1.15.5) (1.18.0)\n", - "Requirement already satisfied: markdown>=2.6.8 in /usr/local/lib/python3.7/dist-packages (from tensorboard<1.16.0,>=1.15.0->tensorflow==1.15.5) (3.3.4)\n", - "Requirement already satisfied: setuptools>=41.0.0 in /usr/local/lib/python3.7/dist-packages (from 
tensorboard<1.16.0,>=1.15.0->tensorflow==1.15.5) (57.4.0)\n", - "Requirement already satisfied: werkzeug>=0.11.15 in /usr/local/lib/python3.7/dist-packages (from tensorboard<1.16.0,>=1.15.0->tensorflow==1.15.5) (1.0.1)\n", - "Requirement already satisfied: importlib-metadata in /usr/local/lib/python3.7/dist-packages (from markdown>=2.6.8->tensorboard<1.16.0,>=1.15.0->tensorflow==1.15.5) (4.8.1)\n", - "Requirement already satisfied: zipp>=0.5 in /usr/local/lib/python3.7/dist-packages (from importlib-metadata->markdown>=2.6.8->tensorboard<1.16.0,>=1.15.0->tensorflow==1.15.5) (3.6.0)\n", - "Requirement already satisfied: typing-extensions>=3.6.4 in /usr/local/lib/python3.7/dist-packages (from importlib-metadata->markdown>=2.6.8->tensorboard<1.16.0,>=1.15.0->tensorflow==1.15.5) (3.7.4.3)\n", - "Building wheels for collected packages: gast\n", - " Building wheel for gast (setup.py) ... \u001b[?25l\u001b[?25hdone\n", - " Created wheel for gast: filename=gast-0.2.2-py3-none-any.whl size=7554 sha256=06dac371e24c972318370b7d71a23cf99c25c4525fe1be144e4984a9d32082d6\n", - " Stored in directory: /root/.cache/pip/wheels/21/7f/02/420f32a803f7d0967b48dd823da3f558c5166991bfd204eef3\n", - "Successfully built gast\n", - "Installing collected packages: tensorflow-estimator, tensorboard, keras-applications, gast, tensorflow\n", - " Attempting uninstall: tensorflow-estimator\n", - " Found existing installation: tensorflow-estimator 2.6.0\n", - " Uninstalling tensorflow-estimator-2.6.0:\n", - " Successfully uninstalled tensorflow-estimator-2.6.0\n", - " Attempting uninstall: tensorboard\n", - " Found existing installation: tensorboard 2.6.0\n", - " Uninstalling tensorboard-2.6.0:\n", - " Successfully uninstalled tensorboard-2.6.0\n", - " Attempting uninstall: gast\n", - " Found existing installation: gast 0.4.0\n", - " Uninstalling gast-0.4.0:\n", - " Successfully uninstalled gast-0.4.0\n", - "\u001b[31mERROR: pip's dependency resolver does not currently take into account all the 
packages that are installed. This behaviour is the source of the following dependency conflicts.\n", - "tensorflow-probability 0.14.1 requires gast>=0.3.2, but you have gast 0.2.2 which is incompatible.\n", - "kapre 0.3.5 requires numpy>=1.18.5, but you have numpy 1.18.0 which is incompatible.\n", - "kapre 0.3.5 requires tensorflow>=2.0.0, but you have tensorflow 1.15.5 which is incompatible.\u001b[0m\n", - "Successfully installed gast-0.2.2 keras-applications-1.0.8 tensorboard-1.15.0 tensorflow-1.15.5 tensorflow-estimator-1.15.1\n" - ] - } - ] - }, { "cell_type": "code", "metadata": { - "id": "r9oKlEV07rRM", - "outputId": "ef207053-3ed9-4e8a-9bbf-3f6d52168206", - "colab": { - "base_uri": "https://localhost:8080/" - } + "id": "-5uC3kgC7rRK" }, "source": [ - "!pip install numpy scipy librosa unidecode inflect librosa transformers\n", - "!pip install deeppavlov" + "!pip install -U transformers deeppavlov unidecode omegaconf\n", + "!python -m deeppavlov install squad_ru_rubert\n", + "\n", + "# Pre-downloading the BERT for Russian language. 
Same result can be achieved with\n", + "# `!python -m deeppavlov download squad_ru_rubert`\n", + "# But it works significantly slower.\n", + "!wget -nc https://www.dropbox.com/s/7za1o6vaffbdlcg/rubert_cased_L-12_H-768_A-12_v1.tar.gz\n", + "!mkdir -p /root/.deeppavlov/downloads/bert_models/\n", + "!tar -xzvf rubert_cased_L-12_H-768_A-12_v1.tar.gz -C /root/.deeppavlov/downloads/bert_models\n", + "\n", + "!wget -nc https://www.dropbox.com/s/ns8280pd9t9n9dc/squad_model_ru_rubert.tar.gz\n", + "!mkdir -p /root/.deeppavlov/models/\n", + "!tar -xzvf squad_model_ru_rubert.tar.gz -C /root/.deeppavlov/models" ], - "execution_count": 3, - "outputs": [ - { - "output_type": "stream", - "name": "stdout", - "text": [ - "Requirement already satisfied: numpy in /usr/local/lib/python3.7/dist-packages (1.18.0)\n", - "Requirement already satisfied: scipy in /usr/local/lib/python3.7/dist-packages (1.4.1)\n", - "Requirement already satisfied: librosa in /usr/local/lib/python3.7/dist-packages (0.8.1)\n", - "Requirement already satisfied: unidecode in /usr/local/lib/python3.7/dist-packages (1.3.2)\n", - "Requirement already satisfied: inflect in /usr/local/lib/python3.7/dist-packages (2.1.0)\n", - "Requirement already satisfied: transformers in /usr/local/lib/python3.7/dist-packages (4.11.3)\n", - "Requirement already satisfied: resampy>=0.2.2 in /usr/local/lib/python3.7/dist-packages (from librosa) (0.2.2)\n", - "Requirement already satisfied: numba>=0.43.0 in /usr/local/lib/python3.7/dist-packages (from librosa) (0.51.2)\n", - "Requirement already satisfied: joblib>=0.14 in /usr/local/lib/python3.7/dist-packages (from librosa) (1.0.1)\n", - "Requirement already satisfied: scikit-learn!=0.19.0,>=0.14.0 in /usr/local/lib/python3.7/dist-packages (from librosa) (0.21.2)\n", - "Requirement already satisfied: audioread>=2.0.0 in /usr/local/lib/python3.7/dist-packages (from librosa) (2.1.9)\n", - "Requirement already satisfied: soundfile>=0.10.2 in /usr/local/lib/python3.7/dist-packages (from 
librosa) (0.10.3.post1)\n", - "Requirement already satisfied: pooch>=1.0 in /usr/local/lib/python3.7/dist-packages (from librosa) (1.5.1)\n", - "Requirement already satisfied: packaging>=20.0 in /usr/local/lib/python3.7/dist-packages (from librosa) (21.0)\n", - "Requirement already satisfied: decorator>=3.0.0 in /usr/local/lib/python3.7/dist-packages (from librosa) (4.4.2)\n", - "Requirement already satisfied: setuptools in /usr/local/lib/python3.7/dist-packages (from numba>=0.43.0->librosa) (57.4.0)\n", - "Requirement already satisfied: llvmlite<0.35,>=0.34.0.dev0 in /usr/local/lib/python3.7/dist-packages (from numba>=0.43.0->librosa) (0.34.0)\n", - "Requirement already satisfied: pyparsing>=2.0.2 in /usr/local/lib/python3.7/dist-packages (from packaging>=20.0->librosa) (2.4.7)\n", - "Requirement already satisfied: requests in /usr/local/lib/python3.7/dist-packages (from pooch>=1.0->librosa) (2.22.0)\n", - "Requirement already satisfied: appdirs in /usr/local/lib/python3.7/dist-packages (from pooch>=1.0->librosa) (1.4.4)\n", - "Requirement already satisfied: six>=1.3 in /usr/local/lib/python3.7/dist-packages (from resampy>=0.2.2->librosa) (1.15.0)\n", - "Requirement already satisfied: cffi>=1.0 in /usr/local/lib/python3.7/dist-packages (from soundfile>=0.10.2->librosa) (1.14.6)\n", - "Requirement already satisfied: pycparser in /usr/local/lib/python3.7/dist-packages (from cffi>=1.0->soundfile>=0.10.2->librosa) (2.20)\n", - "Requirement already satisfied: regex!=2019.12.17 in /usr/local/lib/python3.7/dist-packages (from transformers) (2019.12.20)\n", - "Requirement already satisfied: tqdm>=4.27 in /usr/local/lib/python3.7/dist-packages (from transformers) (4.62.0)\n", - "Requirement already satisfied: importlib-metadata in /usr/local/lib/python3.7/dist-packages (from transformers) (4.8.1)\n", - "Requirement already satisfied: pyyaml>=5.1 in /usr/local/lib/python3.7/dist-packages (from transformers) (6.0)\n", - "Requirement already satisfied: 
tokenizers<0.11,>=0.10.1 in /usr/local/lib/python3.7/dist-packages (from transformers) (0.10.3)\n", - "Requirement already satisfied: huggingface-hub>=0.0.17 in /usr/local/lib/python3.7/dist-packages (from transformers) (0.0.19)\n", - "Requirement already satisfied: filelock in /usr/local/lib/python3.7/dist-packages (from transformers) (3.0.12)\n", - "Requirement already satisfied: sacremoses in /usr/local/lib/python3.7/dist-packages (from transformers) (0.0.35)\n", - "Requirement already satisfied: typing-extensions in /usr/local/lib/python3.7/dist-packages (from huggingface-hub>=0.0.17->transformers) (3.7.4.3)\n", - "Requirement already satisfied: zipp>=0.5 in /usr/local/lib/python3.7/dist-packages (from importlib-metadata->transformers) (3.6.0)\n", - "Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.7/dist-packages (from requests->pooch>=1.0->librosa) (2021.5.30)\n", - "Requirement already satisfied: idna<2.9,>=2.5 in /usr/local/lib/python3.7/dist-packages (from requests->pooch>=1.0->librosa) (2.8)\n", - "Requirement already satisfied: chardet<3.1.0,>=3.0.2 in /usr/local/lib/python3.7/dist-packages (from requests->pooch>=1.0->librosa) (3.0.4)\n", - "Requirement already satisfied: urllib3!=1.25.0,!=1.25.1,<1.26,>=1.21.1 in /usr/local/lib/python3.7/dist-packages (from requests->pooch>=1.0->librosa) (1.24.3)\n", - "Requirement already satisfied: click in /usr/local/lib/python3.7/dist-packages (from sacremoses->transformers) (7.1.2)\n", - "Requirement already satisfied: deeppavlov in /usr/local/lib/python3.7/dist-packages (0.17.1)\n", - "Requirement already satisfied: prometheus-client==0.7.1 in /usr/local/lib/python3.7/dist-packages (from deeppavlov) (0.7.1)\n", - "Requirement already satisfied: pytz==2019.1 in /usr/local/lib/python3.7/dist-packages (from deeppavlov) (2019.1)\n", - "Requirement already satisfied: uvloop==0.14.0 in /usr/local/lib/python3.7/dist-packages (from deeppavlov) (0.14.0)\n", - "Requirement already satisfied: 
pyopenssl==19.1.0 in /usr/local/lib/python3.7/dist-packages (from deeppavlov) (19.1.0)\n", - "Requirement already satisfied: fastapi==0.47.1 in /usr/local/lib/python3.7/dist-packages (from deeppavlov) (0.47.1)\n", - "Requirement already satisfied: h5py==2.10.0 in /usr/local/lib/python3.7/dist-packages (from deeppavlov) (2.10.0)\n", - "Requirement already satisfied: click==7.1.2 in /usr/local/lib/python3.7/dist-packages (from deeppavlov) (7.1.2)\n", - "Requirement already satisfied: pymorphy2==0.8 in /usr/local/lib/python3.7/dist-packages (from deeppavlov) (0.8)\n", - "Requirement already satisfied: tqdm==4.62.0 in /usr/local/lib/python3.7/dist-packages (from deeppavlov) (4.62.0)\n", - "Requirement already satisfied: ruamel.yaml==0.15.100 in /usr/local/lib/python3.7/dist-packages (from deeppavlov) (0.15.100)\n", - "Requirement already satisfied: numpy==1.18.0 in /usr/local/lib/python3.7/dist-packages (from deeppavlov) (1.18.0)\n", - "Requirement already satisfied: aio-pika==6.4.1 in /usr/local/lib/python3.7/dist-packages (from deeppavlov) (6.4.1)\n", - "Requirement already satisfied: pytelegrambotapi==3.6.7 in /usr/local/lib/python3.7/dist-packages (from deeppavlov) (3.6.7)\n", - "Requirement already satisfied: filelock==3.0.12 in /usr/local/lib/python3.7/dist-packages (from deeppavlov) (3.0.12)\n", - "Requirement already satisfied: uvicorn==0.11.7 in /usr/local/lib/python3.7/dist-packages (from deeppavlov) (0.11.7)\n", - "Requirement already satisfied: sacremoses==0.0.35 in /usr/local/lib/python3.7/dist-packages (from deeppavlov) (0.0.35)\n", - "Requirement already satisfied: scikit-learn==0.21.2 in /usr/local/lib/python3.7/dist-packages (from deeppavlov) (0.21.2)\n", - "Requirement already satisfied: requests==2.22.0 in /usr/local/lib/python3.7/dist-packages (from deeppavlov) (2.22.0)\n", - "Requirement already satisfied: rusenttokenize==0.0.5 in /usr/local/lib/python3.7/dist-packages (from deeppavlov) (0.0.5)\n", - "Requirement already satisfied: nltk==3.4.5 in 
/usr/local/lib/python3.7/dist-packages (from deeppavlov) (3.4.5)\n", - "Requirement already satisfied: Cython==0.29.14 in /usr/local/lib/python3.7/dist-packages (from deeppavlov) (0.29.14)\n", - "Requirement already satisfied: overrides==2.7.0 in /usr/local/lib/python3.7/dist-packages (from deeppavlov) (2.7.0)\n", - "Requirement already satisfied: pandas==0.25.3 in /usr/local/lib/python3.7/dist-packages (from deeppavlov) (0.25.3)\n", - "Requirement already satisfied: scipy==1.4.1 in /usr/local/lib/python3.7/dist-packages (from deeppavlov) (1.4.1)\n", - "Requirement already satisfied: pydantic==1.3 in /usr/local/lib/python3.7/dist-packages (from deeppavlov) (1.3)\n", - "Requirement already satisfied: pymorphy2-dicts-ru in /usr/local/lib/python3.7/dist-packages (from deeppavlov) (2.4.417127.4579844)\n", - "Requirement already satisfied: aiormq<4,>=3.2.0 in /usr/local/lib/python3.7/dist-packages (from aio-pika==6.4.1->deeppavlov) (3.3.1)\n", - "Requirement already satisfied: yarl in /usr/local/lib/python3.7/dist-packages (from aio-pika==6.4.1->deeppavlov) (1.7.0)\n", - "Requirement already satisfied: starlette<=0.12.9,>=0.12.9 in /usr/local/lib/python3.7/dist-packages (from fastapi==0.47.1->deeppavlov) (0.12.9)\n", - "Requirement already satisfied: six in /usr/local/lib/python3.7/dist-packages (from h5py==2.10.0->deeppavlov) (1.15.0)\n", - "Requirement already satisfied: python-dateutil>=2.6.1 in /usr/local/lib/python3.7/dist-packages (from pandas==0.25.3->deeppavlov) (2.8.2)\n", - "Requirement already satisfied: docopt>=0.6 in /usr/local/lib/python3.7/dist-packages (from pymorphy2==0.8->deeppavlov) (0.6.2)\n", - "Requirement already satisfied: dawg-python>=0.7 in /usr/local/lib/python3.7/dist-packages (from pymorphy2==0.8->deeppavlov) (0.7.2)\n", - "Requirement already satisfied: pymorphy2-dicts<3.0,>=2.4 in /usr/local/lib/python3.7/dist-packages (from pymorphy2==0.8->deeppavlov) (2.4.393442.3710985)\n", - "Requirement already satisfied: cryptography>=2.8 in 
/usr/local/lib/python3.7/dist-packages (from pyopenssl==19.1.0->deeppavlov) (35.0.0)\n", - "Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.7/dist-packages (from requests==2.22.0->deeppavlov) (2021.5.30)\n", - "Requirement already satisfied: idna<2.9,>=2.5 in /usr/local/lib/python3.7/dist-packages (from requests==2.22.0->deeppavlov) (2.8)\n", - "Requirement already satisfied: chardet<3.1.0,>=3.0.2 in /usr/local/lib/python3.7/dist-packages (from requests==2.22.0->deeppavlov) (3.0.4)\n", - "Requirement already satisfied: urllib3!=1.25.0,!=1.25.1,<1.26,>=1.21.1 in /usr/local/lib/python3.7/dist-packages (from requests==2.22.0->deeppavlov) (1.24.3)\n", - "Requirement already satisfied: joblib in /usr/local/lib/python3.7/dist-packages (from sacremoses==0.0.35->deeppavlov) (1.0.1)\n", - "Requirement already satisfied: h11<0.10,>=0.8 in /usr/local/lib/python3.7/dist-packages (from uvicorn==0.11.7->deeppavlov) (0.9.0)\n", - "Requirement already satisfied: httptools==0.1.* in /usr/local/lib/python3.7/dist-packages (from uvicorn==0.11.7->deeppavlov) (0.1.2)\n", - "Requirement already satisfied: websockets==8.* in /usr/local/lib/python3.7/dist-packages (from uvicorn==0.11.7->deeppavlov) (8.1)\n", - "Requirement already satisfied: pamqp==2.3.0 in /usr/local/lib/python3.7/dist-packages (from aiormq<4,>=3.2.0->aio-pika==6.4.1->deeppavlov) (2.3.0)\n", - "Requirement already satisfied: cffi>=1.12 in /usr/local/lib/python3.7/dist-packages (from cryptography>=2.8->pyopenssl==19.1.0->deeppavlov) (1.14.6)\n", - "Requirement already satisfied: pycparser in /usr/local/lib/python3.7/dist-packages (from cffi>=1.12->cryptography>=2.8->pyopenssl==19.1.0->deeppavlov) (2.20)\n", - "Requirement already satisfied: multidict>=4.0 in /usr/local/lib/python3.7/dist-packages (from yarl->aio-pika==6.4.1->deeppavlov) (5.2.0)\n", - "Requirement already satisfied: typing-extensions>=3.7.4 in /usr/local/lib/python3.7/dist-packages (from yarl->aio-pika==6.4.1->deeppavlov) 
(3.7.4.3)\n" - ] - } - ] + "execution_count": null, + "outputs": [] }, { "cell_type": "code", "metadata": { - "id": "OfzJwB_17rRM", - "outputId": "7343c565-8604-49db-eef6-1b41d0a2df59", - "colab": { - "base_uri": "https://localhost:8080/" - } + "id": "OfzJwB_17rRM" }, "source": [ "import torch\n", - "if torch.cuda.is_available():\n", - " device = torch.device('cuda:0')\n", - " tacotron2 = torch.hub.load('nvidia/DeepLearningExamples:torchhub', 'nvidia_tacotron2', **{'map_location': device})\n", - "else:\n", - " device = torch.device('cpu')\n", - " tacotron2 = None\n", - " print('Unfortunately, Tacotron2 by NVIDIA infers only on GPU, so the Part 4 will not work on CPU-only machine.')" - ], - "execution_count": 4, - "outputs": [ - { - "output_type": "stream", - "name": "stderr", - "text": [ - "Downloading: \"https://github.com/nvidia/DeepLearningExamples/archive/torchhub.zip\" to /root/.cache/torch/hub/torchhub.zip\n", - "Downloading checkpoint from https://api.ngc.nvidia.com/v2/models/nvidia/tacotron2_pyt_ckpt_fp32/versions/19.09.0/files/nvidia_tacotron2pyt_fp32_20190427\n" - ] - } - ] - }, - { - "cell_type": "code", - "metadata": { - "id": "0Eo7EPQT7rRN", - "outputId": "ca159a7d-bdb3-4098-8847-3b281765dcd7", - "colab": { - "base_uri": "https://localhost:8080/" - } - }, - "source": [ - "# Pre-downloading the BERT for Russian language\n", "\n", - "!wget https://www.dropbox.com/s/7za1o6vaffbdlcg/rubert_cased_L-12_H-768_A-12_v1.tar.gz -nc\n", - "!wget https://www.dropbox.com/s/ns8280pd9t9n9dc/squad_model_ru_rubert.tar.gz -nc\n", + "assert torch.cuda.is_available(), 'Tacotron2 by NVIDIA infers only on GPU, so the Part 4 will not work on CPU-only machine'\n", "\n", - "!mkdir -p /root/.deeppavlov/downloads/bert_models/\n", - "!mkdir -p /root/.deeppavlov/models/\n", + "device = torch.device('cuda:0')\n", + "tacotron2 = torch.hub.load('nvidia/DeepLearningExamples:torchhub', 'nvidia_tacotron2', **{'map_location': device})\n", + "tacotron2.to(device)\n", + 
"tacotron2.eval()\n", "\n", - "!tar -xzvf rubert_cased_L-12_H-768_A-12_v1.tar.gz -C /root/.deeppavlov/downloads/bert_models\n", - "!tar -xzvf squad_model_ru_rubert.tar.gz -C /root/.deeppavlov/models" + "waveglow = torch.hub.load('nvidia/DeepLearningExamples:torchhub', 'nvidia_waveglow')\n", + "waveglow = waveglow.remove_weightnorm(waveglow)\n", + "waveglow.to(device)\n", + "waveglow.eval();" ], - "execution_count": 5, - "outputs": [ - { - "output_type": "stream", - "name": "stdout", - "text": [ - "--2021-10-14 22:35:20-- https://www.dropbox.com/s/7za1o6vaffbdlcg/rubert_cased_L-12_H-768_A-12_v1.tar.gz\n", - "Resolving www.dropbox.com (www.dropbox.com)... 162.125.66.18, 2620:100:6020:18::a27d:4012\n", - "Connecting to www.dropbox.com (www.dropbox.com)|162.125.66.18|:443... connected.\n", - "HTTP request sent, awaiting response... 301 Moved Permanently\n", - "Location: /s/raw/7za1o6vaffbdlcg/rubert_cased_L-12_H-768_A-12_v1.tar.gz [following]\n", - "--2021-10-14 22:35:20-- https://www.dropbox.com/s/raw/7za1o6vaffbdlcg/rubert_cased_L-12_H-768_A-12_v1.tar.gz\n", - "Reusing existing connection to www.dropbox.com:443.\n", - "HTTP request sent, awaiting response... 302 Found\n", - "Location: https://uc713e477e604b7cf18cb46ad6ba.dl.dropboxusercontent.com/cd/0/inline/BYDBS5Bfh4mRY4PPZxgT35OmzVNMdPk-EqUTu6qrFFi219ERjwKRH379E_BmXwhfICcOEWhmufZsuoXrXJosp1YhtxyrKaopgNjFzsbeQB-9NeqSGmIePE2PeB033CLbrj-P9nGFedoJO34VHc5izRGS/file# [following]\n", - "--2021-10-14 22:35:20-- https://uc713e477e604b7cf18cb46ad6ba.dl.dropboxusercontent.com/cd/0/inline/BYDBS5Bfh4mRY4PPZxgT35OmzVNMdPk-EqUTu6qrFFi219ERjwKRH379E_BmXwhfICcOEWhmufZsuoXrXJosp1YhtxyrKaopgNjFzsbeQB-9NeqSGmIePE2PeB033CLbrj-P9nGFedoJO34VHc5izRGS/file\n", - "Resolving uc713e477e604b7cf18cb46ad6ba.dl.dropboxusercontent.com (uc713e477e604b7cf18cb46ad6ba.dl.dropboxusercontent.com)... 
162.125.66.15, 2620:100:6020:15::a27d:400f\n", - "Connecting to uc713e477e604b7cf18cb46ad6ba.dl.dropboxusercontent.com (uc713e477e604b7cf18cb46ad6ba.dl.dropboxusercontent.com)|162.125.66.15|:443... connected.\n", - "HTTP request sent, awaiting response... 302 Found\n", - "Location: /cd/0/inline2/BYALptvPCHi9Y0VW6CALJI_Y0Pnt0wGtPLScpY3YbfGQtrv0lD7gfiE324E68ajiM8mRtxo9zTBK8w2-a7Rj7mGJP1eggnd7a1ss2qTsnSs5XkIhVW4qec9Ho7JYC28HwLv7KYK_8rl-yeSm89wdCRQrgIRxv3WEGEvAVJAsiow6qOf7JGwGP0m6xhTMHbU4N-2_8D8lse78RFK16wpJAcqGtYYuOXdPxnC_YJzh9nZMIfY2W8rCYu4afR1Lqb9FgxQmAL17gpri5H612BLXlLn2v9Owt-kAkFsZv5LM22lfEXJyhSvCfthjhapc9FTrFUIq9NowQSQv_2mJu0oCLxo9XoyMLoOs2cXip9vKsHm71MkfLgEwiTZDpP-Umtll18w/file [following]\n", - "--2021-10-14 22:35:21-- https://uc713e477e604b7cf18cb46ad6ba.dl.dropboxusercontent.com/cd/0/inline2/BYALptvPCHi9Y0VW6CALJI_Y0Pnt0wGtPLScpY3YbfGQtrv0lD7gfiE324E68ajiM8mRtxo9zTBK8w2-a7Rj7mGJP1eggnd7a1ss2qTsnSs5XkIhVW4qec9Ho7JYC28HwLv7KYK_8rl-yeSm89wdCRQrgIRxv3WEGEvAVJAsiow6qOf7JGwGP0m6xhTMHbU4N-2_8D8lse78RFK16wpJAcqGtYYuOXdPxnC_YJzh9nZMIfY2W8rCYu4afR1Lqb9FgxQmAL17gpri5H612BLXlLn2v9Owt-kAkFsZv5LM22lfEXJyhSvCfthjhapc9FTrFUIq9NowQSQv_2mJu0oCLxo9XoyMLoOs2cXip9vKsHm71MkfLgEwiTZDpP-Umtll18w/file\n", - "Reusing existing connection to uc713e477e604b7cf18cb46ad6ba.dl.dropboxusercontent.com:443.\n", - "HTTP request sent, awaiting response... 200 OK\n", - "Length: 666147468 (635M) [application/octet-stream]\n", - "Saving to: ‘rubert_cased_L-12_H-768_A-12_v1.tar.gz’\n", - "\n", - "rubert_cased_L-12_H 100%[===================>] 635.29M 25.2MB/s in 29s \n", - "\n", - "2021-10-14 22:35:50 (21.8 MB/s) - ‘rubert_cased_L-12_H-768_A-12_v1.tar.gz’ saved [666147468/666147468]\n", - "\n", - "--2021-10-14 22:35:51-- https://www.dropbox.com/s/ns8280pd9t9n9dc/squad_model_ru_rubert.tar.gz\n", - "Resolving www.dropbox.com (www.dropbox.com)... 162.125.67.18, 2620:100:6020:18::a27d:4012\n", - "Connecting to www.dropbox.com (www.dropbox.com)|162.125.67.18|:443... 
connected.\n", - "HTTP request sent, awaiting response... 301 Moved Permanently\n", - "Location: /s/raw/ns8280pd9t9n9dc/squad_model_ru_rubert.tar.gz [following]\n", - "--2021-10-14 22:35:51-- https://www.dropbox.com/s/raw/ns8280pd9t9n9dc/squad_model_ru_rubert.tar.gz\n", - "Reusing existing connection to www.dropbox.com:443.\n", - "HTTP request sent, awaiting response... 302 Found\n", - "Location: https://ucde331d1be59b6d375177d093b7.dl.dropboxusercontent.com/cd/0/inline/BYCOSap_BO6iW_IFwYyrbCxuFhsRMyFCU0YYh3kmx-mle3_0LAgKEBXhMWjU-9_RS56XN6gFI1QuFtr04cd8RyDm0P8KIygxe7IB5wGsUVI6pzEJO79xWB3rYAbpdh23Mes9gQiT84_CDA2iFLUqiiO0/file# [following]\n", - "--2021-10-14 22:35:51-- https://ucde331d1be59b6d375177d093b7.dl.dropboxusercontent.com/cd/0/inline/BYCOSap_BO6iW_IFwYyrbCxuFhsRMyFCU0YYh3kmx-mle3_0LAgKEBXhMWjU-9_RS56XN6gFI1QuFtr04cd8RyDm0P8KIygxe7IB5wGsUVI6pzEJO79xWB3rYAbpdh23Mes9gQiT84_CDA2iFLUqiiO0/file\n", - "Resolving ucde331d1be59b6d375177d093b7.dl.dropboxusercontent.com (ucde331d1be59b6d375177d093b7.dl.dropboxusercontent.com)... 162.125.66.15, 2620:100:6020:15::a27d:400f\n", - "Connecting to ucde331d1be59b6d375177d093b7.dl.dropboxusercontent.com (ucde331d1be59b6d375177d093b7.dl.dropboxusercontent.com)|162.125.66.15|:443... connected.\n", - "HTTP request sent, awaiting response... 
302 Found\n", - "Location: /cd/0/inline2/BYB1fbIxGEWEFAsDaD4e8r8B7_zt8i8urfo3_uGN-dHV3CkX1WsqBMwoKCCVospxbzhRnOpPbEPrQNXYa1OrIWpv0KzlvQRR7zSW6V0ts8vXragHK1Bqaq0xpvqI8uiFZFAovwP1FojsGxZjl9dcL7A2v6CEqkbLFKA6UDHEEbQoc4OM5z3XnrqEfg1YdUIdDcLelkRyy7BaID4v2Vu9gFwr5dla7lNNVRU0uMbuaXzkiLGreV5Va0j6lZ-eKUtBcVk5OoLVGEAEG9OzlrjlJF2U9dTviCDlVNA77fQxdrq-haksglPaPMMj9eMXZdBVoZBd1nIKGYkirQgzf2VezY6iVkodb9Jrr3mg-9y5GR2eZW1P7U8aeFfyd6AzWkQBFmw/file [following]\n", - "--2021-10-14 22:35:52-- https://ucde331d1be59b6d375177d093b7.dl.dropboxusercontent.com/cd/0/inline2/BYB1fbIxGEWEFAsDaD4e8r8B7_zt8i8urfo3_uGN-dHV3CkX1WsqBMwoKCCVospxbzhRnOpPbEPrQNXYa1OrIWpv0KzlvQRR7zSW6V0ts8vXragHK1Bqaq0xpvqI8uiFZFAovwP1FojsGxZjl9dcL7A2v6CEqkbLFKA6UDHEEbQoc4OM5z3XnrqEfg1YdUIdDcLelkRyy7BaID4v2Vu9gFwr5dla7lNNVRU0uMbuaXzkiLGreV5Va0j6lZ-eKUtBcVk5OoLVGEAEG9OzlrjlJF2U9dTviCDlVNA77fQxdrq-haksglPaPMMj9eMXZdBVoZBd1nIKGYkirQgzf2VezY6iVkodb9Jrr3mg-9y5GR2eZW1P7U8aeFfyd6AzWkQBFmw/file\n", - "Reusing existing connection to ucde331d1be59b6d375177d093b7.dl.dropboxusercontent.com:443.\n", - "HTTP request sent, awaiting response... 
200 OK\n", - "Length: 659197396 (629M) [application/octet-stream]\n", - "Saving to: ‘squad_model_ru_rubert.tar.gz’\n", - "\n", - "squad_model_ru_rube 100%[===================>] 628.66M 15.4MB/s in 39s \n", - "\n", - "2021-10-14 22:36:32 (16.0 MB/s) - ‘squad_model_ru_rubert.tar.gz’ saved [659197396/659197396]\n", - "\n", - "rubert_cased_L-12_H-768_A-12_v1/\n", - "rubert_cased_L-12_H-768_A-12_v1/bert_config.json\n", - "rubert_cased_L-12_H-768_A-12_v1/vocab.txt\n", - "rubert_cased_L-12_H-768_A-12_v1/bert_model.ckpt.data-00000-of-00001\n", - "rubert_cased_L-12_H-768_A-12_v1/bert_model.ckpt.index\n", - "rubert_cased_L-12_H-768_A-12_v1/bert_model.ckpt.meta\n", - "squad_ru_bert/\n", - "squad_ru_bert/model_rubert.data-00000-of-00001\n", - "squad_ru_bert/model_rubert.index\n", - "squad_ru_bert/model_rubert.meta\n" - ] - } - ] + "execution_count": null, + "outputs": [] }, { "cell_type": "markdown", @@ -1042,7 +113,7 @@ "id": "X2bUvKUffHNY" }, "source": [ - "## Part 1: How BERT is applied to Question Answering" + "## Part 1: Applying BERT to Question Answering" ] }, { @@ -1062,7 +133,7 @@ "source": [ "When someone mentions \"Question Answering\" as an application of BERT, what they are really referring to is applying BERT to the Stanford Question Answering Dataset (SQuAD).\n", "\n", - "The task posed by the SQuAD benchmark is a little different than you might think. Given a question, and *a passage of text containing the answer*, BERT needs to highlight the \"span\" of text corresponding to the correct answer. \n", + "The task posed by the SQuAD benchmark is a little different than you might think. Given a question, and *a passage of text containing the answer* (often referred to as context), BERT needs to highlight the \"span\" of text corresponding to the correct answer. 
\n", "\n", "The SQuAD homepage has a fantastic tool for exploring the questions and reference text for this dataset, and even shows the predictions made by top-performing models.\n", "\n", @@ -1091,7 +162,7 @@ "\n", "The two pieces of text are separated by the special `[SEP]` token. \n", "\n", - "BERT also uses \"Segment Embeddings\" to differentiate the question from the reference text. These are simply two embeddings (for segments \"A\" and \"B\") that BERT learned, and which it adds to the token embeddings before feeding them into the input layer. " + "> _Side note:_ Original BERT also uses \"Segment Embeddings\" to differentiate the question from the reference text. These are simply two embeddings (for segments \"A\" and \"B\") that BERT learned, and which it adds to the token embeddings before feeding them into the input layer. However, today we will be using the DistilBERT model, which relies solely on the special tokens." ] }, { @@ -1141,9 +212,7 @@ "source": [ "In the example code below, we'll be downloading a model that's *already been fine-tuned* for question answering, and try it out on our own text.\n", "\n", - "If you do want to fine-tune on your own dataset, it is possible to fine-tune BERT for question answering yourself. See [run_squad.py](https://github.com/huggingface/transformers/blob/master/examples/run_squad.py) in the `transformers` library. However,you may find that the below \"fine-tuned-on-squad\" model already does a good job, even if your text is from a different domain. \n", - "\n", - "> Note: The example code in this Notebook is a commented and expanded version of the short example provided in the `transformers` documentation [here](https://huggingface.co/transformers/model_doc/bert.html?highlight=bertforquestionanswering#transformers.BertForQuestionAnswering)." + "If you do want to fine-tune on your own dataset, it is possible to fine-tune BERT for question answering yourself. 
See [run_squad.py](https://github.com/huggingface/transformers/blob/master/examples/run_squad.py) in the `transformers` library. However, you may find that the \"fine-tuned-on-squad\" model already does a good job, even if your text is from a different domain." ] }, { @@ -1152,7 +221,7 @@ "id": "gVq-TuylYRDW" }, "source": [ - "### 1. huggingface transformers library" + "### 1. Load Fine-Tuned BERT" ] }, { @@ -1161,75 +230,28 @@ "id": "f9nhy3PzGQ44" }, "source": [ - "This example uses the `transformers` [library](https://github.com/huggingface/transformers/) by huggingface. We've already installed it in the top of this notebook." - ] - }, - { - "cell_type": "code", - "metadata": { - "id": "-ONLrgJK99TQ" - }, - "source": [ - "import torch" - ], - "execution_count": 6, - "outputs": [] - }, - { - "cell_type": "markdown", - "metadata": { - "id": "1WThOUtpYvG-" - }, - "source": [ - "### 2. Load Fine-Tuned BERT-large" - ] - }, - { - "cell_type": "markdown", - "metadata": { - "id": "AaweLnNXGhTY" - }, - "source": [ - "For Question Answering we use the `BertForQuestionAnswering` class from the `transformers` library.\n", - "\n", - "This class supports fine-tuning, but for this example we will keep things simpler and load a BERT model that has already been fine-tuned for the SQuAD benchmark.\n", - "\n", - "The `transformers` library has a large collection of pre-trained models which you can reference by name and load easily. The full list is in their documentation [here](https://huggingface.co/transformers/pretrained_models.html).\n", - "\n", - "For Question Answering, they have a version of BERT-large that has already been fine-tuned for the SQuAD benchmark. \n", + "This example uses the `transformers` [library](https://github.com/huggingface/transformers/) by huggingface. We've already installed it in the top of this notebook.\n", "\n", - "BERT-large is really big... it has 24-layers and an embedding size of 1,024, for a total of 340M parameters! 
Altogether it is 1.34GB, so expect it to take a couple minutes to download to your Colab instance. \n", + "For Question Answering we use the `DistilBertForQuestionAnswering` class from the `transformers` library.\n", "\n", - "(Note that this download is not using your own network bandwidth--it's between the Google instance and wherever the model is stored on the web).\n", + "This class supports fine-tuning, but for this example we will keep things simpler and load a DistilBERT model that has already been fine-tuned for the SQuAD benchmark.\n", "\n", - "Note: I believe this model was trained on version 1 of SQuAD, since it's not outputting whether the question is \"impossible\" to answer from the text (which is part of the task in v2 of SQuAD).\n" + "The `transformers` library has a large collection of pre-trained models which you can reference by name and load easily. The full list is in their documentation [here](https://huggingface.co/transformers/pretrained_models.html)." ] }, { "cell_type": "code", "metadata": { - "colab": { - "base_uri": "https://localhost:8080/" - }, - "id": "apS1yS6CdRyX", - "outputId": "bbf150db-579b-4094-c705-6624de9935a7" + "id": "apS1yS6CdRyX" }, "source": [ - "from transformers import DistilBertForQuestionAnswering\n", + "from transformers import DistilBertTokenizer, DistilBertForQuestionAnswering\n", "\n", - "model = DistilBertForQuestionAnswering.from_pretrained('distilbert-base-uncased-distilled-squad')\n" + "tokenizer = DistilBertTokenizer.from_pretrained('distilbert-base-uncased-distilled-squad')\n", + "model = DistilBertForQuestionAnswering.from_pretrained('distilbert-base-uncased-distilled-squad')" ], - "execution_count": 72, - "outputs": [ - { - "output_type": "stream", - "name": "stderr", - "text": [ - "/usr/local/lib/python3.7/dist-packages/cryptography/hazmat/backends/openssl/x509.py:18: CryptographyDeprecationWarning: This version of cryptography contains a temporary pyOpenSSL fallback path. 
Upgrade pyOpenSSL now.\n", - " utils.DeprecatedIn35,\n" - ] - } - ] + "execution_count": null, + "outputs": [] }, { "cell_type": "markdown", @@ -1237,35 +259,7 @@ "id": "8imoOxoqGZ0h" }, "source": [ - "Load the tokenizer as well. \n", - "\n", - "Side note: Apparently the vocabulary of this model is identicaly to the one in bert-base-uncased. You can load the tokenizer from `bert-base-uncased` and that works just as well." - ] - }, - { - "cell_type": "code", - "metadata": { - "colab": { - "base_uri": "https://localhost:8080/" - }, - "id": "bv60qO4teAUL", - "outputId": "63160a72-6b5c-42f2-e047-35dd017475f2" - }, - "source": [ - "from transformers import DistilBertTokenizer\n", - "\n", - "tokenizer = DistilBertTokenizer.from_pretrained('distilbert-base-uncased-distilled-squad')" - ], - "execution_count": 73, - "outputs": [ - { - "output_type": "stream", - "name": "stderr", - "text": [ - "/usr/local/lib/python3.7/dist-packages/cryptography/hazmat/backends/openssl/x509.py:18: CryptographyDeprecationWarning: This version of cryptography contains a temporary pyOpenSSL fallback path. Upgrade pyOpenSSL now.\n", - " utils.DeprecatedIn35,\n" - ] - } + "> _Side note:_ Apparently the vocabulary of this model is identical to the one in bert-base-uncased. You can load the tokenizer from `bert-base-uncased` and that works just as well." ] }, { @@ -1274,7 +268,7 @@ "id": "I__1ubvcZYow" }, "source": [ - "### 3. Ask a Question" + "### 2. Ask a Question" ] }, { @@ -1285,9 +279,7 @@ "source": [ "Now we're ready to feed in an example!\n", "\n", - "A QA example consists of a question and a passage of text containing the answer to that question.\n", - "\n", - "Let's try an example using the text in this tutorial!" + "A QA example consists of a question and a passage of text containing the answer to that question." ] }, { @@ -1297,9 +289,13 @@ }, "source": [ "question = \"How many parameters does BERT-large have?\"\n", - "answer_text = \"BERT-large is really big... 
it has 24-layers and an embedding size of 1,024, for a total of 340M parameters! Altogether it is 1.34GB, so expect it to take a couple minutes to download to your Colab instance.\"" + "context = (\n", + " \"BERT-large is really big... it has 24-layers and an embedding size of 1,024, \"\n", + " \"for a total of 340M parameters! Altogether it is 1.34GB, so expect it to \"\n", + " \"take a couple minutes to download to your Colab instance.\"\n", + ")" ], - "execution_count": 9, + "execution_count": null, "outputs": [] }, { @@ -1308,34 +304,21 @@ "id": "llLvxhScKLZn" }, "source": [ - "We'll need to run the BERT tokenizer against both the `question` and the `answer_text`. To feed these into BERT, we actually concatenate them together and place the special [SEP] token in between.\n" + "We'll need to run the BERT tokenizer against both the `question` and the `context`. To feed these into BERT, we actually concatenate them together and place the special `[SEP]` token in between.\n" ] }, { "cell_type": "code", "metadata": { - "colab": { - "base_uri": "https://localhost:8080/" - }, - "id": "tYoX33CfKGsr", - "outputId": "906e30a7-f04c-4e1b-a2c9-e47369b8a910" + "id": "tYoX33CfKGsr" }, "source": [ "# Apply the tokenizer to the input text, treating them as a text-pair.\n", - "input_ids = tokenizer.encode(question, answer_text)\n", - "\n", - "print('The input has a total of {:} tokens.'.format(len(input_ids)))" + "input_ids = tokenizer.encode(question, context)\n", + "print(f'The input has a total of {len(input_ids)} tokens.')" ], - "execution_count": 10, - "outputs": [ - { - "output_type": "stream", - "name": "stdout", - "text": [ - "The input has a total of 70 tokens.\n" - ] - } - ] + "execution_count": null, + "outputs": [] }, { "cell_type": "markdown", @@ -1349,134 +332,29 @@ { "cell_type": "code", "metadata": { - "colab": { - "base_uri": "https://localhost:8080/" - }, - "id": "Iow838yPNDTv", - "outputId": "e4454942-906f-4b11-d11f-3f1e3ff016cf" + "id": "Iow838yPNDTv" }, 
"source": [ "# BERT only needs the token IDs, but for the purpose of inspecting the \n", "# tokenizer's behavior, let's also get the token strings and display them.\n", "tokens = tokenizer.convert_ids_to_tokens(input_ids)\n", "\n", + "# Display tokens and ids as table.\n", "# For each token and its id...\n", - "for token, id in zip(tokens, input_ids):\n", + "for token, token_id in zip(tokens, input_ids):\n", " \n", " # If this is the [SEP] token, add some space around it to make it stand out.\n", - " if id == tokenizer.sep_token_id:\n", - " print('')\n", + " if token_id == tokenizer.sep_token_id:\n", + " print()\n", " \n", " # Print the token string and its ID in two columns.\n", - " print('{:<12} {:>6,}'.format(token, id))\n", + " print('{:<12} {:>6,}'.format(token, token_id))\n", "\n", - " if id == tokenizer.sep_token_id:\n", - " print('')\n", - " " + " if token_id == tokenizer.sep_token_id:\n", + " print()" ], - "execution_count": 11, - "outputs": [ - { - "output_type": "stream", - "name": "stdout", - "text": [ - "[CLS] 101\n", - "how 2,129\n", - "many 2,116\n", - "parameters 11,709\n", - "does 2,515\n", - "bert 14,324\n", - "- 1,011\n", - "large 2,312\n", - "have 2,031\n", - "? 1,029\n", - "\n", - "[SEP] 102\n", - "\n", - "bert 14,324\n", - "- 1,011\n", - "large 2,312\n", - "is 2,003\n", - "really 2,428\n", - "big 2,502\n", - ". 1,012\n", - ". 1,012\n", - ". 1,012\n", - "it 2,009\n", - "has 2,038\n", - "24 2,484\n", - "- 1,011\n", - "layers 9,014\n", - "and 1,998\n", - "an 2,019\n", - "em 7,861\n", - "##bed 8,270\n", - "##ding 4,667\n", - "size 2,946\n", - "of 1,997\n", - "1 1,015\n", - ", 1,010\n", - "02 6,185\n", - "##4 2,549\n", - ", 1,010\n", - "for 2,005\n", - "a 1,037\n", - "total 2,561\n", - "of 1,997\n", - "340 16,029\n", - "##m 2,213\n", - "parameters 11,709\n", - "! 999\n", - "altogether 10,462\n", - "it 2,009\n", - "is 2,003\n", - "1 1,015\n", - ". 
1,012\n", - "34 4,090\n", - "##gb 18,259\n", - ", 1,010\n", - "so 2,061\n", - "expect 5,987\n", - "it 2,009\n", - "to 2,000\n", - "take 2,202\n", - "a 1,037\n", - "couple 3,232\n", - "minutes 2,781\n", - "to 2,000\n", - "download 8,816\n", - "to 2,000\n", - "your 2,115\n", - "cola 15,270\n", - "##b 2,497\n", - "instance 6,013\n", - ". 1,012\n", - "\n", - "[SEP] 102\n", - "\n" - ] - } - ] - }, - { - "cell_type": "markdown", - "metadata": { - "id": "zm208EApN16k" - }, - "source": [ - "We've concatenated the `question` and `answer_text` together, but BERT still needs a way to distinguish them. BERT has two special \"Segment\" embeddings, one for segment \"A\" and one for segment \"B\". Before the word embeddings go into the BERT layers, the segment A embedding needs to be added to the `question` tokens, and the segment B embedding needs to be added to each of the `answer_text` tokens." - ] - }, - { - "cell_type": "markdown", - "metadata": { - "id": "a30sBTcqQv6X" - }, - "source": [ - ">*Side Note: Where's the padding?*\n", - ">\n", - "> The original [example code](https://huggingface.co/transformers/model_doc/bert.html?highlight=bertforquestionanswering#transformers.BertForQuestionAnswering) does not perform any padding. I suspect that this is because we are only feeding in a *single example*. If we instead fed in a batch of examples, then we would need to pad or truncate all of the samples in the batch to a single length, and supply an attention mask to tell BERT to ignore the padding tokens. 
" - ] + "execution_count": null, + "outputs": [] }, { "cell_type": "markdown", @@ -1494,30 +372,29 @@ "id": "HK0obn5x-1EI" }, "source": [ - "inputs = tokenizer(question, answer_text, return_tensors='pt')\n", - "start_positions = torch.tensor([1])\n", - "end_positions = torch.tensor([3])\n", + "import torch\n", "\n", - "outputs = model(**inputs, start_positions=start_positions, end_positions=end_positions)\n", + "inputs = tokenizer(question, context, return_tensors='pt')\n", + "with torch.no_grad():\n", + " outputs = model(**inputs)\n", "\n", "start_scores = outputs.start_logits\n", - "end_scores = outputs.end_logits" + "end_scores = outputs.end_logits\n", + "start_scores" ], - "execution_count": 17, + "execution_count": null, "outputs": [] }, { - "cell_type": "code", + "cell_type": "markdown", "metadata": { - "id": "DQiKr6Aw-YTg" + "id": "a30sBTcqQv6X" }, "source": [ - "# Run our example through the model.\n", - "# start_scores, end_scores = model(torch.tensor([input_ids])) # The tokens representing our input text.\n", - "\n" - ], - "execution_count": 18, - "outputs": [] + ">*Side Note: Where's the padding?*\n", + ">\n", + "> The original [example code](https://huggingface.co/transformers/model_doc/bert.html?highlight=bertforquestionanswering#transformers.BertForQuestionAnswering) does not perform any padding. I suspect that this is because we are only feeding in a *single example*. If we instead fed in a batch of examples, then we would need to pad or truncate all of the samples in the batch to a single length, and supply an attention mask to tell BERT to ignore the padding tokens. 
" + ] }, { "cell_type": "markdown", @@ -1531,46 +408,7 @@ { "cell_type": "code", "metadata": { - "id": "uC2ArgLf-Pi3", - "outputId": "43834471-7224-47df-9437-414b05c9c89a", - "colab": { - "base_uri": "https://localhost:8080/" - } - }, - "source": [ - "start_scores" - ], - "execution_count": 19, - "outputs": [ - { - "output_type": "execute_result", - "data": { - "text/plain": [ - "tensor([[-4.6549, -5.4920, -6.9543, -6.7978, -7.1190, -6.0274, -7.6631, -7.2082,\n", - " -7.0247, -7.7690, -5.1297, -0.3305, -5.2058, -3.4652, -5.0982, -3.6160,\n", - " -3.1994, -5.3622, -4.9089, -4.3704, 0.1852, -3.1188, 0.8591, -4.5655,\n", - " -3.5403, -5.3101, -2.1212, -2.7155, -5.5414, -5.5158, -3.3945, -4.0354,\n", - " 3.2313, -3.4973, -3.2838, -3.3052, -5.1053, 0.2443, 2.3932, 2.4217,\n", - " -1.7133, 8.3842, -0.9214, -2.0461, -3.8585, -0.5486, -2.0815, -5.2040,\n", - " -0.2521, -4.4770, -1.9723, -4.0387, -5.5288, -5.0099, -5.4694, -5.3426,\n", - " -6.2675, -5.2602, -4.2696, -3.3130, -5.1041, -6.8950, -4.9450, -7.1310,\n", - " -6.1638, -4.3083, -6.5881, -5.6170, -6.0569, -5.1298]],\n", - " grad_fn=)" - ] - }, - "metadata": {}, - "execution_count": 19 - } - ] - }, - { - "cell_type": "code", - "metadata": { - "colab": { - "base_uri": "https://localhost:8080/" - }, - "id": "LeUQ44hAJmn9", - "outputId": "4a0b27eb-cbe5-45b2-cd86-46c37f284c31" + "id": "LeUQ44hAJmn9" }, "source": [ "# Find the tokens with the highest `start` and `end` scores.\n", @@ -1578,20 +416,12 @@ "answer_end = torch.argmax(end_scores)\n", "\n", "# Combine the tokens in the answer and print it out.\n", - "answer = ' '.join(tokens[answer_start:answer_end+1])\n", + "answer = ' '.join(tokens[answer_start : answer_end + 1])\n", "\n", - "print('Answer: \"' + answer + '\"')" + "print(f'Answer: \"{answer}\"')" ], - "execution_count": 20, - "outputs": [ - { - "output_type": "stream", - "name": "stdout", - "text": [ - "Answer: \"340 ##m\"\n" - ] - } - ] + "execution_count": null, + "outputs": [] }, { "cell_type": "markdown", 
@@ -1623,39 +453,14 @@ { "cell_type": "code", "metadata": { - "colab": { - "base_uri": "https://localhost:8080/" - }, - "id": "Khral6HZXCuI", - "outputId": "814ba769-d3cc-48af-8a0f-9c2275ac8f74" + "id": "pBrAsWMJrw7i" }, "source": [ - "# Start with the first token.\n", - "answer = tokens[answer_start]\n", - "\n", - "# Select the remaining answer tokens and join them with whitespace.\n", - "for i in range(answer_start + 1, answer_end + 1):\n", - " \n", - " # If it's a subword token, then recombine it with the previous token.\n", - " if tokens[i][0:2] == '##':\n", - " answer += tokens[i][2:]\n", - " \n", - " # Otherwise, add a space then the token.\n", - " else:\n", - " answer += ' ' + tokens[i]\n", - "\n", - "print('Answer: \"' + answer + '\"')" + "answer = tokenizer.convert_tokens_to_string(tokens[answer_start : answer_end + 1])\n", + "print(f'Answer: \"{answer}\"')" ], - "execution_count": 21, - "outputs": [ - { - "output_type": "stream", - "name": "stdout", - "text": [ - "Answer: \"340m\"\n" - ] - } - ] + "execution_count": null, + "outputs": [] }, { "cell_type": "markdown", @@ -1663,7 +468,7 @@ "id": "-hh6nkIdXq-O" }, "source": [ - "### 4. Visualizing Scores" + "### 3. Visualizing Scores" ] }, { @@ -1688,10 +493,10 @@ "sns.set(style='darkgrid')\n", "\n", "# Increase the plot size and font size.\n", - "#sns.set(font_scale=1.5)\n", - "plt.rcParams[\"figure.figsize\"] = (16,8)" + "plt.rcParams['figure.figsize'] = (16, 8)\n", + "plt.rcParams['font.size'] = 16" ], - "execution_count": 22, + "execution_count": null, "outputs": [] }, { @@ -1710,16 +515,16 @@ }, "source": [ "# Pull the scores out of PyTorch Tensors and convert them to 1D numpy arrays.\n", - "s_scores = start_scores.detach().numpy().flatten()\n", - "e_scores = end_scores.detach().numpy().flatten()\n", + "start_scores = start_scores.numpy().flatten()\n", + "end_scores = end_scores.numpy().flatten()\n", "\n", "# We'll use the tokens as the x-axis labels. 
In order to do that, they all need\n", "# to be unique, so we'll add the token index to the end of each one.\n", "token_labels = []\n", "for (i, token) in enumerate(tokens):\n", - " token_labels.append('{:} - {:>2}'.format(token, i))\n" + " token_labels.append('{:} - {:>2}'.format(token, i))" ], - "execution_count": 23, + "execution_count": null, "outputs": [] }, { @@ -1734,38 +539,11 @@ { "cell_type": "code", "metadata": { - "id": "w2Np8FON7rRg" - }, - "source": [ - "import matplotlib" - ], - "execution_count": 24, - "outputs": [] - }, - { - "cell_type": "code", - "metadata": { - "id": "Xq3ZsP3L7rRg" - }, - "source": [ - "matplotlib.rcParams.update({'figure.figsize': (16, 12), 'font.size': 16})" - ], - "execution_count": 25, - "outputs": [] - }, - { - "cell_type": "code", - "metadata": { - "colab": { - "base_uri": "https://localhost:8080/", - "height": 756 - }, - "id": "y6OAV1dL3-UB", - "outputId": "9ae0038f-6c63-4365-ef06-0f750358a2c5" + "id": "y6OAV1dL3-UB" }, "source": [ "# Create a barplot showing the start word score for all of the tokens.\n", - "ax = sns.barplot(x=token_labels, y=s_scores, ci=None)\n", + "ax = sns.barplot(x=token_labels, y=start_scores, ci=None)\n", "\n", "# Turn the xlabels vertical.\n", "ax.set_xticklabels(ax.get_xticklabels(), rotation=90, ha=\"center\")\n", @@ -1773,23 +551,10 @@ "# Turn on the vertical grid to help align words to scores.\n", "ax.grid(True)\n", "\n", - "plt.title('Start Word Scores')\n", - "\n", - "plt.show()" + "plt.title('Start Word Scores');" ], - "execution_count": 26, - "outputs": [ - { - "output_type": "display_data", - "data": { - "image/png": "\n", - "text/plain": [ - "
" - ] - }, - "metadata": {} - } - ] + "execution_count": null, + "outputs": [] }, { "cell_type": "markdown", @@ -1803,16 +568,11 @@ { "cell_type": "code", "metadata": { - "colab": { - "base_uri": "https://localhost:8080/", - "height": 756 - }, - "id": "6tXEqIp-Tzou", - "outputId": "24e6ca48-f649-49b4-f08d-59d0ba691f13" + "id": "6tXEqIp-Tzou" }, "source": [ "# Create a barplot showing the end word score for all of the tokens.\n", - "ax = sns.barplot(x=token_labels, y=e_scores, ci=None)\n", + "ax = sns.barplot(x=token_labels, y=end_scores, ci=None)\n", "\n", "# Turn the xlabels vertical.\n", "ax.set_xticklabels(ax.get_xticklabels(), rotation=90, ha=\"center\")\n", @@ -1820,23 +580,10 @@ "# Turn on the vertical grid to help align words to scores.\n", "ax.grid(True)\n", "\n", - "plt.title('End Word Scores')\n", - "\n", - "plt.show()" + "plt.title('End Word Scores');" ], - "execution_count": 27, - "outputs": [ - { - "output_type": "display_data", - "data": { - "image/png": "\n", - "text/plain": [ - "
" - ] - }, - "metadata": {} - } - ] + "execution_count": null, + "outputs": [] }, { "cell_type": "markdown", @@ -1865,66 +612,41 @@ "\n", " # Add the token's start score as one row.\n", " scores.append({'token_label': token_label, \n", - " 'score': s_scores[i],\n", + " 'score': start_scores[i],\n", " 'marker': 'start'})\n", " \n", " # Add the token's end score as another row.\n", " scores.append({'token_label': token_label, \n", - " 'score': e_scores[i],\n", + " 'score': end_scores[i],\n", " 'marker': 'end'})\n", " \n", - "df = pd.DataFrame(scores)\n" - ], - "execution_count": 28, - "outputs": [] - }, - { - "cell_type": "code", - "metadata": { - "id": "85HYAszU7rRi" - }, - "source": [ - "sns.set(font_scale=1.8)" + "df = pd.DataFrame(scores)" ], - "execution_count": 29, + "execution_count": null, "outputs": [] }, { "cell_type": "code", "metadata": { - "colab": { - "base_uri": "https://localhost:8080/", - "height": 292 - }, - "id": "07xyo-I97Ntt", - "outputId": "9031d54e-5e9e-4554-b480-750854e77dc2" + "id": "07xyo-I97Ntt" }, "source": [ "# Draw a grouped barplot to show start and end scores for each word.\n", "# The \"hue\" parameter is where we tell it which datapoints belong to which\n", "# of the two series.\n", - "g = sns.catplot(x=\"token_label\", y=\"score\", hue=\"marker\", data=df,\n", - " kind=\"bar\", height=6, aspect=4)\n", + "plot = sns.catplot(\n", + " x=\"token_label\", y=\"score\", hue=\"marker\",\n", + " data=df, kind=\"bar\", height=6, aspect=4\n", + ")\n", "\n", "# Turn the xlabels vertical.\n", - "g.set_xticklabels(g.ax.get_xticklabels(), rotation=90, ha=\"center\")\n", + "plot.set_xticklabels(plot.ax.get_xticklabels(), rotation=90, ha=\"center\")\n", "\n", "# Turn on the vertical grid to help align words to scores.\n", - "g.ax.grid(True)\n" + "plot.ax.grid(True);" ], - "execution_count": 30, - "outputs": [ - { - "output_type": "display_data", - "data": { - "image/png": "\n", - "text/plain": [ - "
" - ] - }, - "metadata": {} - } - ] + "execution_count": null, + "outputs": [] }, { "cell_type": "markdown", @@ -1932,7 +654,7 @@ "id": "8UyBYNmeegGf" }, "source": [ - "### 5. More Examples" + "### 4. More Examples" ] }, { @@ -1950,31 +672,17 @@ "id": "rH8NbBlsfxZ_" }, "source": [ - "def answer_question(question, answer_text):\n", - " '''\n", - " Takes a `question` string and an `answer_text` string (which contains the\n", - " answer), and identifies the words within the `answer_text` that are the\n", - " answer. Prints them out.\n", - " '''\n", + "def answer_question(question, context):\n", " # ======== Tokenize ========\n", " # Apply the tokenizer to the input text, treating them as a text-pair.\n", - " inputs = tokenizer(question, answer_text, return_tensors='pt')\n", - " input_ids = tokenizer.encode(question, answer_text)\n", - "\n", - " start_positions = torch.tensor([1])\n", - " end_positions = torch.tensor([3])\n", - "\n", - "\n", - " # Report how long the input sequence is.\n", - " # print('Query has {:,} tokens.\\n'.format(len(input_ids)))\n", + " inputs = tokenizer(question, context, return_tensors='pt')\n", + " input_ids = inputs.input_ids.numpy().flatten()\n", "\n", " # ======== Evaluate ========\n", " # Run our example question through the model.\n", - " outputs = model(**inputs, start_positions=start_positions, end_positions=end_positions)\n", - "\n", + " outputs = model(**inputs)\n", " start_scores = outputs.start_logits\n", " end_scores = outputs.end_logits\n", - " # token_type_ids=torch.tensor([segment_ids])) # The segment IDs to differentiate question from answer_text\n", "\n", " # ======== Reconstruct Answer ========\n", " # Find the tokens with the highest `start` and `end` scores.\n", @@ -1982,26 +690,13 @@ " answer_end = torch.argmax(end_scores)\n", "\n", " # Get the string versions of the input tokens.\n", - " tokens = tokenizer.convert_ids_to_tokens(input_ids)\n", - "\n", - " # Start with the first token.\n", - " answer = 
tokens[answer_start]\n", - "\n", - " # Select the remaining answer tokens and join them with whitespace.\n", - " for i in range(answer_start + 1, answer_end + 1):\n", - " \n", - " # If it's a subword token, then recombine it with the previous token.\n", - " if tokens[i][0:2] == '##':\n", - " answer += tokens[i][2:]\n", - " \n", - " # Otherwise, add a space then the token.\n", - " else:\n", - " answer += ' ' + tokens[i]\n", - "\n", - " print('Answer: \"' + answer + '\"')\n", + " token_ids = input_ids[answer_start : answer_end + 1]\n", + " tokens = tokenizer.convert_ids_to_tokens(token_ids)\n", + " answer = tokenizer.convert_tokens_to_string(tokens)\n", + "\n", " return answer" ], - "execution_count": 34, + "execution_count": null, "outputs": [] }, { @@ -2016,80 +711,50 @@ { "cell_type": "code", "metadata": { - "colab": { - "base_uri": "https://localhost:8080/" - }, - "id": "y4VPq6FdjxyX", - "outputId": "e2991979-0599-43fd-ab82-10d9795018e9" - }, - "source": [ - "import textwrap\n", - "\n", - "# Wrap text to 80 characters.\n", - "wrapper = textwrap.TextWrapper(width=80) \n", - "\n", - "bert_abstract = \"We introduce a new language representation model called BERT, which stands for Bidirectional Encoder Representations from Transformers. Unlike recent language representation models (Peters et al., 2018a; Radford et al., 2018), BERT is designed to pretrain deep bidirectional representations from unlabeled text by jointly conditioning on both left and right context in all layers. As a result, the pre-trained BERT model can be finetuned with just one additional output layer to create state-of-the-art models for a wide range of tasks, such as question answering and language inference, without substantial taskspecific architecture modifications. BERT is conceptually simple and empirically powerful. 
It obtains new state-of-the-art results on eleven natural language processing tasks, including pushing the GLUE score to 80.5% (7.7% point absolute improvement), MultiNLI accuracy to 86.7% (4.6% absolute improvement), SQuAD v1.1 question answering Test F1 to 93.2 (1.5 point absolute improvement) and SQuAD v2.0 Test F1 to 83.1 (5.1 point absolute improvement).\"\n", - "\n", - "print(wrapper.fill(bert_abstract))" + "id": "mqfBGgc8AKk2" + }, + "source": [ + "bert_abstract = (\n", + " 'We introduce a new language representation model called BERT, which stands for '\n", + " 'Bidirectional Encoder Representations from Transformers. Unlike recent language '\n", + " 'representation models (Peters et al., 2018a; Radford et al., 2018), BERT is '\n", + " 'designed to pretrain deep bidirectional representations from unlabeled text by '\n", + " 'jointly conditioning on both left and right context in all layers. As a result, '\n", + " 'the pre-trained BERT model can be finetuned with just one additional output '\n", + " 'layer to create state-of-the-art models for a wide range of tasks, such as '\n", + " 'question answering and language inference, without substantial taskspecific '\n", + " 'architecture modifications. BERT is conceptually simple and empirically '\n", + " 'powerful. It obtains new state-of-the-art results on eleven natural language '\n", + " 'processing tasks, including pushing the GLUE score to 80.5% (7.7% point absolute '\n", + " 'improvement), MultiNLI accuracy to 86.7% (4.6% absolute improvement), SQuAD v1.1 '\n", + " 'question answering Test F1 to 93.2 (1.5 point absolute improvement) and SQuAD '\n", + " 'v2.0 Test F1 to 83.1 (5.1 point absolute improvement).'\n", + ")" ], - "execution_count": 35, - "outputs": [ - { - "output_type": "stream", - "name": "stdout", - "text": [ - "We introduce a new language representation model called BERT, which stands for\n", - "Bidirectional Encoder Representations from Transformers. 
Unlike recent language\n", - "representation models (Peters et al., 2018a; Radford et al., 2018), BERT is\n", - "designed to pretrain deep bidirectional representations from unlabeled text by\n", - "jointly conditioning on both left and right context in all layers. As a result,\n", - "the pre-trained BERT model can be finetuned with just one additional output\n", - "layer to create state-of-the-art models for a wide range of tasks, such as\n", - "question answering and language inference, without substantial taskspecific\n", - "architecture modifications. BERT is conceptually simple and empirically\n", - "powerful. It obtains new state-of-the-art results on eleven natural language\n", - "processing tasks, including pushing the GLUE score to 80.5% (7.7% point absolute\n", - "improvement), MultiNLI accuracy to 86.7% (4.6% absolute improvement), SQuAD v1.1\n", - "question answering Test F1 to 93.2 (1.5 point absolute improvement) and SQuAD\n", - "v2.0 Test F1 to 83.1 (5.1 point absolute improvement).\n" - ] - } - ] + "execution_count": null, + "outputs": [] }, { "cell_type": "markdown", "metadata": { - "id": "tEB654YCknYv" + "id": "ay_mwbBJAP87" }, "source": [ - "-----------------------------\n", - "Ask BERT what its name stands for (the answer is in the first sentence of the abstract)." + "Let's ask BERT what its name stands for (the answer is in the first sentence of the abstract)." 
] }, { "cell_type": "code", "metadata": { - "colab": { - "base_uri": "https://localhost:8080/" - }, - "id": "wfntqRCBegGj", - "outputId": "92f2877e-5f6f-41a9-b268-cd86ca69ebca" + "id": "y4VPq6FdjxyX" }, "source": [ "question = \"What does the 'B' in BERT stand for?\"\n", - "\n", - "ans = answer_question(question, bert_abstract)" + "answer = answer_question(question, bert_abstract)\n", + "print(f'Answer: \"{answer}\"')" ], - "execution_count": 36, - "outputs": [ - { - "output_type": "stream", - "name": "stdout", - "text": [ - "Answer: \"bidirectional encoder representations from transformers\"\n" - ] - } - ] + "execution_count": null, + "outputs": [] }, { "cell_type": "markdown", @@ -2097,8 +762,7 @@ "id": "B6HcijzxkTO9" }, "source": [ - "---------------------\n", - "Ask BERT about example applications of itself :)\n", + "Let's ask BERT about example applications of itself :)\n", "\n", "The answer to the question comes from this passage from the abstract: \n", "\n", @@ -2111,27 +775,15 @@ { "cell_type": "code", "metadata": { - "colab": { - "base_uri": "https://localhost:8080/" - }, - "id": "MVNVGN5-gI06", - "outputId": "5f001a04-862d-4b8b-d7ba-b75ff259a141" + "id": "MVNVGN5-gI06" }, "source": [ "question = \"What are some example applications of BERT?\"\n", - "\n", - "ans = answer_question(question, bert_abstract)" + "answer = answer_question(question, bert_abstract)\n", + "print(f'Answer: \"{answer}\"')" ], - "execution_count": 37, - "outputs": [ - { - "output_type": "stream", - "name": "stdout", - "text": [ - "Answer: \"question answering and language inference\"\n" - ] - } - ] + "execution_count": null, + "outputs": [] }, { "cell_type": "markdown", @@ -2139,145 +791,30 @@ "id": "WXAJ2wkV7rRl" }, "source": [ - "### Part 3. RuBERT for question answering.\n", - "Here we will use the model pre-trained on the SberQuAD dataset from the [SDSJ-2017 challenge problem B](https://github.com/sberbank-ai/data-science-journey-2017/tree/master/problem_B)." + "## Part 3. 
RuBERT for question answering." ] }, { - "cell_type": "code", + "cell_type": "markdown", "metadata": { - "id": "3JslS5CG7rRl" + "id": "TcnPsGzEbGL6" }, "source": [ - "from deeppavlov import build_model, configs" - ], - "execution_count": 38, - "outputs": [] + "Here we will use the model pre-trained on the SberQuAD dataset from the [SDSJ-2017 challenge problem B](https://github.com/sberbank-ai/data-science-journey-2017/tree/master/problem_B)." + ] }, { "cell_type": "code", "metadata": { - "id": "eUQ7oNQq7rRl", - "outputId": "8f86904e-238b-475c-a6b4-d29f166e6a9b", - "colab": { - "base_uri": "https://localhost:8080/" - } + "id": "3JslS5CG7rRl" }, "source": [ + "from deeppavlov import build_model, configs\n", + "\n", "model_ru = build_model(configs.squad.squad_ru_rubert, download=False)" ], - "execution_count": 39, - "outputs": [ - { - "output_type": "stream", - "name": "stderr", - "text": [ - "[nltk_data] Downloading package punkt to /root/nltk_data...\n", - "[nltk_data] Unzipping tokenizers/punkt.zip.\n", - "[nltk_data] Downloading package stopwords to /root/nltk_data...\n", - "[nltk_data] Unzipping corpora/stopwords.zip.\n", - "[nltk_data] Downloading package perluniprops to /root/nltk_data...\n", - "[nltk_data] Unzipping misc/perluniprops.zip.\n", - "[nltk_data] Downloading package nonbreaking_prefixes to\n", - "[nltk_data] /root/nltk_data...\n" - ] - }, - { - "output_type": "stream", - "name": "stdout", - "text": [ - "WARNING:tensorflow:From /usr/local/lib/python3.7/dist-packages/bert_dp/tokenization.py:125: The name tf.gfile.GFile is deprecated. Please use tf.io.gfile.GFile instead.\n", - "\n" - ] - }, - { - "output_type": "stream", - "name": "stderr", - "text": [ - "[nltk_data] Unzipping corpora/nonbreaking_prefixes.zip.\n" - ] - }, - { - "output_type": "stream", - "name": "stdout", - "text": [ - "WARNING:tensorflow:From /usr/local/lib/python3.7/dist-packages/deeppavlov/core/models/tf_model.py:37: The name tf.Session is deprecated. 
Please use tf.compat.v1.Session instead.\n", - "\n", - "WARNING:tensorflow:From /usr/local/lib/python3.7/dist-packages/deeppavlov/core/models/tf_model.py:222: The name tf.placeholder is deprecated. Please use tf.compat.v1.placeholder instead.\n", - "\n", - "WARNING:tensorflow:From /usr/local/lib/python3.7/dist-packages/deeppavlov/core/models/tf_model.py:222: The name tf.train.Optimizer is deprecated. Please use tf.compat.v1.train.Optimizer instead.\n", - "\n", - "WARNING:tensorflow:From /usr/local/lib/python3.7/dist-packages/deeppavlov/core/models/tf_model.py:193: The name tf.train.AdamOptimizer is deprecated. Please use tf.compat.v1.train.AdamOptimizer instead.\n", - "\n", - "WARNING:tensorflow:From /usr/local/lib/python3.7/dist-packages/deeppavlov/models/bert/bert_squad.py:81: The name tf.ConfigProto is deprecated. Please use tf.compat.v1.ConfigProto instead.\n", - "\n", - "WARNING:tensorflow:From /usr/local/lib/python3.7/dist-packages/deeppavlov/models/bert/bert_squad.py:178: The name tf.placeholder_with_default is deprecated. Please use tf.compat.v1.placeholder_with_default instead.\n", - "\n", - "WARNING:tensorflow:From /usr/local/lib/python3.7/dist-packages/bert_dp/modeling.py:178: The name tf.variable_scope is deprecated. Please use tf.compat.v1.variable_scope instead.\n", - "\n", - "WARNING:tensorflow:From /usr/local/lib/python3.7/dist-packages/bert_dp/modeling.py:418: The name tf.get_variable is deprecated. Please use tf.compat.v1.get_variable instead.\n", - "\n", - "WARNING:tensorflow:From /usr/local/lib/python3.7/dist-packages/bert_dp/modeling.py:499: The name tf.assert_less_equal is deprecated. 
Please use tf.compat.v1.assert_less_equal instead.\n", - "\n", - "WARNING:tensorflow:\n", - "The TensorFlow contrib module will not be included in TensorFlow 2.0.\n", - "For more information, please see:\n", - " * https://github.com/tensorflow/community/blob/master/rfcs/20180907-contrib-sunset.md\n", - " * https://github.com/tensorflow/addons\n", - " * https://github.com/tensorflow/io (for I/O related ops)\n", - "If you depend on functionality not listed there, please file an issue.\n", - "\n", - "WARNING:tensorflow:From /usr/local/lib/python3.7/dist-packages/bert_dp/modeling.py:366: calling dropout (from tensorflow.python.ops.nn_ops) with keep_prob is deprecated and will be removed in a future version.\n", - "Instructions for updating:\n", - "Please use `rate` instead of `keep_prob`. Rate should be set to `rate = 1 - keep_prob`.\n", - "WARNING:tensorflow:From /usr/local/lib/python3.7/dist-packages/bert_dp/modeling.py:680: dense (from tensorflow.python.layers.core) is deprecated and will be removed in a future version.\n", - "Instructions for updating:\n", - "Use keras.layers.Dense instead.\n", - "WARNING:tensorflow:From /usr/local/lib/python3.7/dist-packages/tensorflow_core/python/layers/core.py:187: Layer.apply (from tensorflow.python.keras.engine.base_layer) is deprecated and will be removed in a future version.\n", - "Instructions for updating:\n", - "Please use `layer.__call__` method instead.\n", - "WARNING:tensorflow:From /usr/local/lib/python3.7/dist-packages/bert_dp/modeling.py:283: The name tf.erf is deprecated. Please use tf.math.erf instead.\n", - "\n", - "WARNING:tensorflow:From /usr/local/lib/python3.7/dist-packages/deeppavlov/models/bert/bert_squad.py:154: The name tf.matrix_band_part is deprecated. 
Please use tf.linalg.band_part instead.\n", - "\n", - "WARNING:tensorflow:From /usr/local/lib/python3.7/dist-packages/deeppavlov/models/bert/bert_squad.py:166: softmax_cross_entropy_with_logits (from tensorflow.python.ops.nn_ops) is deprecated and will be removed in a future version.\n", - "Instructions for updating:\n", - "\n", - "Future major versions of TensorFlow will allow gradients to flow\n", - "into the labels input on backprop by default.\n", - "\n", - "See `tf.nn.softmax_cross_entropy_with_logits_v2`.\n", - "\n", - "WARNING:tensorflow:From /usr/local/lib/python3.7/dist-packages/deeppavlov/core/models/tf_model.py:234: The name tf.train.AdadeltaOptimizer is deprecated. Please use tf.compat.v1.train.AdadeltaOptimizer instead.\n", - "\n", - "WARNING:tensorflow:From /usr/local/lib/python3.7/dist-packages/deeppavlov/core/models/tf_model.py:127: The name tf.get_collection is deprecated. Please use tf.compat.v1.get_collection instead.\n", - "\n", - "WARNING:tensorflow:From /usr/local/lib/python3.7/dist-packages/deeppavlov/core/models/tf_model.py:127: The name tf.GraphKeys is deprecated. Please use tf.compat.v1.GraphKeys instead.\n", - "\n", - "WARNING:tensorflow:From /usr/local/lib/python3.7/dist-packages/deeppavlov/models/bert/bert_squad.py:89: The name tf.global_variables_initializer is deprecated. 
Please use tf.compat.v1.global_variables_initializer instead.\n", - "\n", - "WARNING:tensorflow:From /usr/local/lib/python3.7/dist-packages/deeppavlov/models/bert/bert_squad.py:94: checkpoint_exists (from tensorflow.python.training.checkpoint_management) is deprecated and will be removed in a future version.\n", - "Instructions for updating:\n", - "Use standard file APIs to check for files with this prefix.\n" - ] - }, - { - "output_type": "stream", - "name": "stderr", - "text": [ - "2021-10-14 22:46:59.972 INFO in 'deeppavlov.core.models.tf_model'['tf_model'] at line 51: [loading model from /root/.deeppavlov/models/squad_ru_bert/model_rubert]\n" - ] - }, - { - "output_type": "stream", - "name": "stdout", - "text": [ - "WARNING:tensorflow:From /usr/local/lib/python3.7/dist-packages/deeppavlov/core/models/tf_model.py:54: The name tf.train.Saver is deprecated. Please use tf.compat.v1.train.Saver instead.\n", - "\n", - "INFO:tensorflow:Restoring parameters from /root/.deeppavlov/models/squad_ru_bert/model_rubert\n" - ] - } - ] + "execution_count": null, + "outputs": [] }, { "cell_type": "markdown", @@ -2294,209 +831,148 @@ "id": "l5pDyTRL7rRl" }, "source": [ - "text = \"\"\"Первая многоразовая ступень ракеты-носителя Falcon 9 успешно отделилась через две с половиной минуты после старта и автоматически приземлилась на плавучую платформу Of Course I Still Love You у берегов Флориды. Через 12 минут после запуска космический корабль Crew Dragon вышел на расчетную орбиту и отделился от второй ступени ракеты.\n", - "\n", - "Сближение корабля Crew Dragon с Международной космической станцией запланировано на 31 мая. К стыковочному адаптеру на узловом модуле «Гармония» американского сегмента МКС Crew Dragon должен причалить в ручном или, при необходимости, в автоматическом режиме. 
Эта процедура запланирована на 10:29 по времени Восточного побережья США (17:29 по московскому времени).\n", - "\n", - "В испытательном полете DM2 астронавт Херли является командиром космического корабля (spacecraft commander), а его напарник Бенкен — командир по операциям стыковки и расстыковки (joint operations commander). Фактически это означает, что именно Херли управляет Crew Dragon в полете к МКС, к которой они должны пристыковаться в течение суток после старта. Херли и Бенкен также будут выполнять необходимые для сертификации НАСА проверки систем корабля в полете.\n", - "\n", - "Во время полета Херли и Бенкен провели небольшую экскурсию по Crew Dragon.\"\"\"\n", - "\n", - "# Source: https://habr.com/ru/news/t/504642/" + "context = (\n", + " 'Первая многоразовая ступень ракеты-носителя Falcon 9 успешно отделилась через две с половиной '\n", + " 'минуты после старта и автоматически приземлилась на плавучую платформу Of Course I Still '\n", + " 'Love You у берегов Флориды. Через 12 минут после запуска космический корабль Crew Dragon '\n", + " 'вышел на расчетную орбиту и отделился от второй ступени ракеты.'\n", + " '\\n\\n'\n", + " 'Сближение корабля Crew Dragon с Международной космической станцией запланировано на 31 мая. '\n", + " 'К стыковочному адаптеру на узловом модуле «Гармония» американского сегмента МКС Crew Dragon '\n", + " 'должен причалить в ручном или, при необходимости, в автоматическом режиме. Эта процедура '\n", + " 'запланирована на 10:29 по времени Восточного побережья США (17:29 по московскому времени).'\n", + " '\\n\\n'\n", + " 'В испытательном полете DM2 астронавт Херли является командиром космического корабля (spacecraft '\n", + " 'commander), а его напарник Бенкен — командир по операциям стыковки и расстыковки (joint '\n", + " 'operations commander). Фактически это означает, что именно Херли управляет Crew Dragon в '\n", + " 'полете к МКС, к которой они должны пристыковаться в течение суток после старта. 
Херли и Бенкен '\n", + " 'также будут выполнять необходимые для сертификации НАСА проверки систем корабля в полете.'\n", + " '\\n\\n'\n", + " 'Во время полета Херли и Бенкен провели небольшую экскурсию по Crew Dragon.'\n", + ")" ], - "execution_count": 40, + "execution_count": null, "outputs": [] }, { - "cell_type": "code", + "cell_type": "markdown", "metadata": { - "id": "e9Llg3Jb7rRm", - "outputId": "7d49cc67-8868-4fa4-89cb-33a236b1b0d4", - "colab": { - "base_uri": "https://localhost:8080/" - } + "id": "5tVX9PJ_GPE-" }, "source": [ - "print(text)" - ], - "execution_count": 41, - "outputs": [ - { - "output_type": "stream", - "name": "stdout", - "text": [ - "Первая многоразовая ступень ракеты-носителя Falcon 9 успешно отделилась через две с половиной минуты после старта и автоматически приземлилась на плавучую платформу Of Course I Still Love You у берегов Флориды. Через 12 минут после запуска космический корабль Crew Dragon вышел на расчетную орбиту и отделился от второй ступени ракеты.\n", - "\n", - "Сближение корабля Crew Dragon с Международной космической станцией запланировано на 31 мая. К стыковочному адаптеру на узловом модуле «Гармония» американского сегмента МКС Crew Dragon должен причалить в ручном или, при необходимости, в автоматическом режиме. Эта процедура запланирована на 10:29 по времени Восточного побережья США (17:29 по московскому времени).\n", - "\n", - "В испытательном полете DM2 астронавт Херли является командиром космического корабля (spacecraft commander), а его напарник Бенкен — командир по операциям стыковки и расстыковки (joint operations commander). Фактически это означает, что именно Херли управляет Crew Dragon в полете к МКС, к которой они должны пристыковаться в течение суток после старта. 
Херли и Бенкен также будут выполнять необходимые для сертификации НАСА проверки систем корабля в полете.\n", - "\n", - "Во время полета Херли и Бенкен провели небольшую экскурсию по Crew Dragon.\n" - ] - } + "And here is how to use DeepPavlov's model:" ] }, { "cell_type": "code", "metadata": { - "id": "a8SNVPlk7rRm", - "outputId": "ec147003-7b0c-48ec-c252-3f9c08a63c3d", - "colab": { - "base_uri": "https://localhost:8080/" - } + "id": "05BDo1IjGFPG" }, "source": [ - "model_ru([text], ['Когда отделилась первая ступень?'])" + "question = 'Когда отделилась первая ступень?'\n", + "model_ru([context], [question])" ], - "execution_count": 42, - "outputs": [ - { - "output_type": "execute_result", - "data": { - "text/plain": [ - "[['через две с половиной минуты после старта'], [72], [2055731.625]]" - ] - }, - "metadata": {}, - "execution_count": 42 - } - ] + "execution_count": null, + "outputs": [] }, { - "cell_type": "code", + "cell_type": "markdown", "metadata": { - "id": "98PIvy4g7rRm", - "outputId": "3fab7b6e-31b8-4704-9bb6-e3a2ff1b63ff", - "colab": { - "base_uri": "https://localhost:8080/" - } + "id": "yyRAYAc_GxAL" }, "source": [ - "model_ru([text], ['На какую дату запланирована стыковка?'])" - ], - "execution_count": 43, - "outputs": [ - { - "output_type": "execute_result", - "data": { - "text/plain": [ - "[['на 31 мая'], [418], [31752.884765625]]" - ] - }, - "metadata": {}, - "execution_count": 43 - } + "The model returns a list with the answer, the answer's starting position in the context, and the answer logit.\n", + "\n", + "This yields the following `answer_question_ru` function."
] }, { "cell_type": "code", "metadata": { - "id": "K1BK3PAm7rRn", - "outputId": "eddcc670-5fab-49f4-c08a-f85801747d0e", - "colab": { - "base_uri": "https://localhost:8080/" - } + "id": "UXi5hm_AEFB4" }, "source": [ - "model_ru([text], ['Кто участвует в полете?'])" + "def answer_question_ru(question, context):\n", + " output = model_ru([context], [question])\n", + " return output[0][0]" ], - "execution_count": 44, - "outputs": [ - { - "output_type": "execute_result", - "data": { - "text/plain": [ - "[['астронавт Херли'], [729], [139.62789916992188]]" - ] - }, - "metadata": {}, - "execution_count": 44 - } + "execution_count": null, + "outputs": [] + }, + { + "cell_type": "markdown", + "metadata": { + "id": "0wfCi3FvHBuL" + }, + "source": [ + "Let's ask a bunch of other questions to the model." ] }, { "cell_type": "code", "metadata": { - "id": "Ugo2Wyd57rRn", - "outputId": "82312fa9-aede-47b6-8db1-d512391c200d", - "colab": { - "base_uri": "https://localhost:8080/" - } + "id": "98PIvy4g7rRm" }, "source": [ - "model_ru([text], ['Кто участвует в полете кроме астронавта Херли?'])" + "question = 'На какую дату запланирована стыковка?'\n", + "answer = answer_question_ru(question, context)\n", + "print(f'Ответ: \"{answer}\"')" ], - "execution_count": 45, - "outputs": [ - { - "output_type": "execute_result", - "data": { - "text/plain": [ - "[['Бенкен'], [1063], [13.483261108398438]]" - ] - }, - "metadata": {}, - "execution_count": 45 - } - ] + "execution_count": null, + "outputs": [] }, { "cell_type": "code", "metadata": { - "id": "I-AwQsIU7rRn", - "outputId": "94c9b358-d85a-4734-8a82-d1328b9beb68", - "colab": { - "base_uri": "https://localhost:8080/" - } + "id": "K1BK3PAm7rRn" }, "source": [ - "model_ru([text], ['Какая ступень приземлилась на плавучую платформу Of Course I Still Love You?'])" + "question = 'Кто участвует в полете?'\n", + "answer = answer_question_ru(question, context)\n", + "print(f'Ответ: \"{answer}\"')" ], - "execution_count": 46, - "outputs": [ - { - 
"output_type": "execute_result", - "data": { - "text/plain": [ - "[['Первая многоразовая ступень ракеты-носителя Falcon 9'], [0], [582400.5625]]" - ] - }, - "metadata": {}, - "execution_count": 46 - } - ] + "execution_count": null, + "outputs": [] }, { "cell_type": "code", "metadata": { - "id": "dMn2sAWL7rRo" + "id": "Ugo2Wyd57rRn" }, "source": [ - "" + "question = 'Кто участвует в полете кроме астронавта Херли?'\n", + "answer = answer_question_ru(question, context)\n", + "print(f'Ответ: \"{answer}\"')" ], - "execution_count": 46, + "execution_count": null, "outputs": [] }, { "cell_type": "code", "metadata": { - "id": "ldHiNgRW7rRo" + "id": "5B4vytlCYTvs" }, "source": [ - "" + "question = 'Какие астронавты участвовали в полете?'\n", + "answer = answer_question_ru(question, context)\n", + "\n", + "# Notice how model finds the appropriate answer dispite slightly different context.\n", + "print(f'Ответ: \"{answer}\"')" ], - "execution_count": 46, + "execution_count": null, "outputs": [] }, { "cell_type": "code", "metadata": { - "id": "IvT6gNk27rRo" + "id": "I-AwQsIU7rRn" }, "source": [ - "" + "question = 'Какая ступень приземлилась на плавучую платформу Of Course I Still Love You?'\n", + "answer = answer_question_ru(question, context)\n", + "print(f'Ответ: \"{answer}\"')" ], - "execution_count": 46, + "execution_count": null, "outputs": [] }, { @@ -2505,848 +981,244 @@ "id": "ZU4ZxB6o7rRp" }, "source": [ - "### Part 4. Text to speech (with Tacotron 2)." + "## Part 4. Question answering with speech using Tacotron 2." ] }, { - "cell_type": "code", + "cell_type": "markdown", "metadata": { - "id": "xDAPjR_Lx-uZ" + "id": "NVstcIVxadEr" }, "source": [ - "import numpy as np\n", - "from scipy.io.wavfile import write" - ], - "execution_count": 47, - "outputs": [] + "### Text to speech using Tacotron 2." 
+ ] }, { - "cell_type": "code", + "cell_type": "markdown", "metadata": { - "id": "wZLptq5F7rRp" + "id": "aoj8MMIJbTji" }, "source": [ - "assert tacotron2 is not None, 'Tacotron2 by NVIDIA requires CUDA-compatible GPU to infer'" - ], - "execution_count": 48, - "outputs": [] + "Tacotron 2 is a network proposed in 2017 in [Natural TTS Synthesis By Conditioning\n", + "Wavenet On Mel Spectrogram Predictions](https://arxiv.org/pdf/1712.05884.pdf) paper. This network takes an input text and maps it into the mel-frequency spectrogram. This spectrogram is then passed through a modified WaveNet (generative model for audio, original paper can be found [here](https://arxiv.org/pdf/1609.03499.pdf)) to generate the actual speech." + ] }, { - "cell_type": "code", + "cell_type": "markdown", "metadata": { - "colab": { - "base_uri": "https://localhost:8080/" - }, - "id": "B1s3RHawyAJ6", - "outputId": "aa35fb1a-f5eb-478f-e252-ed72f1a5ea75" + "id": "btil2I1zejk3" }, "source": [ - "tacotron2 = tacotron2.to(device)\n", - "tacotron2.eval()" - ], - "execution_count": 49, - "outputs": [ - { - "output_type": "execute_result", - "data": { - "text/plain": [ - "Tacotron2(\n", - " (embedding): Embedding(148, 512)\n", - " (encoder): Encoder(\n", - " (convolutions): ModuleList(\n", - " (0): Sequential(\n", - " (0): ConvNorm(\n", - " (conv): Conv1d(512, 512, kernel_size=(5,), stride=(1,), padding=(2,))\n", - " )\n", - " (1): BatchNorm1d(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n", - " )\n", - " (1): Sequential(\n", - " (0): ConvNorm(\n", - " (conv): Conv1d(512, 512, kernel_size=(5,), stride=(1,), padding=(2,))\n", - " )\n", - " (1): BatchNorm1d(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n", - " )\n", - " (2): Sequential(\n", - " (0): ConvNorm(\n", - " (conv): Conv1d(512, 512, kernel_size=(5,), stride=(1,), padding=(2,))\n", - " )\n", - " (1): BatchNorm1d(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n", - " )\n", - " 
)\n", - " (lstm): LSTM(512, 256, batch_first=True, bidirectional=True)\n", - " )\n", - " (decoder): Decoder(\n", - " (prenet): Prenet(\n", - " (layers): ModuleList(\n", - " (0): LinearNorm(\n", - " (linear_layer): Linear(in_features=80, out_features=256, bias=False)\n", - " )\n", - " (1): LinearNorm(\n", - " (linear_layer): Linear(in_features=256, out_features=256, bias=False)\n", - " )\n", - " )\n", - " )\n", - " (attention_rnn): LSTMCell(768, 1024)\n", - " (attention_layer): Attention(\n", - " (query_layer): LinearNorm(\n", - " (linear_layer): Linear(in_features=1024, out_features=128, bias=False)\n", - " )\n", - " (memory_layer): LinearNorm(\n", - " (linear_layer): Linear(in_features=512, out_features=128, bias=False)\n", - " )\n", - " (v): LinearNorm(\n", - " (linear_layer): Linear(in_features=128, out_features=1, bias=False)\n", - " )\n", - " (location_layer): LocationLayer(\n", - " (location_conv): ConvNorm(\n", - " (conv): Conv1d(2, 32, kernel_size=(31,), stride=(1,), padding=(15,), bias=False)\n", - " )\n", - " (location_dense): LinearNorm(\n", - " (linear_layer): Linear(in_features=32, out_features=128, bias=False)\n", - " )\n", - " )\n", - " )\n", - " (decoder_rnn): LSTMCell(1536, 1024, bias=1)\n", - " (linear_projection): LinearNorm(\n", - " (linear_layer): Linear(in_features=1536, out_features=80, bias=True)\n", - " )\n", - " (gate_layer): LinearNorm(\n", - " (linear_layer): Linear(in_features=1536, out_features=1, bias=True)\n", - " )\n", - " )\n", - " (postnet): Postnet(\n", - " (convolutions): ModuleList(\n", - " (0): Sequential(\n", - " (0): ConvNorm(\n", - " (conv): Conv1d(80, 512, kernel_size=(5,), stride=(1,), padding=(2,))\n", - " )\n", - " (1): BatchNorm1d(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n", - " )\n", - " (1): Sequential(\n", - " (0): ConvNorm(\n", - " (conv): Conv1d(512, 512, kernel_size=(5,), stride=(1,), padding=(2,))\n", - " )\n", - " (1): BatchNorm1d(512, eps=1e-05, momentum=0.1, affine=True, 
track_running_stats=True)\n", - " )\n", - " (2): Sequential(\n", - " (0): ConvNorm(\n", - " (conv): Conv1d(512, 512, kernel_size=(5,), stride=(1,), padding=(2,))\n", - " )\n", - " (1): BatchNorm1d(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n", - " )\n", - " (3): Sequential(\n", - " (0): ConvNorm(\n", - " (conv): Conv1d(512, 512, kernel_size=(5,), stride=(1,), padding=(2,))\n", - " )\n", - " (1): BatchNorm1d(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n", - " )\n", - " (4): Sequential(\n", - " (0): ConvNorm(\n", - " (conv): Conv1d(512, 80, kernel_size=(5,), stride=(1,), padding=(2,))\n", - " )\n", - " (1): BatchNorm1d(80, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n", - " )\n", - " )\n", - " )\n", - ")" - ] - }, - "metadata": {}, - "execution_count": 49 - } + "Let's look more closely at a mel spectrogram (for more info on its nature please refer to the [Tacotron 2 paper](https://arxiv.org/pdf/1712.05884.pdf))." ] }, { "cell_type": "code", "metadata": { - "colab": { - "base_uri": "https://localhost:8080/" - }, - "id": "2y009rzTyBVi", - "outputId": "10277601-fb03-4cab-cb35-0f0d8cd5542b" + "id": "xDAPjR_Lx-uZ" }, "source": [ - "waveglow = torch.hub.load('nvidia/DeepLearningExamples:torchhub', 'nvidia_waveglow')\n", - "waveglow = waveglow.remove_weightnorm(waveglow)\n", - "waveglow = waveglow.to(device)\n", - "waveglow.eval()" + "assert tacotron2 is not None and waveglow is not None, 'Tacotron2 by NVIDIA infers only on GPU, so the Part 4 will not work on CPU-only machine'\n", + "utils = torch.hub.load('NVIDIA/DeepLearningExamples:torchhub', 'nvidia_tts_utils')\n", + "\n", + "text = 'Some test text.'\n", + "sequences, lengths = utils.prepare_input_sequence([text])\n", + "with torch.no_grad():\n", + " mel, _, _ = tacotron2.infer(sequences, lengths)\n", + "\n", + "sns.reset_orig()\n", + "plt.imshow(mel[0].cpu().numpy())\n", + "plt.title('mel-frequency spectrogram');" ], - "execution_count": 50, - 
"outputs": [ - { - "output_type": "stream", - "name": "stderr", - "text": [ - "Using cache found in /root/.cache/torch/hub/nvidia_DeepLearningExamples_torchhub\n", - "Downloading checkpoint from https://api.ngc.nvidia.com/v2/models/nvidia/waveglow_ckpt_fp32/versions/19.09.0/files/nvidia_waveglowpyt_fp32_20190427\n", - "/root/.cache/torch/hub/nvidia_DeepLearningExamples_torchhub/PyTorch/SpeechSynthesis/Tacotron2/waveglow/model.py:55: UserWarning: torch.qr is deprecated in favor of torch.linalg.qr and will be removed in a future PyTorch release.\n", - "The boolean parameter 'some' has been replaced with a string parameter 'mode'.\n", - "Q, R = torch.qr(A, some)\n", - "should be replaced with\n", - "Q, R = torch.linalg.qr(A, 'reduced' if some else 'complete') (Triggered internally at /pytorch/aten/src/ATen/native/BatchLinearAlgebra.cpp:1940.)\n", - " W = torch.qr(torch.FloatTensor(c, c).normal_())[0]\n" - ] - }, - { - "output_type": "execute_result", - "data": { - "text/plain": [ - "WaveGlow(\n", - " (upsample): ConvTranspose1d(80, 80, kernel_size=(1024,), stride=(256,))\n", - " (WN): ModuleList(\n", - " (0): WN(\n", - " (in_layers): ModuleList(\n", - " (0): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(1,))\n", - " (1): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(2,), dilation=(2,))\n", - " (2): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(4,), dilation=(4,))\n", - " (3): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(8,), dilation=(8,))\n", - " (4): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(16,), dilation=(16,))\n", - " (5): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(32,), dilation=(32,))\n", - " (6): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(64,), dilation=(64,))\n", - " (7): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(128,), dilation=(128,))\n", - " )\n", - " (res_skip_layers): ModuleList(\n", - " (0): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", 
- " (1): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (2): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (3): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (4): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (5): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (6): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (7): Conv1d(512, 512, kernel_size=(1,), stride=(1,))\n", - " )\n", - " (cond_layers): ModuleList(\n", - " (0): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (1): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (2): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (3): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (4): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (5): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (6): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (7): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " )\n", - " (start): Conv1d(4, 512, kernel_size=(1,), stride=(1,))\n", - " (end): Conv1d(512, 8, kernel_size=(1,), stride=(1,))\n", - " )\n", - " (1): WN(\n", - " (in_layers): ModuleList(\n", - " (0): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(1,))\n", - " (1): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(2,), dilation=(2,))\n", - " (2): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(4,), dilation=(4,))\n", - " (3): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(8,), dilation=(8,))\n", - " (4): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(16,), dilation=(16,))\n", - " (5): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(32,), dilation=(32,))\n", - " (6): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(64,), dilation=(64,))\n", - " (7): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(128,), dilation=(128,))\n", - " )\n", - " (res_skip_layers): ModuleList(\n", - " (0): Conv1d(512, 1024, kernel_size=(1,), 
stride=(1,))\n", - " (1): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (2): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (3): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (4): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (5): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (6): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (7): Conv1d(512, 512, kernel_size=(1,), stride=(1,))\n", - " )\n", - " (cond_layers): ModuleList(\n", - " (0): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (1): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (2): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (3): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (4): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (5): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (6): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (7): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " )\n", - " (start): Conv1d(4, 512, kernel_size=(1,), stride=(1,))\n", - " (end): Conv1d(512, 8, kernel_size=(1,), stride=(1,))\n", - " )\n", - " (2): WN(\n", - " (in_layers): ModuleList(\n", - " (0): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(1,))\n", - " (1): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(2,), dilation=(2,))\n", - " (2): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(4,), dilation=(4,))\n", - " (3): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(8,), dilation=(8,))\n", - " (4): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(16,), dilation=(16,))\n", - " (5): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(32,), dilation=(32,))\n", - " (6): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(64,), dilation=(64,))\n", - " (7): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(128,), dilation=(128,))\n", - " )\n", - " (res_skip_layers): ModuleList(\n", - " (0): Conv1d(512, 1024, 
kernel_size=(1,), stride=(1,))\n", - " (1): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (2): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (3): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (4): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (5): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (6): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (7): Conv1d(512, 512, kernel_size=(1,), stride=(1,))\n", - " )\n", - " (cond_layers): ModuleList(\n", - " (0): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (1): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (2): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (3): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (4): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (5): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (6): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (7): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " )\n", - " (start): Conv1d(4, 512, kernel_size=(1,), stride=(1,))\n", - " (end): Conv1d(512, 8, kernel_size=(1,), stride=(1,))\n", - " )\n", - " (3): WN(\n", - " (in_layers): ModuleList(\n", - " (0): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(1,))\n", - " (1): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(2,), dilation=(2,))\n", - " (2): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(4,), dilation=(4,))\n", - " (3): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(8,), dilation=(8,))\n", - " (4): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(16,), dilation=(16,))\n", - " (5): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(32,), dilation=(32,))\n", - " (6): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(64,), dilation=(64,))\n", - " (7): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(128,), dilation=(128,))\n", - " )\n", - " (res_skip_layers): ModuleList(\n", - " (0): Conv1d(512, 
1024, kernel_size=(1,), stride=(1,))\n", - " (1): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (2): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (3): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (4): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (5): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (6): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (7): Conv1d(512, 512, kernel_size=(1,), stride=(1,))\n", - " )\n", - " (cond_layers): ModuleList(\n", - " (0): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (1): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (2): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (3): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (4): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (5): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (6): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (7): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " )\n", - " (start): Conv1d(4, 512, kernel_size=(1,), stride=(1,))\n", - " (end): Conv1d(512, 8, kernel_size=(1,), stride=(1,))\n", - " )\n", - " (4): WN(\n", - " (in_layers): ModuleList(\n", - " (0): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(1,))\n", - " (1): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(2,), dilation=(2,))\n", - " (2): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(4,), dilation=(4,))\n", - " (3): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(8,), dilation=(8,))\n", - " (4): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(16,), dilation=(16,))\n", - " (5): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(32,), dilation=(32,))\n", - " (6): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(64,), dilation=(64,))\n", - " (7): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(128,), dilation=(128,))\n", - " )\n", - " (res_skip_layers): ModuleList(\n", - " (0): 
Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (1): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (2): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (3): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (4): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (5): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (6): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (7): Conv1d(512, 512, kernel_size=(1,), stride=(1,))\n", - " )\n", - " (cond_layers): ModuleList(\n", - " (0): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (1): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (2): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (3): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (4): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (5): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (6): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (7): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " )\n", - " (start): Conv1d(3, 512, kernel_size=(1,), stride=(1,))\n", - " (end): Conv1d(512, 6, kernel_size=(1,), stride=(1,))\n", - " )\n", - " (5): WN(\n", - " (in_layers): ModuleList(\n", - " (0): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(1,))\n", - " (1): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(2,), dilation=(2,))\n", - " (2): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(4,), dilation=(4,))\n", - " (3): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(8,), dilation=(8,))\n", - " (4): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(16,), dilation=(16,))\n", - " (5): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(32,), dilation=(32,))\n", - " (6): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(64,), dilation=(64,))\n", - " (7): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(128,), dilation=(128,))\n", - " )\n", - " (res_skip_layers): ModuleList(\n", - " 
(0): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (1): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (2): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (3): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (4): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (5): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (6): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (7): Conv1d(512, 512, kernel_size=(1,), stride=(1,))\n", - " )\n", - " (cond_layers): ModuleList(\n", - " (0): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (1): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (2): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (3): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (4): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (5): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (6): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (7): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " )\n", - " (start): Conv1d(3, 512, kernel_size=(1,), stride=(1,))\n", - " (end): Conv1d(512, 6, kernel_size=(1,), stride=(1,))\n", - " )\n", - " (6): WN(\n", - " (in_layers): ModuleList(\n", - " (0): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(1,))\n", - " (1): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(2,), dilation=(2,))\n", - " (2): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(4,), dilation=(4,))\n", - " (3): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(8,), dilation=(8,))\n", - " (4): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(16,), dilation=(16,))\n", - " (5): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(32,), dilation=(32,))\n", - " (6): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(64,), dilation=(64,))\n", - " (7): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(128,), dilation=(128,))\n", - " )\n", - " (res_skip_layers): ModuleList(\n", - 
" (0): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (1): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (2): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (3): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (4): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (5): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (6): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (7): Conv1d(512, 512, kernel_size=(1,), stride=(1,))\n", - " )\n", - " (cond_layers): ModuleList(\n", - " (0): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (1): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (2): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (3): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (4): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (5): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (6): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (7): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " )\n", - " (start): Conv1d(3, 512, kernel_size=(1,), stride=(1,))\n", - " (end): Conv1d(512, 6, kernel_size=(1,), stride=(1,))\n", - " )\n", - " (7): WN(\n", - " (in_layers): ModuleList(\n", - " (0): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(1,))\n", - " (1): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(2,), dilation=(2,))\n", - " (2): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(4,), dilation=(4,))\n", - " (3): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(8,), dilation=(8,))\n", - " (4): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(16,), dilation=(16,))\n", - " (5): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(32,), dilation=(32,))\n", - " (6): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(64,), dilation=(64,))\n", - " (7): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(128,), dilation=(128,))\n", - " )\n", - " (res_skip_layers): ModuleList(\n", 
- " (0): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (1): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (2): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (3): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (4): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (5): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (6): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (7): Conv1d(512, 512, kernel_size=(1,), stride=(1,))\n", - " )\n", - " (cond_layers): ModuleList(\n", - " (0): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (1): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (2): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (3): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (4): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (5): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (6): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (7): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " )\n", - " (start): Conv1d(3, 512, kernel_size=(1,), stride=(1,))\n", - " (end): Conv1d(512, 6, kernel_size=(1,), stride=(1,))\n", - " )\n", - " (8): WN(\n", - " (in_layers): ModuleList(\n", - " (0): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(1,))\n", - " (1): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(2,), dilation=(2,))\n", - " (2): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(4,), dilation=(4,))\n", - " (3): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(8,), dilation=(8,))\n", - " (4): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(16,), dilation=(16,))\n", - " (5): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(32,), dilation=(32,))\n", - " (6): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(64,), dilation=(64,))\n", - " (7): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(128,), dilation=(128,))\n", - " )\n", - " (res_skip_layers): 
ModuleList(\n", - " (0): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (1): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (2): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (3): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (4): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (5): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (6): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (7): Conv1d(512, 512, kernel_size=(1,), stride=(1,))\n", - " )\n", - " (cond_layers): ModuleList(\n", - " (0): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (1): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (2): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (3): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (4): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (5): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (6): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (7): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " )\n", - " (start): Conv1d(2, 512, kernel_size=(1,), stride=(1,))\n", - " (end): Conv1d(512, 4, kernel_size=(1,), stride=(1,))\n", - " )\n", - " (9): WN(\n", - " (in_layers): ModuleList(\n", - " (0): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(1,))\n", - " (1): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(2,), dilation=(2,))\n", - " (2): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(4,), dilation=(4,))\n", - " (3): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(8,), dilation=(8,))\n", - " (4): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(16,), dilation=(16,))\n", - " (5): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(32,), dilation=(32,))\n", - " (6): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(64,), dilation=(64,))\n", - " (7): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(128,), dilation=(128,))\n", - " )\n", - " 
(res_skip_layers): ModuleList(\n", - " (0): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (1): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (2): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (3): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (4): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (5): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (6): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (7): Conv1d(512, 512, kernel_size=(1,), stride=(1,))\n", - " )\n", - " (cond_layers): ModuleList(\n", - " (0): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (1): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (2): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (3): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (4): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (5): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (6): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (7): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " )\n", - " (start): Conv1d(2, 512, kernel_size=(1,), stride=(1,))\n", - " (end): Conv1d(512, 4, kernel_size=(1,), stride=(1,))\n", - " )\n", - " (10): WN(\n", - " (in_layers): ModuleList(\n", - " (0): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(1,))\n", - " (1): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(2,), dilation=(2,))\n", - " (2): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(4,), dilation=(4,))\n", - " (3): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(8,), dilation=(8,))\n", - " (4): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(16,), dilation=(16,))\n", - " (5): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(32,), dilation=(32,))\n", - " (6): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(64,), dilation=(64,))\n", - " (7): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(128,), dilation=(128,))\n", - " )\n", 
- " (res_skip_layers): ModuleList(\n", - " (0): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (1): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (2): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (3): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (4): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (5): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (6): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (7): Conv1d(512, 512, kernel_size=(1,), stride=(1,))\n", - " )\n", - " (cond_layers): ModuleList(\n", - " (0): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (1): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (2): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (3): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (4): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (5): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (6): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (7): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " )\n", - " (start): Conv1d(2, 512, kernel_size=(1,), stride=(1,))\n", - " (end): Conv1d(512, 4, kernel_size=(1,), stride=(1,))\n", - " )\n", - " (11): WN(\n", - " (in_layers): ModuleList(\n", - " (0): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(1,))\n", - " (1): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(2,), dilation=(2,))\n", - " (2): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(4,), dilation=(4,))\n", - " (3): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(8,), dilation=(8,))\n", - " (4): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(16,), dilation=(16,))\n", - " (5): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(32,), dilation=(32,))\n", - " (6): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(64,), dilation=(64,))\n", - " (7): Conv1d(512, 1024, kernel_size=(3,), stride=(1,), padding=(128,), dilation=(128,))\n", - " 
)\n", - " (res_skip_layers): ModuleList(\n", - " (0): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (1): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (2): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (3): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (4): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (5): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (6): Conv1d(512, 1024, kernel_size=(1,), stride=(1,))\n", - " (7): Conv1d(512, 512, kernel_size=(1,), stride=(1,))\n", - " )\n", - " (cond_layers): ModuleList(\n", - " (0): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (1): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (2): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (3): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (4): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (5): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (6): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " (7): Conv1d(640, 1024, kernel_size=(1,), stride=(1,))\n", - " )\n", - " (start): Conv1d(2, 512, kernel_size=(1,), stride=(1,))\n", - " (end): Conv1d(512, 4, kernel_size=(1,), stride=(1,))\n", - " )\n", - " )\n", - " (convinv): ModuleList(\n", - " (0): Invertible1x1Conv(\n", - " (conv): Conv1d(8, 8, kernel_size=(1,), stride=(1,), bias=False)\n", - " )\n", - " (1): Invertible1x1Conv(\n", - " (conv): Conv1d(8, 8, kernel_size=(1,), stride=(1,), bias=False)\n", - " )\n", - " (2): Invertible1x1Conv(\n", - " (conv): Conv1d(8, 8, kernel_size=(1,), stride=(1,), bias=False)\n", - " )\n", - " (3): Invertible1x1Conv(\n", - " (conv): Conv1d(8, 8, kernel_size=(1,), stride=(1,), bias=False)\n", - " )\n", - " (4): Invertible1x1Conv(\n", - " (conv): Conv1d(6, 6, kernel_size=(1,), stride=(1,), bias=False)\n", - " )\n", - " (5): Invertible1x1Conv(\n", - " (conv): Conv1d(6, 6, kernel_size=(1,), stride=(1,), bias=False)\n", - " )\n", - " (6): Invertible1x1Conv(\n", - " (conv): 
Conv1d(6, 6, kernel_size=(1,), stride=(1,), bias=False)\n", - " )\n", - " (7): Invertible1x1Conv(\n", - " (conv): Conv1d(6, 6, kernel_size=(1,), stride=(1,), bias=False)\n", - " )\n", - " (8): Invertible1x1Conv(\n", - " (conv): Conv1d(4, 4, kernel_size=(1,), stride=(1,), bias=False)\n", - " )\n", - " (9): Invertible1x1Conv(\n", - " (conv): Conv1d(4, 4, kernel_size=(1,), stride=(1,), bias=False)\n", - " )\n", - " (10): Invertible1x1Conv(\n", - " (conv): Conv1d(4, 4, kernel_size=(1,), stride=(1,), bias=False)\n", - " )\n", - " (11): Invertible1x1Conv(\n", - " (conv): Conv1d(4, 4, kernel_size=(1,), stride=(1,), bias=False)\n", - " )\n", - " )\n", - ")" - ] - }, - "metadata": {}, - "execution_count": 50 - } - ] + "execution_count": null, + "outputs": [] }, { "cell_type": "markdown", "metadata": { - "id": "83WLbVnv7rRq" + "id": "9odRMQS3fISF" }, "source": [ - "Let's take a look at [Mail.ru group blog post on Computer Vision on habr.com](https://habr.com/ru/company/mailru/blog/467905/)" + "After obtaining this spectrogram, we can generate the audio with `waveglow` model." ] }, { "cell_type": "code", "metadata": { - "id": "m2eMzsMY7rRq" + "id": "BdFfCjmsUUxQ" }, "source": [ - "text = \"\"\"One of Mail.ru Cloud’s objectives is to provide the handiest means for accessing and searching your own photo and video archives. For this purpose, we at Mail.ru Computer Vision Team have created and implemented systems for smart image processing: search by object, by scene, by face, etc. Another spectacular technology is landmark recognition. Today, I am going to tell you how we made this a reality using Deep Learning.\n", - "\n", - "Imagine the situation: you return from your vacation with a load of photos. Talking to your friends, you are asked to show a picture of a place worth seeing, like palace, castle, pyramid, temple, lake, waterfall, mountain, and so on. You rush to scroll your gallery folder trying to find one that is really good. 
Most likely, it is lost amongst hundreds of images, and you say you will show it later.\n", + "from IPython.display import Audio\n", "\n", - "We solve this problem by grouping user photos in albums. This will let you find pictures you need just in few clicks. Now we have albums compiled by face, by object and by scene, and also by landmark.\n", + "sampling_rate = 22050\n", "\n", - "Photos with landmarks are essential because they often capture highlights of our lives (journeys, for example). These can be pictures with some architecture or wilderness in the background. This is why we seek to locate such images and make them readily available to users.\n", - "\"\"\"\n", + "with torch.no_grad():\n", + " audio = waveglow.infer(mel)\n", "\n", - "# source: https://habr.com/ru/company/mailru/blog/467905/" + "audio_numpy = audio[0].cpu().numpy()\n", + "Audio(audio_numpy, rate=sampling_rate)" ], - "execution_count": 51, + "execution_count": null, "outputs": [] }, { - "cell_type": "code", + "cell_type": "markdown", "metadata": { - "id": "zH2d6QX17rRq", - "outputId": "d2faf80b-be76-41a6-ca1b-4b4bcb2b217d", - "colab": { - "base_uri": "https://localhost:8080/" - } + "id": "W0mnDWpdhpdi" }, "source": [ - "print(wrapper.fill(text))" - ], - "execution_count": 52, - "outputs": [ - { - "output_type": "stream", - "name": "stdout", - "text": [ - "One of Mail.ru Cloud’s objectives is to provide the handiest means for accessing\n", - "and searching your own photo and video archives. For this purpose, we at Mail.ru\n", - "Computer Vision Team have created and implemented systems for smart image\n", - "processing: search by object, by scene, by face, etc. Another spectacular\n", - "technology is landmark recognition. Today, I am going to tell you how we made\n", - "this a reality using Deep Learning. Imagine the situation: you return from your\n", - "vacation with a load of photos. 
Talking to your friends, you are asked to show a\n", - "picture of a place worth seeing, like palace, castle, pyramid, temple, lake,\n", - "waterfall, mountain, and so on. You rush to scroll your gallery folder trying to\n", - "find one that is really good. Most likely, it is lost amongst hundreds of\n", - "images, and you say you will show it later. We solve this problem by grouping\n", - "user photos in albums. This will let you find pictures you need just in few\n", - "clicks. Now we have albums compiled by face, by object and by scene, and also by\n", - "landmark. Photos with landmarks are essential because they often capture\n", - "highlights of our lives (journeys, for example). These can be pictures with some\n", - "architecture or wilderness in the background. This is why we seek to locate such\n", - "images and make them readily available to users.\n" - ] - } + "We've generated a `.wav` format audio. We can save it using the `scipy.io.wavfile.write`." ] }, { "cell_type": "code", "metadata": { - "id": "4tkwZk-B7rRq", - "outputId": "d2d3e580-5089-4f7a-d3c9-38e9bf34333a", - "colab": { - "base_uri": "https://localhost:8080/" - } + "id": "rTMNu9Krh2cW" }, "source": [ - "question = \"How search is performed?\"\n", + "from scipy.io.wavfile import write\n", "\n", - "ans = answer_question(question, text)" + "write('audio.wav', sampling_rate, audio_numpy)" ], - "execution_count": 53, - "outputs": [ - { - "output_type": "stream", - "name": "stdout", - "text": [ - "Answer: \"search by object , by scene , by face\"\n" - ] - } - ] + "execution_count": null, + "outputs": [] }, { "cell_type": "markdown", "metadata": { - "id": "GBWNS3pE7rRr" + "id": "0pjEZy4TfT3w" }, "source": [ - "Let's simply use the pre-trained model to generate audio" + "This yields the following `text_to_speech` function." 
] }, { "cell_type": "code", "metadata": { - "colab": { - "base_uri": "https://localhost:8080/" - }, - "id": "2QQIZteNycoD", - "outputId": "ed77e2fc-6317-4a68-86fc-d388fcf103f1" + "id": "YEvDynkPVscj" }, "source": [ - "from IPython.display import Audio\n", - "utils = torch.hub.load('NVIDIA/DeepLearningExamples:torchhub', 'nvidia_tts_utils')\n", - "\n", - "def get_audio(phrase, rate=22050, audio_name='audio.wav'):\n", + "def text_to_speech(text):\n", " # preprocessing\n", + " sequences, lengths = utils.prepare_input_sequence([text])\n", "\n", - " sequences, lengths = utils.prepare_input_sequence([phrase])\n", " # run the models\n", " with torch.no_grad():\n", " mel, _, _ = tacotron2.infer(sequences, lengths)\n", " audio = waveglow.infer(mel)\n", - " audio_numpy = audio[0].data.cpu().numpy()\n", - " rate = rate\n", - " write(audio_name, rate, audio_numpy)\n", - " return Audio(audio_numpy, rate=rate)" + "\n", + " audio_numpy = audio[0].cpu().numpy()\n", + " return audio_numpy" ], - "execution_count": 74, - "outputs": [ - { - "output_type": "stream", - "name": "stderr", - "text": [ - "Using cache found in /root/.cache/torch/hub/NVIDIA_DeepLearningExamples_torchhub\n" - ] - } + "execution_count": null, + "outputs": [] + }, + { + "cell_type": "code", + "metadata": { + "id": "RwqwZoxsWNmq" + }, + "source": [ + "text = 'Another test text.'\n", + "audio_numpy = text_to_speech(text)\n", + "Audio(audio_numpy, rate=sampling_rate)" + ], + "execution_count": null, + "outputs": [] + }, + { + "cell_type": "markdown", + "metadata": { + "id": "gYittYwlfZfU" + }, + "source": [ + "### Tying text to speech with question answering." 
+ ] + }, + { + "cell_type": "markdown", + "metadata": { + "id": "83WLbVnv7rRq" + }, + "source": [ + "Let's take a look at [Mail.ru group blog post on Computer Vision on habr.com](https://habr.com/ru/company/mailru/blog/467905/)" ] }, { "cell_type": "code", "metadata": { - "id": "Bvo-0pR77rRr", - "outputId": "8228a6f3-98d4-4b09-ad7b-70b1d98bc904", - "colab": { - "base_uri": "https://localhost:8080/" - } + "id": "m2eMzsMY7rRq" }, "source": [ - "question = \"Why photos with landmarks are essential?\"\n", - "\n", - "ans = answer_question(question, text)" + "context = (\n", + " 'One of Mail.ru Cloud’s objectives is to provide the handiest means for accessing '\n", + " 'and searching your own photo and video archives. For this purpose, we at Mail.ru '\n", + " 'Computer Vision Team have created and implemented systems for smart image '\n", + " 'processing: search by object, by scene, by face, etc. Another spectacular '\n", + " 'technology is landmark recognition. Today, I am going to tell you how we made '\n", + " 'this a reality using Deep Learning.'\n", + " '\\n\\n'\n", + " 'Imagine the situation: you return from your vacation with a load of photos. Talking '\n", + " 'to your friends, you are asked to show a picture of a place worth seeing, like '\n", + " 'palace, castle, pyramid, temple, lake, waterfall, mountain, and so on. You rush to '\n", + " 'scroll your gallery folder trying to find one that is really good. Most likely, it '\n", + " 'is lost amongst hundreds of images, and you say you will show it later.'\n", + " '\\n\\n'\n", + " 'We solve this problem by grouping user photos in albums. This will let you find '\n", + " 'pictures you need just in few clicks. Now we have albums compiled by face, by '\n", + " 'object and by scene, and also by landmark.'\n", + " '\\n\\n'\n", + " 'Photos with landmarks are essential because they often capture highlights of our '\n", + " 'lives (journeys, for example). 
These can be pictures with some architecture or '\n", + " 'wilderness in the background. This is why we seek to locate such images and make '\n", + " 'them readily available to users.'\n", + ")" ], - "execution_count": 75, - "outputs": [ - { - "output_type": "stream", - "name": "stdout", - "text": [ - "Answer: \"because they often capture highlights of our lives\"\n" - ] - } + "execution_count": null, + "outputs": [] + }, + { + "cell_type": "code", + "metadata": { + "id": "4tkwZk-B7rRq" + }, + "source": [ + "question = 'Why photos with landmarks are essential?'\n", + "answer = answer_question(question, context)\n", + "print(f'Answer: \"{answer}\"')" + ], + "execution_count": null, + "outputs": [] + }, + { + "cell_type": "markdown", + "metadata": { + "id": "chBm8WdIh_Bc" + }, + "source": [ + "Let's cat question and answer into one phrase and convert it to audio!" ] }, { "cell_type": "code", "metadata": { - "id": "j9NhT0Np7rRr", - "outputId": "dce5129b-ec6e-4a6b-fe18-c126f6ba78ed", - "colab": { - "base_uri": "https://localhost:8080/", - "height": 73 - } + "id": "j9NhT0Np7rRr" }, "source": [ - "phrase = 'Your question is: {}\\n Answer is: {}'.format(question, ans)\n", - "get_audio(phrase)" + "text = f'{question}\\n{answer}'\n", + "audio_numpy = text_to_speech(text)\n", + "Audio(audio_numpy, rate=sampling_rate)" ], - "execution_count": 76, - "outputs": [ - { - "output_type": "execute_result", - "data": { - "text/html": [ - "\n", - " \n", - " " - ], - "text/plain": [ - "" - ] - }, - "metadata": {}, - "execution_count": 76 - } + "execution_count": null, + "outputs": [] + }, + { + "cell_type": "markdown", + "metadata": { + "id": "cFDgT4OuijIp" + }, + "source": [ + "And another one." 
] }, { @@ -3356,10 +1228,12 @@ }, "source": [ "question = \"Which places except mountain are worth seeing?\"\n", + "answer = answer_question(question, context)\n", + "print(f'Answer: \"{answer}\"')\n", "\n", - "ans = answer_question(question, text)\n", - "phrase = '{}\\n {}'.format(question, ans)\n", - "get_audio(phrase)" + "text = f'{question}\\n{answer}'\n", + "audio_numpy = text_to_speech(text)\n", + "Audio(audio_numpy, rate=sampling_rate)" ], "execution_count": null, "outputs": [] @@ -3385,33 +1259,12 @@ ] }, { - "cell_type": "code", + "cell_type": "markdown", "metadata": { - "id": "R-orfjjL7rRs", - "outputId": "5c6ff25c-a10d-4d93-c59f-bca7aee05f57", - "colab": { - "base_uri": "https://localhost:8080/" - } + "id": "_0uhvcBhj2k6" }, "source": [ - "!pip install -q torchaudio omegaconf\n" - ], - "execution_count": 61, - "outputs": [ - { - "output_type": "stream", - "name": "stdout", - "text": [ - "\u001b[K |████████████████████████████████| 1.9 MB 11.9 MB/s \n", - "\u001b[K |████████████████████████████████| 74 kB 3.1 MB/s \n", - "\u001b[K |████████████████████████████████| 831.4 MB 6.8 kB/s \n", - "\u001b[K |████████████████████████████████| 112 kB 51.2 MB/s \n", - "\u001b[?25h Building wheel for antlr4-python3-runtime (setup.py) ... \u001b[?25l\u001b[?25hdone\n", - "\u001b[31mERROR: pip's dependency resolver does not currently take into account all the packages that are installed. This behaviour is the source of the following dependency conflicts.\n", - "torchvision 0.10.0+cu111 requires torch==1.9.0, but you have torch 1.9.1 which is incompatible.\n", - "torchtext 0.10.0 requires torch==1.9.0, but you have torch 1.9.1 which is incompatible.\u001b[0m\n" - ] - } + "Of course, text to speech is not specific to english language. Here is how you can do it with russian." 
] }, { @@ -3420,192 +1273,82 @@ "id": "TD79JX0g7rRs" }, "source": [ - "import numpy as np\n", - "from scipy.io.wavfile import write\n", - "\n", - "import torch\n", - "from pprint import pprint\n", "from omegaconf import OmegaConf\n", - "from IPython.display import Audio, display" - ], - "execution_count": 62, - "outputs": [] - }, - { - "cell_type": "code", - "metadata": { - "id": "jnFrVq3l7rRs", - "outputId": "2adc2bf8-61e9-45ba-8548-f05bff5a08fb", - "colab": { - "base_uri": "https://localhost:8080/" - } - }, - "source": [ - "torch.hub.download_url_to_file('https://raw.githubusercontent.com/snakers4/silero-models/master/models.yml',\n", - " 'latest_silero_models.yml',\n", - " progress=False)\n", + "\n", + "torch.hub.download_url_to_file(\n", + " 'https://raw.githubusercontent.com/snakers4/silero-models/master/models.yml',\n", + " 'latest_silero_models.yml',\n", + " progress=False\n", + ")\n", "models = OmegaConf.load('latest_silero_models.yml')\n", "\n", "# see latest avaiable models\n", - "available_languages = list(models.tts_models.keys())\n", + "available_languages = list(models['tts_models'].keys())\n", "print(f'Available languages {available_languages}')\n", "\n", "for lang in available_languages:\n", - " speakers = list(models.tts_models.get(lang).keys())\n", + " speakers = list(models['tts_models'][lang].keys())\n", " print(f'Available speakers for {lang}: {speakers}')" ], - "execution_count": 63, - "outputs": [ - { - "output_type": "stream", - "name": "stdout", - "text": [ - "Available languages ['ru', 'en', 'de', 'es', 'fr', 'ba', 'xal', 'tt', 'uz', 'multi']\n", - "Available speakers for ru: ['aidar_v2', 'aidar_8khz', 'aidar_16khz', 'baya_v2', 'baya_8khz', 'baya_16khz', 'irina_v2', 'irina_8khz', 'irina_16khz', 'kseniya_v2', 'kseniya_8khz', 'kseniya_16khz', 'natasha_v2', 'natasha_8khz', 'natasha_16khz', 'ruslan_v2', 'ruslan_8khz', 'ruslan_16khz']\n", - "Available speakers for en: ['lj_v2', 'lj_8khz', 'lj_16khz']\n", - "Available speakers for de: 
['thorsten_v2', 'thorsten_8khz', 'thorsten_16khz']\n", - "Available speakers for es: ['tux_v2', 'tux_8khz', 'tux_16khz']\n", - "Available speakers for fr: ['gilles_v2', 'gilles_8khz', 'gilles_16khz']\n", - "Available speakers for ba: ['aigul_v2']\n", - "Available speakers for xal: ['erdni_v2']\n", - "Available speakers for tt: ['dilyara_v2']\n", - "Available speakers for uz: ['dilnavoz_v2']\n", - "Available speakers for multi: ['multi_v2']\n" - ] - } + "execution_count": null, + "outputs": [] + }, + { + "cell_type": "markdown", + "metadata": { + "id": "ZVaR1xG8k94K" + }, + "source": [ + "Let's choose our language and speaker and try using them!" ] }, { "cell_type": "code", "metadata": { - "id": "zKCT72on7rRt", - "outputId": "2022cf35-c757-4d78-e134-10b64ebe6e39", - "colab": { - "base_uri": "https://localhost:8080/", - "height": 140, - "referenced_widgets": [ - "019b4f79cede42e89bdf3b2f5047a3bf", - "934f348be42346bca1e374cec6f7acac", - "14686b543b9349119fc7cec9c0f60963", - "bc8fb4da9de84df6ab7605b2b7d2d32f", - "f25f21412946491ab11381dbe23cccd1", - "0fedb09e3c9d4a6eb47d08e4bc013e54", - "ad07800df53e4feba295d0202e17bba9", - "87c33c91fc584bfbbfe6ea9a61e8b1b2", - "ad8a0ff477c94faa9a9d3ed4ca8fddf3", - "7b11de7d759d490791097ef1019848f3", - "ad6595b0760144d8899f6a2e1d41ed24" - ] - } + "id": "zKCT72on7rRt" }, "source": [ "language = 'ru'\n", "speaker = 'kseniya_16khz'\n", "device = torch.device('cpu')\n", - "model, symbols, sample_rate, example_text, apply_tts = torch.hub.load(repo_or_dir='snakers4/silero-models',\n", - " model='silero_tts',\n", - " language=language,\n", - " speaker=speaker)\n", - "model = model.to(device) # gpu or cpu\n", + "model, symbols, sample_rate, example_text, apply_tts = torch.hub.load(\n", + " 'snakers4/silero-models', 'silero_tts',\n", + " language=language, speaker=speaker\n", + ")\n", + "model = model.to(device)\n", "\n", "\n", - "audio = apply_tts(texts=[example_text],\n", - " model=model,\n", - " sample_rate=sample_rate,\n", - " 
symbols=symbols,\n", - " device=device)\n", + "audio = apply_tts(\n", + " texts=[example_text],\n", + " model=model,\n", + " sample_rate=sample_rate,\n", + " symbols=symbols,\n", + " device=device\n", + ")\n", "\n", "print(example_text)\n", - "display(Audio(audio[0], rate=sample_rate))" + "Audio(audio[0], rate=sample_rate)" ], - "execution_count": 64, - "outputs": [ - { - "output_type": "stream", - "name": "stderr", - "text": [ - "Downloading: \"https://github.com/snakers4/silero-models/archive/master.zip\" to /root/.cache/torch/hub/master.zip\n" - ] - }, - { - "output_type": "display_data", - "data": { - "application/vnd.jupyter.widget-view+json": { - "model_id": "019b4f79cede42e89bdf3b2f5047a3bf", - "version_minor": 0, - "version_major": 2 - }, - "text/plain": [ - " 0%| | 0.00/136M [00:00\n", - " \n", - " Your browser does not support the audio element.\n", - " \n", - " " - ], - "text/plain": [ - "" - ] - }, - "metadata": {} - } - ] + "execution_count": null, + "outputs": [] }, { "cell_type": "code", "metadata": { - "id": "U0O3eCX87rRt", - "outputId": "4cac2c8d-0d52-47f7-c0f8-46d9cae7b82b", - "colab": { - "base_uri": "https://localhost:8080/", - "height": 73 - } + "id": "U0O3eCX87rRt" }, "source": [ - "audio = apply_tts(texts=[\"Дерзайте знать! Спасибо за внимание!\"],\n", - " model=model,\n", - " sample_rate=sample_rate,\n", - " symbols=symbols,\n", - " device=device)\n", - "\n", - "display(Audio(audio[0], rate=sample_rate))" + "audio = apply_tts(\n", + " texts=[\"Дерзайте знать! Спасибо за внимание!\"],\n", + " model=model,\n", + " sample_rate=sample_rate,\n", + " symbols=symbols,\n", + " device=device\n", + ")\n", + "Audio(audio[0], rate=sample_rate)" ], - "execution_count": 65, - "outputs": [ - { - "output_type": "display_data", - "data": { - "text/html": [ - "\n", - " \n", - " " - ], - "text/plain": [ - "" - ] - }, - "metadata": {} - } - ] + "execution_count": null, + "outputs": [] }, { "cell_type": "code",