From c12f51fbec6741267941dda9d903d6c556f05d9d Mon Sep 17 00:00:00 2001 From: BMO <68750272+mohamedsolaiman@users.noreply.github.com> Date: Fri, 2 May 2025 02:05:15 +0300 Subject: [PATCH] Created using Colab --- DiffRhythm_gradio_jupyter.ipynb | 545 ++++++++++++++++++++++++++++++++ 1 file changed, 545 insertions(+) create mode 100644 DiffRhythm_gradio_jupyter.ipynb diff --git a/DiffRhythm_gradio_jupyter.ipynb b/DiffRhythm_gradio_jupyter.ipynb new file mode 100644 index 0000000..92877ed --- /dev/null +++ b/DiffRhythm_gradio_jupyter.ipynb @@ -0,0 +1,545 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "metadata": { + "id": "view-in-github", + "colab_type": "text" + }, + "source": [ + "\"Open" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": { + "id": "VjYy0F2gZIPR", + "outputId": "ef0cd9c1-67a4-4de7-a7d6-b53983df6edb", + "colab": { + "base_uri": "https://localhost:8080/" + } + }, + "outputs": [ + { + "output_type": "stream", + "name": "stdout", + "text": [ + "/content\n", + "Cloning into 'DiffRhythm-hf'...\n", + "remote: Enumerating objects: 297, done.\u001b[K\n", + "remote: Counting objects: 100% (297/297), done.\u001b[K\n", + "remote: Compressing objects: 100% (169/169), done.\u001b[K\n", + "remote: Total 297 (delta 129), reused 290 (delta 125), pack-reused 0 (from 0)\u001b[K\n", + "Receiving objects: 100% (297/297), 12.54 MiB | 16.19 MiB/s, done.\n", + "Resolving deltas: 100% (129/129), done.\n", + "Downloading diffrhythm/g2p/sources/chinese_lexicon.txt (15 MB)\n", + "Error downloading object: diffrhythm/g2p/sources/chinese_lexicon.txt (a3a7685): Smudge error: Error downloading diffrhythm/g2p/sources/chinese_lexicon.txt (a3a7685d1c3e68eb2fa304bfc63e90c90c3c1a1948839a5b1b507b2131b3e2fb): [a3a7685d1c3e68eb2fa304bfc63e90c90c3c1a1948839a5b1b507b2131b3e2fb] Object does not exist on the server: [404] Object does not exist on the server\n", + "\n", + "Errors logged to /content/DiffRhythm-hf/.git/lfs/logs/20250501T230059.191257575.log\n", + "Use `git lfs logs last` to view the log.\n", + "error: external filter 'git-lfs filter-process' failed\n", + "fatal: diffrhythm/g2p/sources/chinese_lexicon.txt: smudge filter lfs failed\n", + "warning: Clone succeeded, but checkout failed.\n", + "You can inspect what was checked out with 'git status'\n", + "and retry with 'git restore --source=HEAD :/'\n", + "\n", + "Reading package lists... Done\n", + "Building dependency tree... Done\n", + "Reading state information... Done\n", + "The following additional packages will be installed:\n", + " espeak-ng-data libespeak-ng1 libpcaudio0 libsonic0\n", + "The following NEW packages will be installed:\n", + " espeak-ng espeak-ng-data libespeak-ng1 libpcaudio0 libsonic0\n", + "0 upgraded, 5 newly installed, 0 to remove and 34 not upgraded.\n", + "Need to get 4,526 kB of archives.\n", + "After this operation, 11.9 MB of additional disk space will be used.\n", + "Get:1 http://archive.ubuntu.com/ubuntu jammy/main amd64 libpcaudio0 amd64 1.1-6build2 [8,956 B]\n", + "Get:2 http://archive.ubuntu.com/ubuntu jammy/main amd64 libsonic0 amd64 0.2.0-11build1 [10.3 kB]\n", + "Get:3 http://archive.ubuntu.com/ubuntu jammy-updates/main amd64 espeak-ng-data amd64 1.50+dfsg-10ubuntu0.1 [3,956 kB]\n", + "Get:4 http://archive.ubuntu.com/ubuntu jammy-updates/main amd64 libespeak-ng1 amd64 1.50+dfsg-10ubuntu0.1 [207 kB]\n", + "Get:5 http://archive.ubuntu.com/ubuntu jammy-updates/universe amd64 espeak-ng amd64 1.50+dfsg-10ubuntu0.1 [343 kB]\n", + "Fetched 4,526 kB in 2s (2,903 kB/s)\n", + "Selecting previously unselected package libpcaudio0:amd64.\n", + "(Reading database ... 126101 files and directories currently installed.)\n", + "Preparing to unpack .../libpcaudio0_1.1-6build2_amd64.deb ...\n", + "Unpacking libpcaudio0:amd64 (1.1-6build2) ...\n", + "Selecting previously unselected package libsonic0:amd64.\n", + "Preparing to unpack .../libsonic0_0.2.0-11build1_amd64.deb ...\n", + "Unpacking libsonic0:amd64 (0.2.0-11build1) ...\n", + "Selecting previously unselected package espeak-ng-data:amd64.\n", + "Preparing to unpack .../espeak-ng-data_1.50+dfsg-10ubuntu0.1_amd64.deb ...\n", + "Unpacking espeak-ng-data:amd64 (1.50+dfsg-10ubuntu0.1) ...\n", + "Selecting previously unselected package libespeak-ng1:amd64.\n", + "Preparing to unpack .../libespeak-ng1_1.50+dfsg-10ubuntu0.1_amd64.deb ...\n", + "Unpacking libespeak-ng1:amd64 (1.50+dfsg-10ubuntu0.1) ...\n", + "Selecting previously unselected package espeak-ng.\n", + "Preparing to unpack .../espeak-ng_1.50+dfsg-10ubuntu0.1_amd64.deb ...\n", + "Unpacking espeak-ng (1.50+dfsg-10ubuntu0.1) ...\n", + "Setting up libpcaudio0:amd64 (1.1-6build2) ...\n", + "Setting up libsonic0:amd64 (0.2.0-11build1) ...\n", + "Setting up espeak-ng-data:amd64 (1.50+dfsg-10ubuntu0.1) ...\n", + "Setting up libespeak-ng1:amd64 (1.50+dfsg-10ubuntu0.1) ...\n", + "Setting up espeak-ng (1.50+dfsg-10ubuntu0.1) ...\n", + "Processing triggers for man-db (2.10.2-1) ...\n", + "Processing triggers for libc-bin (2.35-0ubuntu3.8) ...\n", + "/sbin/ldconfig.real: /usr/local/lib/libtbb.so.12 is not a symbolic link\n", + "\n", + "/sbin/ldconfig.real: /usr/local/lib/libhwloc.so.15 is not a symbolic link\n", + "\n", + "/sbin/ldconfig.real: /usr/local/lib/libur_adapter_level_zero.so.0 is not a symbolic link\n", + "\n", + "/sbin/ldconfig.real: /usr/local/lib/libtbbbind_2_0.so.3 is not a symbolic link\n", + "\n", + "/sbin/ldconfig.real: /usr/local/lib/libtbbbind_2_5.so.3 is not a symbolic link\n", + "\n", + "/sbin/ldconfig.real: /usr/local/lib/libtcm.so.1 is not a symbolic link\n", + "\n", + "/sbin/ldconfig.real: /usr/local/lib/libtcm_debug.so.1 is not a symbolic link\n", + "\n", + "/sbin/ldconfig.real: /usr/local/lib/libtbbmalloc.so.2 is not a symbolic link\n", + "\n", + "/sbin/ldconfig.real: /usr/local/lib/libur_adapter_opencl.so.0 is not a symbolic link\n", + "\n", + "/sbin/ldconfig.real: /usr/local/lib/libumf.so.0 is not a symbolic link\n", + "\n", + "/sbin/ldconfig.real: /usr/local/lib/libtbbmalloc_proxy.so.2 is not a symbolic link\n", + "\n", + "/sbin/ldconfig.real: /usr/local/lib/libur_loader.so.0 is not a symbolic link\n", + "\n", + "/sbin/ldconfig.real: /usr/local/lib/libtbbbind.so.3 is not a symbolic link\n", + "\n", + "Collecting numpy==2.0\n", + " Downloading numpy-2.0.0-cp311-cp311-manylinux_2_17_x86_64.manylinux2014_x86_64.whl.metadata (60 kB)\n", + "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m60.9/60.9 kB\u001b[0m \u001b[31m2.4 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", + "\u001b[?25hCollecting gradio\n", + " Downloading gradio-5.28.0-py3-none-any.whl.metadata (16 kB)\n", + "Collecting muq\n", + " Downloading muq-0.1.0.tar.gz (55 kB)\n", + "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m55.8/55.8 kB\u001b[0m \u001b[31m5.1 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", + "\u001b[?25h Preparing metadata (setup.py) ... \u001b[?25l\u001b[?25hdone\n", + "Collecting mutagen\n", + " Downloading mutagen-1.47.0-py3-none-any.whl.metadata (1.7 kB)\n", + "Collecting torchdiffeq\n", + " Downloading torchdiffeq-0.2.5-py3-none-any.whl.metadata (440 bytes)\n", + "Collecting x-transformers\n", + " Downloading x_transformers-2.3.1-py3-none-any.whl.metadata (88 kB)\n", + "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m88.7/88.7 kB\u001b[0m \u001b[31m8.8 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", + "\u001b[?25hCollecting pyopenjtalk\n", + " Downloading pyopenjtalk-0.4.1.tar.gz (1.4 MB)\n", + "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m1.4/1.4 MB\u001b[0m \u001b[31m50.8 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", + "\u001b[?25h Installing build dependencies ... \u001b[?25l\u001b[?25hdone\n", + " Getting requirements to build wheel ... \u001b[?25l\u001b[?25hdone\n", + " Preparing metadata (pyproject.toml) ... \u001b[?25l\u001b[?25hdone\n", + "Collecting pykakasi\n", + " Downloading pykakasi-2.3.0-py3-none-any.whl.metadata (5.9 kB)\n", + "Collecting cn2an\n", + " Downloading cn2an-0.5.23-py3-none-any.whl.metadata (10 kB)\n", + "Collecting pypinyin\n", + " Downloading pypinyin-0.54.0-py2.py3-none-any.whl.metadata (12 kB)\n", + "Collecting onnxruntime\n", + " Downloading onnxruntime-1.21.1-cp311-cp311-manylinux_2_27_x86_64.manylinux_2_28_x86_64.whl.metadata (4.5 kB)\n", + "Collecting unidecode\n", + " Downloading Unidecode-1.4.0-py3-none-any.whl.metadata (13 kB)\n", + "Collecting phonemizer\n", + " Downloading phonemizer-3.3.0-py3-none-any.whl.metadata (48 kB)\n", + "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m48.2/48.2 kB\u001b[0m \u001b[31m5.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", + "\u001b[?25hCollecting LangSegment\n", + " Downloading langsegment-0.2.0-py3-none-any.whl.metadata (1.1 kB)\n", + "Collecting aiofiles<25.0,>=22.0 (from gradio)\n", + " Downloading aiofiles-24.1.0-py3-none-any.whl.metadata (10 kB)\n", + "Requirement already satisfied: anyio<5.0,>=3.0 in /usr/local/lib/python3.11/dist-packages (from gradio) (4.9.0)\n", + "Collecting fastapi<1.0,>=0.115.2 (from gradio)\n", + " Downloading fastapi-0.115.12-py3-none-any.whl.metadata (27 kB)\n", + "Collecting ffmpy (from gradio)\n", + " Downloading ffmpy-0.5.0-py3-none-any.whl.metadata (3.0 kB)\n", + "Collecting gradio-client==1.10.0 (from gradio)\n", + " Downloading gradio_client-1.10.0-py3-none-any.whl.metadata (7.1 kB)\n", + "Collecting groovy~=0.1 (from gradio)\n", + " Downloading groovy-0.1.2-py3-none-any.whl.metadata (6.1 kB)\n", + "Requirement already satisfied: httpx>=0.24.1 in /usr/local/lib/python3.11/dist-packages (from gradio) (0.28.1)\n", + "Requirement already satisfied: huggingface-hub>=0.28.1 in /usr/local/lib/python3.11/dist-packages (from gradio) (0.30.2)\n", + "Requirement already satisfied: jinja2<4.0 in /usr/local/lib/python3.11/dist-packages (from gradio) (3.1.6)\n", + "Requirement already satisfied: markupsafe<4.0,>=2.0 in /usr/local/lib/python3.11/dist-packages (from gradio) (3.0.2)\n", + "Requirement already satisfied: orjson~=3.0 in /usr/local/lib/python3.11/dist-packages (from gradio) (3.10.17)\n", + "Requirement already satisfied: packaging in /usr/local/lib/python3.11/dist-packages (from gradio) (24.2)\n", + "Requirement already satisfied: pandas<3.0,>=1.0 in /usr/local/lib/python3.11/dist-packages (from gradio) (2.2.2)\n", + "Requirement already satisfied: pillow<12.0,>=8.0 in /usr/local/lib/python3.11/dist-packages (from gradio) (11.2.1)\n", + "Requirement already satisfied: pydantic<2.12,>=2.0 in /usr/local/lib/python3.11/dist-packages (from gradio) (2.11.3)\n", + "Collecting pydub (from gradio)\n", + " Downloading pydub-0.25.1-py2.py3-none-any.whl.metadata (1.4 kB)\n", + "Collecting python-multipart>=0.0.18 (from gradio)\n", + " Downloading python_multipart-0.0.20-py3-none-any.whl.metadata (1.8 kB)\n", + "Requirement already satisfied: pyyaml<7.0,>=5.0 in /usr/local/lib/python3.11/dist-packages (from gradio) (6.0.2)\n", + "Collecting ruff>=0.9.3 (from gradio)\n", + " Downloading ruff-0.11.8-py3-none-manylinux_2_17_x86_64.manylinux2014_x86_64.whl.metadata (25 kB)\n", + "Collecting safehttpx<0.2.0,>=0.1.6 (from gradio)\n", + " Downloading safehttpx-0.1.6-py3-none-any.whl.metadata (4.2 kB)\n", + "Collecting semantic-version~=2.0 (from gradio)\n", + " Downloading semantic_version-2.10.0-py2.py3-none-any.whl.metadata (9.7 kB)\n", + "Collecting starlette<1.0,>=0.40.0 (from gradio)\n", + " Downloading starlette-0.46.2-py3-none-any.whl.metadata (6.2 kB)\n", + "Collecting tomlkit<0.14.0,>=0.12.0 (from gradio)\n", + " Downloading tomlkit-0.13.2-py3-none-any.whl.metadata (2.7 kB)\n", + "Requirement already satisfied: typer<1.0,>=0.12 in /usr/local/lib/python3.11/dist-packages (from gradio) (0.15.3)\n", + "Requirement already satisfied: typing-extensions~=4.0 in /usr/local/lib/python3.11/dist-packages (from gradio) (4.13.2)\n", + "Collecting uvicorn>=0.14.0 (from gradio)\n", + " Downloading uvicorn-0.34.2-py3-none-any.whl.metadata (6.5 kB)\n", + "Requirement already satisfied: fsspec in /usr/local/lib/python3.11/dist-packages (from gradio-client==1.10.0->gradio) (2025.3.2)\n", + "Requirement already satisfied: websockets<16.0,>=10.0 in /usr/local/lib/python3.11/dist-packages (from gradio-client==1.10.0->gradio) (15.0.1)\n", + "Requirement already satisfied: einops in /usr/local/lib/python3.11/dist-packages (from muq) (0.8.1)\n", + "Requirement already satisfied: librosa in /usr/local/lib/python3.11/dist-packages (from muq) (0.11.0)\n", + "Collecting nnAudio (from muq)\n", + " Downloading nnAudio-0.3.3-py3-none-any.whl.metadata (771 bytes)\n", + "Requirement already satisfied: soundfile in /usr/local/lib/python3.11/dist-packages (from muq) (0.13.1)\n", + "Requirement already satisfied: torch in /usr/local/lib/python3.11/dist-packages (from muq) (2.6.0+cu124)\n", + "Requirement already satisfied: torchaudio in /usr/local/lib/python3.11/dist-packages (from muq) (2.6.0+cu124)\n", + "Requirement already satisfied: tqdm in /usr/local/lib/python3.11/dist-packages (from muq) (4.67.1)\n", + "Requirement already satisfied: transformers in /usr/local/lib/python3.11/dist-packages (from muq) (4.51.3)\n", + "Requirement already satisfied: easydict in /usr/local/lib/python3.11/dist-packages (from muq) (1.13)\n", + "Collecting x_clip (from muq)\n", + " Downloading x_clip-0.14.4-py3-none-any.whl.metadata (724 bytes)\n", + "Requirement already satisfied: scipy>=1.4.0 in /usr/local/lib/python3.11/dist-packages (from torchdiffeq) (1.15.2)\n", + "Collecting einx>=0.3.0 (from x-transformers)\n", + " Downloading einx-0.3.0-py3-none-any.whl.metadata (6.9 kB)\n", + "Collecting loguru (from x-transformers)\n", + " Downloading loguru-0.7.3-py3-none-any.whl.metadata (22 kB)\n", + "Collecting jaconv (from pykakasi)\n", + " Downloading jaconv-0.4.0.tar.gz (17 kB)\n", + " Preparing metadata (setup.py) ... \u001b[?25l\u001b[?25hdone\n", + "Requirement already satisfied: deprecated in /usr/local/lib/python3.11/dist-packages (from pykakasi) (1.2.18)\n", + "Collecting proces>=0.1.7 (from cn2an)\n", + " Downloading proces-0.1.7-py3-none-any.whl.metadata (3.3 kB)\n", + "Collecting coloredlogs (from onnxruntime)\n", + " Downloading coloredlogs-15.0.1-py2.py3-none-any.whl.metadata (12 kB)\n", + "Requirement already satisfied: flatbuffers in /usr/local/lib/python3.11/dist-packages (from onnxruntime) (25.2.10)\n", + "Requirement already satisfied: protobuf in /usr/local/lib/python3.11/dist-packages (from onnxruntime) (5.29.4)\n", + "Requirement already satisfied: sympy in /usr/local/lib/python3.11/dist-packages (from onnxruntime) (1.13.1)\n", + "Requirement already satisfied: joblib in /usr/local/lib/python3.11/dist-packages (from phonemizer) (1.4.2)\n", + "Collecting segments (from phonemizer)\n", + " Downloading segments-2.3.0-py2.py3-none-any.whl.metadata (3.5 kB)\n", + "Requirement already satisfied: attrs>=18.1 in /usr/local/lib/python3.11/dist-packages (from phonemizer) (25.3.0)\n", + "Collecting dlinfo (from phonemizer)\n", + " Downloading dlinfo-2.0.0-py3-none-any.whl.metadata (1.1 kB)\n", + "Collecting py3langid>=0.2.2 (from LangSegment)\n", + " Downloading py3langid-0.3.0-py3-none-any.whl.metadata (13 kB)\n", + "Requirement already satisfied: idna>=2.8 in /usr/local/lib/python3.11/dist-packages (from anyio<5.0,>=3.0->gradio) (3.10)\n", + "Requirement already satisfied: sniffio>=1.1 in /usr/local/lib/python3.11/dist-packages (from anyio<5.0,>=3.0->gradio) (1.3.1)\n", + "Requirement already satisfied: frozendict in /usr/local/lib/python3.11/dist-packages (from einx>=0.3.0->x-transformers) (2.4.6)\n", + "Requirement already satisfied: certifi in /usr/local/lib/python3.11/dist-packages (from httpx>=0.24.1->gradio) (2025.4.26)\n", + "Requirement already satisfied: httpcore==1.* in /usr/local/lib/python3.11/dist-packages (from httpx>=0.24.1->gradio) (1.0.9)\n", + "Requirement already satisfied: h11>=0.16 in /usr/local/lib/python3.11/dist-packages (from httpcore==1.*->httpx>=0.24.1->gradio) (0.16.0)\n", + "Requirement already satisfied: filelock in /usr/local/lib/python3.11/dist-packages (from huggingface-hub>=0.28.1->gradio) (3.18.0)\n", + "Requirement already satisfied: requests in /usr/local/lib/python3.11/dist-packages (from huggingface-hub>=0.28.1->gradio) (2.32.3)\n", + "Requirement already satisfied: python-dateutil>=2.8.2 in /usr/local/lib/python3.11/dist-packages (from pandas<3.0,>=1.0->gradio) (2.9.0.post0)\n", + "Requirement already satisfied: pytz>=2020.1 in /usr/local/lib/python3.11/dist-packages (from pandas<3.0,>=1.0->gradio) (2025.2)\n", + "Requirement already satisfied: tzdata>=2022.7 in /usr/local/lib/python3.11/dist-packages (from pandas<3.0,>=1.0->gradio) (2025.2)\n", + "Requirement already satisfied: annotated-types>=0.6.0 in /usr/local/lib/python3.11/dist-packages (from pydantic<2.12,>=2.0->gradio) (0.7.0)\n", + "Requirement already satisfied: pydantic-core==2.33.1 in /usr/local/lib/python3.11/dist-packages (from pydantic<2.12,>=2.0->gradio) (2.33.1)\n", + "Requirement already satisfied: typing-inspection>=0.4.0 in /usr/local/lib/python3.11/dist-packages (from pydantic<2.12,>=2.0->gradio) (0.4.0)\n", + "Requirement already satisfied: networkx in /usr/local/lib/python3.11/dist-packages (from torch->muq) (3.4.2)\n", + "Collecting nvidia-cuda-nvrtc-cu12==12.4.127 (from torch->muq)\n", + " Downloading nvidia_cuda_nvrtc_cu12-12.4.127-py3-none-manylinux2014_x86_64.whl.metadata (1.5 kB)\n", + "Collecting nvidia-cuda-runtime-cu12==12.4.127 (from torch->muq)\n", + " Downloading nvidia_cuda_runtime_cu12-12.4.127-py3-none-manylinux2014_x86_64.whl.metadata (1.5 kB)\n", + "Collecting nvidia-cuda-cupti-cu12==12.4.127 (from torch->muq)\n", + " Downloading nvidia_cuda_cupti_cu12-12.4.127-py3-none-manylinux2014_x86_64.whl.metadata (1.6 kB)\n", + "Collecting nvidia-cudnn-cu12==9.1.0.70 (from torch->muq)\n", + " Downloading nvidia_cudnn_cu12-9.1.0.70-py3-none-manylinux2014_x86_64.whl.metadata (1.6 kB)\n", + "Collecting nvidia-cublas-cu12==12.4.5.8 (from torch->muq)\n", + " Downloading nvidia_cublas_cu12-12.4.5.8-py3-none-manylinux2014_x86_64.whl.metadata (1.5 kB)\n", + "Collecting nvidia-cufft-cu12==11.2.1.3 (from torch->muq)\n", + " Downloading nvidia_cufft_cu12-11.2.1.3-py3-none-manylinux2014_x86_64.whl.metadata (1.5 kB)\n", + "Collecting nvidia-curand-cu12==10.3.5.147 (from torch->muq)\n", + " Downloading nvidia_curand_cu12-10.3.5.147-py3-none-manylinux2014_x86_64.whl.metadata (1.5 kB)\n", + "Collecting nvidia-cusolver-cu12==11.6.1.9 (from torch->muq)\n", + " Downloading nvidia_cusolver_cu12-11.6.1.9-py3-none-manylinux2014_x86_64.whl.metadata (1.6 kB)\n", + "Collecting nvidia-cusparse-cu12==12.3.1.170 (from torch->muq)\n", + " Downloading nvidia_cusparse_cu12-12.3.1.170-py3-none-manylinux2014_x86_64.whl.metadata (1.6 kB)\n", + "Requirement already satisfied: nvidia-cusparselt-cu12==0.6.2 in /usr/local/lib/python3.11/dist-packages (from torch->muq) (0.6.2)\n", + "Requirement already satisfied: nvidia-nccl-cu12==2.21.5 in /usr/local/lib/python3.11/dist-packages (from torch->muq) (2.21.5)\n", + "Requirement already satisfied: nvidia-nvtx-cu12==12.4.127 in /usr/local/lib/python3.11/dist-packages (from torch->muq) (12.4.127)\n", + "Collecting nvidia-nvjitlink-cu12==12.4.127 (from torch->muq)\n", + " Downloading nvidia_nvjitlink_cu12-12.4.127-py3-none-manylinux2014_x86_64.whl.metadata (1.5 kB)\n", + "Requirement already satisfied: triton==3.2.0 in /usr/local/lib/python3.11/dist-packages (from torch->muq) (3.2.0)\n", + "Requirement already satisfied: mpmath<1.4,>=1.1.0 in /usr/local/lib/python3.11/dist-packages (from sympy->onnxruntime) (1.3.0)\n", + "Requirement already satisfied: click>=8.0.0 in /usr/local/lib/python3.11/dist-packages (from typer<1.0,>=0.12->gradio) (8.1.8)\n", + "Requirement already satisfied: shellingham>=1.3.0 in /usr/local/lib/python3.11/dist-packages (from typer<1.0,>=0.12->gradio) (1.5.4)\n", + "Requirement already satisfied: rich>=10.11.0 in /usr/local/lib/python3.11/dist-packages (from typer<1.0,>=0.12->gradio) (13.9.4)\n", + "Collecting humanfriendly>=9.1 (from coloredlogs->onnxruntime)\n", + " Downloading humanfriendly-10.0-py2.py3-none-any.whl.metadata (9.2 kB)\n", + "Requirement already satisfied: wrapt<2,>=1.10 in /usr/local/lib/python3.11/dist-packages (from deprecated->pykakasi) (1.17.2)\n", + "Requirement already satisfied: audioread>=2.1.9 in /usr/local/lib/python3.11/dist-packages (from librosa->muq) (3.0.1)\n", + "Requirement already satisfied: numba>=0.51.0 in /usr/local/lib/python3.11/dist-packages (from librosa->muq) (0.60.0)\n", + "Requirement already satisfied: scikit-learn>=1.1.0 in /usr/local/lib/python3.11/dist-packages (from librosa->muq) (1.6.1)\n", + "Requirement already satisfied: decorator>=4.3.0 in /usr/local/lib/python3.11/dist-packages (from librosa->muq) (4.4.2)\n", + "Requirement already satisfied: pooch>=1.1 in /usr/local/lib/python3.11/dist-packages (from librosa->muq) (1.8.2)\n", + "Requirement already satisfied: soxr>=0.3.2 in /usr/local/lib/python3.11/dist-packages (from librosa->muq) (0.5.0.post1)\n", + "Requirement already satisfied: lazy_loader>=0.1 in /usr/local/lib/python3.11/dist-packages (from librosa->muq) (0.4)\n", + "Requirement already satisfied: msgpack>=1.0 in /usr/local/lib/python3.11/dist-packages (from librosa->muq) (1.1.0)\n", + "Requirement already satisfied: cffi>=1.0 in /usr/local/lib/python3.11/dist-packages (from soundfile->muq) (1.17.1)\n", + "Requirement already satisfied: regex in /usr/local/lib/python3.11/dist-packages (from segments->phonemizer) (2024.11.6)\n", + "Collecting csvw>=1.5.6 (from segments->phonemizer)\n", + " Downloading csvw-3.5.1-py2.py3-none-any.whl.metadata (10 kB)\n", + "Requirement already satisfied: tokenizers<0.22,>=0.21 in /usr/local/lib/python3.11/dist-packages (from transformers->muq) (0.21.1)\n", + "Requirement already satisfied: safetensors>=0.4.3 in /usr/local/lib/python3.11/dist-packages (from transformers->muq) (0.5.3)\n", + "Collecting beartype (from x_clip->muq)\n", + " Downloading beartype-0.20.2-py3-none-any.whl.metadata (33 kB)\n", + "Collecting ftfy (from x_clip->muq)\n", + " Downloading ftfy-6.3.1-py3-none-any.whl.metadata (7.3 kB)\n", + "Requirement already satisfied: torchvision in /usr/local/lib/python3.11/dist-packages (from x_clip->muq) (0.21.0+cu124)\n", + "Requirement already satisfied: pycparser in /usr/local/lib/python3.11/dist-packages (from cffi>=1.0->soundfile->muq) (2.22)\n", + "Collecting isodate (from csvw>=1.5.6->segments->phonemizer)\n", + " Downloading isodate-0.7.2-py3-none-any.whl.metadata (11 kB)\n", + "Collecting rfc3986<2 (from csvw>=1.5.6->segments->phonemizer)\n", + " Downloading rfc3986-1.5.0-py2.py3-none-any.whl.metadata (6.5 kB)\n", + "Requirement already satisfied: uritemplate>=3.0.0 in /usr/local/lib/python3.11/dist-packages (from csvw>=1.5.6->segments->phonemizer) (4.1.1)\n", + "Requirement already satisfied: babel in /usr/local/lib/python3.11/dist-packages (from csvw>=1.5.6->segments->phonemizer) (2.17.0)\n", + "Collecting language-tags (from csvw>=1.5.6->segments->phonemizer)\n", + " Downloading language_tags-1.2.0-py3-none-any.whl.metadata (2.1 kB)\n", + "Collecting rdflib (from csvw>=1.5.6->segments->phonemizer)\n", + " Downloading rdflib-7.1.4-py3-none-any.whl.metadata (11 kB)\n", + "Collecting colorama (from csvw>=1.5.6->segments->phonemizer)\n", + " Downloading colorama-0.4.6-py2.py3-none-any.whl.metadata (17 kB)\n", + "Requirement already satisfied: jsonschema in /usr/local/lib/python3.11/dist-packages (from csvw>=1.5.6->segments->phonemizer) (4.23.0)\n", + "Requirement already satisfied: llvmlite<0.44,>=0.43.0dev0 in /usr/local/lib/python3.11/dist-packages (from numba>=0.51.0->librosa->muq) (0.43.0)\n", + "Requirement already satisfied: platformdirs>=2.5.0 in /usr/local/lib/python3.11/dist-packages (from pooch>=1.1->librosa->muq) (4.3.7)\n", + "Requirement already satisfied: six>=1.5 in /usr/local/lib/python3.11/dist-packages (from python-dateutil>=2.8.2->pandas<3.0,>=1.0->gradio) (1.17.0)\n", + "Requirement already satisfied: charset-normalizer<4,>=2 in /usr/local/lib/python3.11/dist-packages (from requests->huggingface-hub>=0.28.1->gradio) (3.4.1)\n", + "Requirement already satisfied: urllib3<3,>=1.21.1 in /usr/local/lib/python3.11/dist-packages (from requests->huggingface-hub>=0.28.1->gradio) (2.4.0)\n", + "Requirement already satisfied: markdown-it-py>=2.2.0 in /usr/local/lib/python3.11/dist-packages (from rich>=10.11.0->typer<1.0,>=0.12->gradio) (3.0.0)\n", + "Requirement already satisfied: pygments<3.0.0,>=2.13.0 in /usr/local/lib/python3.11/dist-packages (from rich>=10.11.0->typer<1.0,>=0.12->gradio) (2.19.1)\n", + "Requirement already satisfied: threadpoolctl>=3.1.0 in /usr/local/lib/python3.11/dist-packages (from scikit-learn>=1.1.0->librosa->muq) (3.6.0)\n", + "Requirement already satisfied: wcwidth in /usr/local/lib/python3.11/dist-packages (from ftfy->x_clip->muq) (0.2.13)\n", + "Requirement already satisfied: mdurl~=0.1 in /usr/local/lib/python3.11/dist-packages (from markdown-it-py>=2.2.0->rich>=10.11.0->typer<1.0,>=0.12->gradio) (0.1.2)\n", + "Requirement already satisfied: jsonschema-specifications>=2023.03.6 in /usr/local/lib/python3.11/dist-packages (from jsonschema->csvw>=1.5.6->segments->phonemizer) (2025.4.1)\n", + "Requirement already satisfied: referencing>=0.28.4 in /usr/local/lib/python3.11/dist-packages (from jsonschema->csvw>=1.5.6->segments->phonemizer) (0.36.2)\n", + "Requirement already satisfied: rpds-py>=0.7.1 in /usr/local/lib/python3.11/dist-packages (from jsonschema->csvw>=1.5.6->segments->phonemizer) (0.24.0)\n", + "Requirement already satisfied: pyparsing<4,>=2.1.0 in /usr/local/lib/python3.11/dist-packages (from rdflib->csvw>=1.5.6->segments->phonemizer) (3.2.3)\n", + "Downloading numpy-2.0.0-cp311-cp311-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (19.3 MB)\n", + "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m19.3/19.3 MB\u001b[0m \u001b[31m116.5 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", + "\u001b[?25hDownloading gradio-5.28.0-py3-none-any.whl (54.1 MB)\n", + "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m54.1/54.1 MB\u001b[0m \u001b[31m20.5 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", + "\u001b[?25hDownloading gradio_client-1.10.0-py3-none-any.whl (322 kB)\n", + "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m322.9/322.9 kB\u001b[0m \u001b[31m31.3 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", + "\u001b[?25hDownloading mutagen-1.47.0-py3-none-any.whl (194 kB)\n", + "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m194.4/194.4 kB\u001b[0m \u001b[31m21.8 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", + "\u001b[?25hDownloading torchdiffeq-0.2.5-py3-none-any.whl (32 kB)\n", + "Downloading x_transformers-2.3.1-py3-none-any.whl (83 kB)\n", + "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m83.2/83.2 kB\u001b[0m \u001b[31m8.3 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", + "\u001b[?25hDownloading pykakasi-2.3.0-py3-none-any.whl (2.4 MB)\n", + "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m2.4/2.4 MB\u001b[0m \u001b[31m97.6 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", + "\u001b[?25hDownloading cn2an-0.5.23-py3-none-any.whl (224 kB)\n", + "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m224.9/224.9 kB\u001b[0m \u001b[31m26.4 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", + "\u001b[?25hDownloading pypinyin-0.54.0-py2.py3-none-any.whl (837 kB)\n", + "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m837.0/837.0 kB\u001b[0m \u001b[31m55.4 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", + "\u001b[?25hDownloading onnxruntime-1.21.1-cp311-cp311-manylinux_2_27_x86_64.manylinux_2_28_x86_64.whl (16.0 MB)\n", + "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m16.0/16.0 MB\u001b[0m \u001b[31m119.3 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", + "\u001b[?25hDownloading Unidecode-1.4.0-py3-none-any.whl (235 kB)\n", + "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m235.8/235.8 kB\u001b[0m \u001b[31m24.8 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", + "\u001b[?25hDownloading phonemizer-3.3.0-py3-none-any.whl (103 kB)\n", + "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m103.8/103.8 kB\u001b[0m \u001b[31m11.8 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", + "\u001b[?25hDownloading langsegment-0.2.0-py3-none-any.whl (5.9 kB)\n", + "Downloading aiofiles-24.1.0-py3-none-any.whl (15 kB)\n", + "Downloading einx-0.3.0-py3-none-any.whl (102 kB)\n", + "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m103.0/103.0 kB\u001b[0m \u001b[31m13.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", + "\u001b[?25hDownloading fastapi-0.115.12-py3-none-any.whl (95 kB)\n", + "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m95.2/95.2 kB\u001b[0m \u001b[31m10.7 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", + "\u001b[?25hDownloading groovy-0.1.2-py3-none-any.whl (14 kB)\n", + "Downloading proces-0.1.7-py3-none-any.whl (137 kB)\n", + "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m137.7/137.7 kB\u001b[0m \u001b[31m15.5 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", + "\u001b[?25hDownloading py3langid-0.3.0-py3-none-any.whl (746 kB)\n", + "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m746.1/746.1 kB\u001b[0m \u001b[31m56.5 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", + "\u001b[?25hDownloading python_multipart-0.0.20-py3-none-any.whl (24 kB)\n", + "Downloading ruff-0.11.8-py3-none-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (11.5 MB)\n", + "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m11.5/11.5 MB\u001b[0m \u001b[31m126.5 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", + "\u001b[?25hDownloading safehttpx-0.1.6-py3-none-any.whl (8.7 kB)\n", + "Downloading semantic_version-2.10.0-py2.py3-none-any.whl (15 kB)\n", + "Downloading starlette-0.46.2-py3-none-any.whl (72 kB)\n", + "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m72.0/72.0 kB\u001b[0m \u001b[31m8.7 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", + "\u001b[?25hDownloading tomlkit-0.13.2-py3-none-any.whl (37 kB)\n", + "Downloading nvidia_cublas_cu12-12.4.5.8-py3-none-manylinux2014_x86_64.whl (363.4 MB)\n", + "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m363.4/363.4 MB\u001b[0m \u001b[31m4.0 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", + "\u001b[?25hDownloading nvidia_cuda_cupti_cu12-12.4.127-py3-none-manylinux2014_x86_64.whl (13.8 MB)\n", + "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m13.8/13.8 MB\u001b[0m \u001b[31m110.4 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", + "\u001b[?25hDownloading nvidia_cuda_nvrtc_cu12-12.4.127-py3-none-manylinux2014_x86_64.whl (24.6 MB)\n", + "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m24.6/24.6 MB\u001b[0m \u001b[31m98.1 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", + "\u001b[?25hDownloading nvidia_cuda_runtime_cu12-12.4.127-py3-none-manylinux2014_x86_64.whl (883 kB)\n", + "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m883.7/883.7 kB\u001b[0m \u001b[31m50.4 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", + "\u001b[?25hDownloading nvidia_cudnn_cu12-9.1.0.70-py3-none-manylinux2014_x86_64.whl (664.8 MB)\n", + "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m664.8/664.8 MB\u001b[0m \u001b[31m3.0 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", + "\u001b[?25hDownloading nvidia_cufft_cu12-11.2.1.3-py3-none-manylinux2014_x86_64.whl (211.5 MB)\n", + "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m211.5/211.5 MB\u001b[0m \u001b[31m5.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", + "\u001b[?25hDownloading nvidia_curand_cu12-10.3.5.147-py3-none-manylinux2014_x86_64.whl (56.3 MB)\n", + "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m56.3/56.3 MB\u001b[0m \u001b[31m11.7 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", + "\u001b[?25hDownloading nvidia_cusolver_cu12-11.6.1.9-py3-none-manylinux2014_x86_64.whl (127.9 MB)\n", + "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m127.9/127.9 MB\u001b[0m \u001b[31m7.5 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", + "\u001b[?25hDownloading nvidia_cusparse_cu12-12.3.1.170-py3-none-manylinux2014_x86_64.whl (207.5 MB)\n", + "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m207.5/207.5 MB\u001b[0m \u001b[31m5.6 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", + "\u001b[?25hDownloading nvidia_nvjitlink_cu12-12.4.127-py3-none-manylinux2014_x86_64.whl (21.1 MB)\n", + "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m21.1/21.1 MB\u001b[0m \u001b[31m101.9 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", + "\u001b[?25hDownloading uvicorn-0.34.2-py3-none-any.whl (62 kB)\n", + "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m62.5/62.5 kB\u001b[0m \u001b[31m7.0 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", + "\u001b[?25hDownloading coloredlogs-15.0.1-py2.py3-none-any.whl (46 kB)\n", + "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m46.0/46.0 kB\u001b[0m \u001b[31m4.9 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", + "\u001b[?25hDownloading dlinfo-2.0.0-py3-none-any.whl (3.7 kB)\n", + "Downloading ffmpy-0.5.0-py3-none-any.whl (6.0 kB)\n", + "Downloading loguru-0.7.3-py3-none-any.whl (61 kB)\n", + "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m61.6/61.6 kB\u001b[0m \u001b[31m7.3 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", + "\u001b[?25hDownloading nnAudio-0.3.3-py3-none-any.whl (43 kB)\n", + "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m43.6/43.6 kB\u001b[0m \u001b[31m4.7 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", + "\u001b[?25hDownloading pydub-0.25.1-py2.py3-none-any.whl (32 kB)\n", + "Downloading segments-2.3.0-py2.py3-none-any.whl (15 kB)\n", + "Downloading x_clip-0.14.4-py3-none-any.whl (1.4 MB)\n", + "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m1.4/1.4 MB\u001b[0m \u001b[31m74.3 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", + "\u001b[?25hDownloading csvw-3.5.1-py2.py3-none-any.whl (59 kB)\n", + "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m59.9/59.9 kB\u001b[0m \u001b[31m6.6 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", + "\u001b[?25hDownloading humanfriendly-10.0-py2.py3-none-any.whl (86 kB)\n", + "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m86.8/86.8 kB\u001b[0m \u001b[31m10.1 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", + "\u001b[?25hDownloading beartype-0.20.2-py3-none-any.whl (1.2 MB)\n", + "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m1.2/1.2 MB\u001b[0m \u001b[31m80.1 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", + "\u001b[?25hDownloading ftfy-6.3.1-py3-none-any.whl (44 kB)\n", + "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m44.8/44.8 kB\u001b[0m \u001b[31m4.9 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", + "\u001b[?25hDownloading rfc3986-1.5.0-py2.py3-none-any.whl (31 kB)\n", + "Downloading colorama-0.4.6-py2.py3-none-any.whl (25 kB)\n", + "Downloading isodate-0.7.2-py3-none-any.whl (22 kB)\n", + "Downloading language_tags-1.2.0-py3-none-any.whl (213 kB)\n", + "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m213.4/213.4 kB\u001b[0m \u001b[31m22.5 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", + "\u001b[?25hDownloading rdflib-7.1.4-py3-none-any.whl (565 kB)\n", + "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m565.1/565.1 kB\u001b[0m \u001b[31m51.7 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n", + "\u001b[?25hBuilding wheels for collected packages: muq, pyopenjtalk, jaconv\n", + " Building wheel for muq (setup.py) ... \u001b[?25l\u001b[?25hdone\n", + " Created wheel for muq: filename=muq-0.1.0-py3-none-any.whl size=60109 sha256=fadbd01a6ecaef712e4ba0e01dcca41935c820ba2dd99ec13e49abc4626bea34\n", + " Stored in directory: /root/.cache/pip/wheels/5b/2a/5b/5f5cec7c5bc1016af62bbc82f0b28e597fdbbc8aab32f1e874\n", + " Building wheel for pyopenjtalk (pyproject.toml) ... \u001b[?25l\u001b[?25hdone\n", + " Created wheel for pyopenjtalk: filename=pyopenjtalk-0.4.1-cp311-cp311-linux_x86_64.whl size=5767104 sha256=6b43f75189ad1fdd75eb4e3818ada14bdbb9b04bc995560694aa80b8bcf47627\n", + " Stored in directory: /root/.cache/pip/wheels/1e/c0/4f/d17fa12db5fee142d7455b1af3c5ad45b751e038a2e926fb41\n", + " Building wheel for jaconv (setup.py) ... \u001b[?25l\u001b[?25hdone\n", + " Created wheel for jaconv: filename=jaconv-0.4.0-py3-none-any.whl size=18228 sha256=15b7470b1ef2f482e940ce50e03003bec2f1068e41f3049ff8fdd1c74317ed6e\n", + " Stored in directory: /root/.cache/pip/wheels/1c/63/71/95fb322fe9047ed7e61b007c47cbf03d23ecb77dd03665f151\n", + "Successfully built muq pyopenjtalk jaconv\n", + "Installing collected packages: rfc3986, pydub, language-tags, jaconv, uvicorn, unidecode, tomlkit, semantic-version, ruff, rdflib, python-multipart, pypinyin, proces, nvidia-nvjitlink-cu12, nvidia-curand-cu12, nvidia-cufft-cu12, nvidia-cuda-runtime-cu12, nvidia-cuda-nvrtc-cu12, nvidia-cuda-cupti-cu12, nvidia-cublas-cu12, numpy, mutagen, loguru, isodate, humanfriendly, groovy, ftfy, ffmpy, dlinfo, colorama, beartype, aiofiles, starlette, pyopenjtalk, pykakasi, py3langid, nvidia-cusparse-cu12, nvidia-cudnn-cu12, einx, coloredlogs, cn2an, safehttpx, onnxruntime, nvidia-cusolver-cu12, LangSegment, gradio-client, fastapi, gradio, csvw, x-transformers, torchdiffeq, segments, nnAudio, x_clip, phonemizer, muq\n", + " Attempting uninstall: nvidia-nvjitlink-cu12\n", + " Found existing installation: nvidia-nvjitlink-cu12 12.5.82\n", + " Uninstalling nvidia-nvjitlink-cu12-12.5.82:\n", + " Successfully uninstalled nvidia-nvjitlink-cu12-12.5.82\n", + " Attempting uninstall: nvidia-curand-cu12\n", + " Found existing installation: nvidia-curand-cu12 10.3.6.82\n", + " Uninstalling nvidia-curand-cu12-10.3.6.82:\n", + " Successfully uninstalled nvidia-curand-cu12-10.3.6.82\n", + " Attempting uninstall: nvidia-cufft-cu12\n", + " Found existing installation: nvidia-cufft-cu12 11.2.3.61\n", + " Uninstalling nvidia-cufft-cu12-11.2.3.61:\n", + " Successfully uninstalled nvidia-cufft-cu12-11.2.3.61\n", + " Attempting uninstall: nvidia-cuda-runtime-cu12\n", + " Found existing installation: nvidia-cuda-runtime-cu12 12.5.82\n", + " Uninstalling nvidia-cuda-runtime-cu12-12.5.82:\n", + " Successfully uninstalled nvidia-cuda-runtime-cu12-12.5.82\n", + " Attempting uninstall: nvidia-cuda-nvrtc-cu12\n", + " Found existing installation: nvidia-cuda-nvrtc-cu12 12.5.82\n", + " Uninstalling nvidia-cuda-nvrtc-cu12-12.5.82:\n", + " Successfully uninstalled nvidia-cuda-nvrtc-cu12-12.5.82\n", + " Attempting uninstall: nvidia-cuda-cupti-cu12\n", + " Found existing installation: nvidia-cuda-cupti-cu12 12.5.82\n", + " Uninstalling nvidia-cuda-cupti-cu12-12.5.82:\n", + " Successfully uninstalled nvidia-cuda-cupti-cu12-12.5.82\n", + " Attempting uninstall: nvidia-cublas-cu12\n", + " Found existing installation: nvidia-cublas-cu12 12.5.3.2\n", + " Uninstalling nvidia-cublas-cu12-12.5.3.2:\n", + " Successfully uninstalled nvidia-cublas-cu12-12.5.3.2\n", + " Attempting uninstall: numpy\n", + " Found existing installation: numpy 2.0.2\n", + " Uninstalling numpy-2.0.2:\n", + " Successfully uninstalled numpy-2.0.2\n", + " Attempting uninstall: nvidia-cusparse-cu12\n", + " Found existing installation: nvidia-cusparse-cu12 12.5.1.3\n", + " Uninstalling nvidia-cusparse-cu12-12.5.1.3:\n", + " Successfully uninstalled nvidia-cusparse-cu12-12.5.1.3\n", + " Attempting uninstall: nvidia-cudnn-cu12\n", + " Found existing installation: nvidia-cudnn-cu12 9.3.0.75\n", + " Uninstalling nvidia-cudnn-cu12-9.3.0.75:\n", + " Successfully uninstalled nvidia-cudnn-cu12-9.3.0.75\n", + " Attempting uninstall: nvidia-cusolver-cu12\n", + " Found existing installation: nvidia-cusolver-cu12 11.6.3.83\n", + " Uninstalling nvidia-cusolver-cu12-11.6.3.83:\n", + " Successfully uninstalled nvidia-cusolver-cu12-11.6.3.83\n", + "Successfully installed LangSegment-0.2.0 aiofiles-24.1.0 beartype-0.20.2 cn2an-0.5.23 colorama-0.4.6 coloredlogs-15.0.1 csvw-3.5.1 dlinfo-2.0.0 einx-0.3.0 fastapi-0.115.12 ffmpy-0.5.0 ftfy-6.3.1 gradio-5.28.0 gradio-client-1.10.0 groovy-0.1.2 humanfriendly-10.0 isodate-0.7.2 jaconv-0.4.0 language-tags-1.2.0 loguru-0.7.3 muq-0.1.0 mutagen-1.47.0 nnAudio-0.3.3 numpy-2.0.0 nvidia-cublas-cu12-12.4.5.8 nvidia-cuda-cupti-cu12-12.4.127 nvidia-cuda-nvrtc-cu12-12.4.127 nvidia-cuda-runtime-cu12-12.4.127 nvidia-cudnn-cu12-9.1.0.70 nvidia-cufft-cu12-11.2.1.3 nvidia-curand-cu12-10.3.5.147 nvidia-cusolver-cu12-11.6.1.9 nvidia-cusparse-cu12-12.3.1.170 nvidia-nvjitlink-cu12-12.4.127 onnxruntime-1.21.1 phonemizer-3.3.0 proces-0.1.7 py3langid-0.3.0 pydub-0.25.1 pykakasi-2.3.0 pyopenjtalk-0.4.1 pypinyin-0.54.0 python-multipart-0.0.20 rdflib-7.1.4 rfc3986-1.5.0 ruff-0.11.8 safehttpx-0.1.6 segments-2.3.0 semantic-version-2.10.0 starlette-0.46.2 tomlkit-0.13.2 torchdiffeq-0.2.5 unidecode-1.4.0 uvicorn-0.34.2 x-transformers-2.3.1 x_clip-0.14.4\n", + "/content/DiffRhythm-hf/diffrhythm/g2p/sources/g2p_chinese_model\n", + "--2025-05-01 23:04:18-- https://huggingface.co/spaces/ASLP-lab/DiffRhythm/resolve/main/diffrhythm/g2p/sources/g2p_chinese_model/poly_bert_model.onnx\n", + "Resolving huggingface.co (huggingface.co)... 108.138.246.85, 108.138.246.79, 108.138.246.71, ...\n", + "Connecting to huggingface.co (huggingface.co)|108.138.246.85|:443... connected.\n", + "HTTP request sent, awaiting response... 302 Found\n", + "Location: https://cdn-lfs-us-1.hf.co/repos/37/b4/37b407b8ae2187727ad0422f857c6963abd45187c60a6986807a6186835b66ca/8765d835ffdf9811c832d4dc7b6a552757aa8615c01d1184db716a50c20aebbc?response-content-disposition=inline%3B+filename*%3DUTF-8%27%27poly_bert_model.onnx%3B+filename%3D%22poly_bert_model.onnx%22%3B&Expires=1746144258&Policy=eyJTdGF0ZW1lbnQiOlt7IkNvbmRpdGlvbiI6eyJEYXRlTGVzc1RoYW4iOnsiQVdTOkVwb2NoVGltZSI6MTc0NjE0NDI1OH19LCJSZXNvdXJjZSI6Imh0dHBzOi8vY2RuLWxmcy11cy0xLmhmLmNvL3JlcG9zLzM3L2I0LzM3YjQwN2I4YWUyMTg3NzI3YWQwNDIyZjg1N2M2OTYzYWJkNDUxODdjNjBhNjk4NjgwN2E2MTg2ODM1YjY2Y2EvODc2NWQ4MzVmZmRmOTgxMWM4MzJkNGRjN2I2YTU1Mjc1N2FhODYxNWMwMWQxMTg0ZGI3MTZhNTBjMjBhZWJiYz9yZXNwb25zZS1jb250ZW50LWRpc3Bvc2l0aW9uPSoifV19&Signature=ntzfYElDwihWHvlMBIhAUi1Ao%7E8%7E76livViTuy%7EXkDeEq7T-vj1TsbmfWnXVO8bCQuMIm8JmvJBFb05cj9Bo4a1GqpzlB47PDpta2i7DFaELmDR-lfRCcl3KonpxW%7EMFNbcsMOkigzBYMotCa-aQRa49k2zqk9H7XJFU%7EwFdWVGSBSsd5QZVpo1hPvTtrMFY6MG5vr0hjSKALS4K%7E8shohSKUTWaDq%7E31p6sjQeWZOMTsc00DniPGi1T0ej0a0nh6VMRfOMPDr8ipZ6ogQjfH8OjJaGlZlsMUOcNy7tyLn-o6gGzO6UezeC4pJR9YgWDeN0cl%7EnmqYtI7aglOOQvEA__&Key-Pair-Id=K24J24Z295AEI9 [following]\n", + "--2025-05-01 23:04:18-- https://cdn-lfs-us-1.hf.co/repos/37/b4/37b407b8ae2187727ad0422f857c6963abd45187c60a6986807a6186835b66ca/8765d835ffdf9811c832d4dc7b6a552757aa8615c01d1184db716a50c20aebbc?response-content-disposition=inline%3B+filename*%3DUTF-8%27%27poly_bert_model.onnx%3B+filename%3D%22poly_bert_model.onnx%22%3B&Expires=1746144258&Policy=eyJTdGF0ZW1lbnQiOlt7IkNvbmRpdGlvbiI6eyJEYXRlTGVzc1RoYW4iOnsiQVdTOkVwb2NoVGltZSI6MTc0NjE0NDI1OH19LCJSZXNvdXJjZSI6Imh0dHBzOi8vY2RuLWxmcy11cy0xLmhmLmNvL3JlcG9zLzM3L2I0LzM3YjQwN2I4YWUyMTg3NzI3YWQwNDIyZjg1N2M2OTYzYWJkNDUxODdjNjBhNjk4NjgwN2E2MTg2ODM1YjY2Y2EvODc2NWQ4MzVmZmRmOTgxMWM4MzJkNGRjN2I2YTU1Mjc1N2FhODYxNWMwMWQxMTg0ZGI3MTZhNTBjMjBhZWJiYz9yZXNwb25zZS1jb250ZW50LWRpc3Bvc2l0aW9uPSoifV19&Signature=ntzfYElDwihWHvlMBIhAUi1Ao%7E8%7E76livViTuy%7EXkDeEq7T-vj1TsbmfWnXVO8bCQuMIm8JmvJBFb05cj9Bo4a1GqpzlB47PDpta2i7DFaELmDR-lfRCcl3KonpxW%7EMFNbcsMOkigzBYMotCa-aQRa49k2zqk9H7XJFU%7EwFdWVGSBSsd5QZVpo1hPvTtrMFY6MG5vr0hjSKALS4K%7E8shohSKUTWaDq%7E31p6sjQeWZOMTsc00DniPGi1T0ej0a0nh6VMRfOMPDr8ipZ6ogQjfH8OjJaGlZlsMUOcNy7tyLn-o6gGzO6UezeC4pJR9YgWDeN0cl%7EnmqYtI7aglOOQvEA__&Key-Pair-Id=K24J24Z295AEI9\n", + "Resolving cdn-lfs-us-1.hf.co (cdn-lfs-us-1.hf.co)... 18.155.192.108, 18.155.192.121, 18.155.192.93, ...\n", + "Connecting to cdn-lfs-us-1.hf.co (cdn-lfs-us-1.hf.co)|18.155.192.108|:443... connected.\n", + "HTTP request sent, awaiting response... 200 OK\n", + "Length: 76583333 (73M) [binary/octet-stream]\n", + "Saving to: ‘poly_bert_model.onnx’\n", + "\n", + "poly_bert_model.onn 100%[===================>] 73.04M 99.1MB/s in 0.7s \n", + "\n", + "2025-05-01 23:04:19 (99.1 MB/s) - ‘poly_bert_model.onnx’ saved [76583333/76583333]\n", + "\n", + "/content/DiffRhythm-hf/src\n", + "--2025-05-01 23:04:19-- https://huggingface.co/spaces/ASLP-lab/DiffRhythm/resolve/main/src/negative_prompt.npy\n", + "Resolving huggingface.co (huggingface.co)... 108.138.246.79, 108.138.246.71, 108.138.246.85, ...\n", + "Connecting to huggingface.co (huggingface.co)|108.138.246.79|:443... connected.\n", + "HTTP request sent, awaiting response... 302 Found\n", + "Location: https://cdn-lfs-us-1.hf.co/repos/37/b4/37b407b8ae2187727ad0422f857c6963abd45187c60a6986807a6186835b66ca/6cb7d74eb7a8eda12acb8247b21d373928301db8a8cb0db480d341799fed3ce5?response-content-disposition=inline%3B+filename*%3DUTF-8%27%27negative_prompt.npy%3B+filename%3D%22negative_prompt.npy%22%3B&Expires=1746144259&Policy=eyJTdGF0ZW1lbnQiOlt7IkNvbmRpdGlvbiI6eyJEYXRlTGVzc1RoYW4iOnsiQVdTOkVwb2NoVGltZSI6MTc0NjE0NDI1OX19LCJSZXNvdXJjZSI6Imh0dHBzOi8vY2RuLWxmcy11cy0xLmhmLmNvL3JlcG9zLzM3L2I0LzM3YjQwN2I4YWUyMTg3NzI3YWQwNDIyZjg1N2M2OTYzYWJkNDUxODdjNjBhNjk4NjgwN2E2MTg2ODM1YjY2Y2EvNmNiN2Q3NGViN2E4ZWRhMTJhY2I4MjQ3YjIxZDM3MzkyODMwMWRiOGE4Y2IwZGI0ODBkMzQxNzk5ZmVkM2NlNT9yZXNwb25zZS1jb250ZW50LWRpc3Bvc2l0aW9uPSoifV19&Signature=GIn6Y3ANrUIfvpRTEbXeWIRL8JLV7WglVttgKugFF9obn1IkIyTbQ1kUcezN16Uw0hZtt1JrWMKjY2SlgO3WsA4nMBCKqFf1MZcs6uZ75-6kfb7g3w4K55XByJMDHT3BuV4bx6dRGPYa8FP0mLl54Ua5Z%7EF6KnwpRkhW6qyaxfl0f1Veo7AHOCIJ5DEChZrUcAlHYjX7jQC82NxSZ2pVoLnvljpqeMKS4yO02MBKwttEbklSD5LZ0lKTvCgGNqwslLq5wQTwSw3ZM6dlY%7Ee5DM5GJO9%7EhBK5EtsBB9dAVUwlCGHhc-kgUtLfAxH5riXL2LhTHkIMgij3IxCAQy5ENw__&Key-Pair-Id=K24J24Z295AEI9 [following]\n", + "--2025-05-01 23:04:19-- https://cdn-lfs-us-1.hf.co/repos/37/b4/37b407b8ae2187727ad0422f857c6963abd45187c60a6986807a6186835b66ca/6cb7d74eb7a8eda12acb8247b21d373928301db8a8cb0db480d341799fed3ce5?response-content-disposition=inline%3B+filename*%3DUTF-8%27%27negative_prompt.npy%3B+filename%3D%22negative_prompt.npy%22%3B&Expires=1746144259&Policy=eyJTdGF0ZW1lbnQiOlt7IkNvbmRpdGlvbiI6eyJEYXRlTGVzc1RoYW4iOnsiQVdTOkVwb2NoVGltZSI6MTc0NjE0NDI1OX19LCJSZXNvdXJjZSI6Imh0dHBzOi8vY2RuLWxmcy11cy0xLmhmLmNvL3JlcG9zLzM3L2I0LzM3YjQwN2I4YWUyMTg3NzI3YWQwNDIyZjg1N2M2OTYzYWJkNDUxODdjNjBhNjk4NjgwN2E2MTg2ODM1YjY2Y2EvNmNiN2Q3NGViN2E4ZWRhMTJhY2I4MjQ3YjIxZDM3MzkyODMwMWRiOGE4Y2IwZGI0ODBkMzQxNzk5ZmVkM2NlNT9yZXNwb25zZS1jb250ZW50LWRpc3Bvc2l0aW9uPSoifV19&Signature=GIn6Y3ANrUIfvpRTEbXeWIRL8JLV7WglVttgKugFF9obn1IkIyTbQ1kUcezN16Uw0hZtt1JrWMKjY2SlgO3WsA4nMBCKqFf1MZcs6uZ75-6kfb7g3w4K55XByJMDHT3BuV4bx6dRGPYa8FP0mLl54Ua5Z%7EF6KnwpRkhW6qyaxfl0f1Veo7AHOCIJ5DEChZrUcAlHYjX7jQC82NxSZ2pVoLnvljpqeMKS4yO02MBKwttEbklSD5LZ0lKTvCgGNqwslLq5wQTwSw3ZM6dlY%7Ee5DM5GJO9%7EhBK5EtsBB9dAVUwlCGHhc-kgUtLfAxH5riXL2LhTHkIMgij3IxCAQy5ENw__&Key-Pair-Id=K24J24Z295AEI9\n", + "Resolving cdn-lfs-us-1.hf.co (cdn-lfs-us-1.hf.co)... 18.173.121.3, 18.173.121.32, 18.173.121.63, ...\n", + "Connecting to cdn-lfs-us-1.hf.co (cdn-lfs-us-1.hf.co)|18.173.121.3|:443... connected.\n", + "HTTP request sent, awaiting response... 200 OK\n", + "Length: 2176 (2.1K) [binary/octet-stream]\n", + "Saving to: ‘negative_prompt.npy’\n", + "\n", + "negative_prompt.npy 100%[===================>] 2.12K --.-KB/s in 0s \n", + "\n", + "2025-05-01 23:04:19 (1.16 GB/s) - ‘negative_prompt.npy’ saved [2176/2176]\n", + "\n", + "/content/DiffRhythm-hf\n", + "2025-05-01 23:04:38.694335: E external/local_xla/xla/stream_executor/cuda/cuda_fft.cc:477] Unable to register cuFFT factory: Attempting to register factory for plugin cuFFT when one has already been registered\n", + "WARNING: All log messages before absl::InitializeLog() is called are written to STDERR\n", + "E0000 00:00:1746140678.914141 3153 cuda_dnn.cc:8310] Unable to register cuDNN factory: Attempting to register factory for plugin cuDNN when one has already been registered\n", + "E0000 00:00:1746140678.974799 3153 cuda_blas.cc:1418] Unable to register cuBLAS factory: Attempting to register factory for plugin cuBLAS when one has already been registered\n", + "2025-05-01 23:04:39.465085: I tensorflow/core/platform/cpu_feature_guard.cc:210] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n", + "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n", + "cfm_model.pt: 100% 2.22G/2.22G [00:17<00:00, 126MB/s]\n" + ] + } + ], + "source": [ + "%cd /content\n", + "!git clone -b dev https://github.com/camenduru/DiffRhythm-hf\n", + "!apt install espeak-ng\n", + "!pip install numpy==2.0 gradio muq mutagen torchdiffeq x-transformers pyopenjtalk pykakasi cn2an pypinyin onnxruntime unidecode phonemizer LangSegment\n", + "\n", + "%cd /content/DiffRhythm-hf/diffrhythm/g2p/sources/g2p_chinese_model\n", + "!wget https://huggingface.co/spaces/ASLP-lab/DiffRhythm/resolve/main/diffrhythm/g2p/sources/g2p_chinese_model/poly_bert_model.onnx\n", + "%cd /content/DiffRhythm-hf/src\n", + "!wget https://huggingface.co/spaces/ASLP-lab/DiffRhythm/resolve/main/src/negative_prompt.npy\n", + "%cd /content/DiffRhythm-hf\n", + "\n", + "!python app.py" + ] + } + ], + "metadata": { + "accelerator": "GPU", + "colab": { + "gpuType": "T4", + "provenance": [], + "include_colab_link": true + }, + "kernelspec": { + "display_name": "Python 3", + "name": "python3" + }, + "language_info": { + "name": "python" + } + }, + "nbformat": 4, + "nbformat_minor": 0 +} \ No newline at end of file