deunaDm committed on
Commit
12ac5fa
·
verified ·
1 Parent(s): abb615b

Upload 9 files

Browse files
Files changed (9) hide show
  1. .gitignore +173 -0
  2. .gitmodules +3 -0
  3. .pre-commit-config.yaml +14 -0
  4. Dockerfile +24 -0
  5. LICENSE +21 -0
  6. README.md +153 -0
  7. Spanish_F5.ipynb +433 -0
  8. pyproject.toml +62 -0
  9. ruff.toml +10 -0
.gitignore ADDED
@@ -0,0 +1,173 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Custom
2
+ .vscode/
3
+ tests/
4
+ runs/
5
+ data/
6
+ ckpts/
7
+ wandb/
8
+ results/
9
+
10
+
11
+
12
+ # Byte-compiled / optimized / DLL files
13
+ __pycache__/
14
+ *.py[cod]
15
+ *$py.class
16
+
17
+ # C extensions
18
+ *.so
19
+
20
+ # Distribution / packaging
21
+ .Python
22
+ build/
23
+ develop-eggs/
24
+ dist/
25
+ downloads/
26
+ eggs/
27
+ .eggs/
28
+ lib/
29
+ lib64/
30
+ parts/
31
+ sdist/
32
+ var/
33
+ wheels/
34
+ share/python-wheels/
35
+ *.egg-info/
36
+ .installed.cfg
37
+ *.egg
38
+ MANIFEST
39
+
40
+ # PyInstaller
41
+ # Usually these files are written by a python script from a template
42
+ # before PyInstaller builds the exe, so as to inject date/other infos into it.
43
+ *.manifest
44
+ *.spec
45
+
46
+ # Installer logs
47
+ pip-log.txt
48
+ pip-delete-this-directory.txt
49
+
50
+ # Unit test / coverage reports
51
+ htmlcov/
52
+ .tox/
53
+ .nox/
54
+ .coverage
55
+ .coverage.*
56
+ .cache
57
+ nosetests.xml
58
+ coverage.xml
59
+ *.cover
60
+ *.py,cover
61
+ .hypothesis/
62
+ .pytest_cache/
63
+ cover/
64
+
65
+ # Translations
66
+ *.mo
67
+ *.pot
68
+
69
+ # Django stuff:
70
+ *.log
71
+ local_settings.py
72
+ db.sqlite3
73
+ db.sqlite3-journal
74
+
75
+ # Flask stuff:
76
+ instance/
77
+ .webassets-cache
78
+
79
+ # Scrapy stuff:
80
+ .scrapy
81
+
82
+ # Sphinx documentation
83
+ docs/_build/
84
+
85
+ # PyBuilder
86
+ .pybuilder/
87
+ target/
88
+
89
+ # Jupyter Notebook
90
+ .ipynb_checkpoints
91
+
92
+ # IPython
93
+ profile_default/
94
+ ipython_config.py
95
+
96
+ # pyenv
97
+ # For a library or package, you might want to ignore these files since the code is
98
+ # intended to run in multiple environments; otherwise, check them in:
99
+ # .python-version
100
+
101
+ # pipenv
102
+ # According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control.
103
+ # However, in case of collaboration, if having platform-specific dependencies or dependencies
104
+ # having no cross-platform support, pipenv may install dependencies that don't work, or not
105
+ # install all needed dependencies.
106
+ #Pipfile.lock
107
+
108
+ # poetry
109
+ # Similar to Pipfile.lock, it is generally recommended to include poetry.lock in version control.
110
+ # This is especially recommended for binary packages to ensure reproducibility, and is more
111
+ # commonly ignored for libraries.
112
+ # https://python-poetry.org/docs/basic-usage/#commit-your-poetrylock-file-to-version-control
113
+ #poetry.lock
114
+
115
+ # pdm
116
+ # Similar to Pipfile.lock, it is generally recommended to include pdm.lock in version control.
117
+ #pdm.lock
118
+ # pdm stores project-wide configurations in .pdm.toml, but it is recommended to not include it
119
+ # in version control.
120
+ # https://pdm.fming.dev/latest/usage/project/#working-with-version-control
121
+ .pdm.toml
122
+ .pdm-python
123
+ .pdm-build/
124
+
125
+ # PEP 582; used by e.g. github.com/David-OConnor/pyflow and github.com/pdm-project/pdm
126
+ __pypackages__/
127
+
128
+ # Celery stuff
129
+ celerybeat-schedule
130
+ celerybeat.pid
131
+
132
+ # SageMath parsed files
133
+ *.sage.py
134
+
135
+ # Environments
136
+ .env
137
+ .venv
138
+ env/
139
+ venv/
140
+ ENV/
141
+ env.bak/
142
+ venv.bak/
143
+
144
+ # Spyder project settings
145
+ .spyderproject
146
+ .spyproject
147
+
148
+ # Rope project settings
149
+ .ropeproject
150
+
151
+ # mkdocs documentation
152
+ /site
153
+
154
+ # mypy
155
+ .mypy_cache/
156
+ .dmypy.json
157
+ dmypy.json
158
+
159
+ # Pyre type checker
160
+ .pyre/
161
+
162
+ # pytype static type analyzer
163
+ .pytype/
164
+
165
+ # Cython debug symbols
166
+ cython_debug/
167
+
168
+ # PyCharm
169
+ # JetBrains specific template is maintained in a separate JetBrains.gitignore that can
170
+ # be found at https://github.com/github/gitignore/blob/main/Global/JetBrains.gitignore
171
+ # and can be added to the global gitignore or merged into this file. For a more nuclear
172
+ # option (not recommended) you can uncomment the following to ignore the entire idea folder.
173
+ #.idea/
.gitmodules ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ [submodule "src/third_party/BigVGAN"]
2
+ path = src/third_party/BigVGAN
3
+ url = https://github.com/NVIDIA/BigVGAN.git
.pre-commit-config.yaml ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ repos:
2
+ - repo: https://github.com/astral-sh/ruff-pre-commit
3
+ # Ruff version.
4
+ rev: v0.7.0
5
+ hooks:
6
+ # Run the linter.
7
+ - id: ruff
8
+ args: [--fix]
9
+ # Run the formatter.
10
+ - id: ruff-format
11
+ - repo: https://github.com/pre-commit/pre-commit-hooks
12
+ rev: v2.3.0
13
+ hooks:
14
+ - id: check-yaml
Dockerfile ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ FROM pytorch/pytorch:2.4.0-cuda12.4-cudnn9-devel
2
+
3
+ USER root
4
+
5
+ ARG DEBIAN_FRONTEND=noninteractive
6
+
7
+ LABEL github_repo="https://github.com/SWivid/F5-TTS"
8
+
9
+ RUN set -x \
10
+ && apt-get update \
11
+ && apt-get -y install wget curl man git less openssl libssl-dev unzip unar build-essential aria2 tmux vim \
12
+ && apt-get install -y openssh-server sox libsox-fmt-all libsox-fmt-mp3 libsndfile1-dev ffmpeg \
13
+ && rm -rf /var/lib/apt/lists/* \
14
+ && apt-get clean
15
+
16
+ WORKDIR /workspace
17
+
18
+ RUN git clone https://github.com/SWivid/F5-TTS.git \
19
+ && cd F5-TTS \
20
+ && pip install -e .[eval]
21
+
22
+ ENV SHELL=/bin/bash
23
+
24
+ WORKDIR /workspace/F5-TTS
LICENSE ADDED
@@ -0,0 +1,21 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ MIT License
2
+
3
+ Copyright (c) 2024 Yushen CHEN
4
+
5
+ Permission is hereby granted, free of charge, to any person obtaining a copy
6
+ of this software and associated documentation files (the "Software"), to deal
7
+ in the Software without restriction, including without limitation the rights
8
+ to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
9
+ copies of the Software, and to permit persons to whom the Software is
10
+ furnished to do so, subject to the following conditions:
11
+
12
+ The above copyright notice and this permission notice shall be included in all
13
+ copies or substantial portions of the Software.
14
+
15
+ THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16
+ IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17
+ FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
18
+ AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19
+ LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20
+ OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
21
+ SOFTWARE.
README.md CHANGED
@@ -0,0 +1,153 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # F5-TTS: A Fairytaler that Fakes Fluent and Faithful Speech with Flow Matching
2
+
3
+ **F5-TTS**: Diffusion Transformer with ConvNeXt V2, with faster training and inference.
4
+
5
+ **E2 TTS**: Flat-UNet Transformer, closest reproduction from [paper](https://arxiv.org/abs/2406.18009).
6
+
7
+ **Sway Sampling**: Inference-time flow step sampling strategy that greatly improves performance.
8
+
9
+ ### Thanks to all the contributors!
10
+
11
+ ## News
12
+ Spanish model: https://huggingface.co/jpgallegoar/F5-Spanish/
13
+
14
+ ## Installation
15
+
16
+ ```bash
17
+ # Create a python 3.10 conda env (you could also use virtualenv)
18
+ conda create -n f5-tts python=3.10
19
+ conda activate f5-tts
20
+
21
+ # Install pytorch with your CUDA version, e.g.
22
+ pip install torch==2.3.0+cu118 torchaudio==2.3.0+cu118 --extra-index-url https://download.pytorch.org/whl/cu118
23
+ ```
24
+
25
+ Then you can choose from a few options below:
26
+
27
+ ### 1. As a pip package (if just for inference)
28
+
29
+ ```bash
30
+ pip install git+https://github.com/jpgallegoar/Spanish-F5.git
31
+ ```
32
+
33
+ ### 2. Local editable (if also do training, finetuning)
34
+
35
+ ```bash
36
+ git clone https://github.com/jpgallegoar/Spanish-F5.git
37
+ cd Spanish-F5
38
+ # git submodule update --init --recursive # (optional, if need bigvgan)
39
+ pip install -e .
40
+ ```
41
+ If you initialize the submodule, add the following code at the beginning of `src/third_party/BigVGAN/bigvgan.py`:
42
+ ```python
43
+ import os
44
+ import sys
45
+ sys.path.append(os.path.dirname(os.path.abspath(__file__)))
46
+ ```
47
+
48
+ ## Inference
49
+
50
+ ### 1. Gradio App
51
+
52
+ Currently supported features:
53
+
54
+ - Basic TTS with Chunk Inference
55
+ - Multi-Style / Multi-Speaker Generation
56
+ - Voice Chat powered by Qwen2.5-3B-Instruct
57
+
58
+ ```bash
59
+ # Launch a Gradio app (web interface)
60
+ f5-tts_infer-gradio
61
+
62
+ # Specify the port/host
63
+ f5-tts_infer-gradio --port 7860 --host 0.0.0.0
64
+
65
+ # Launch a share link
66
+ f5-tts_infer-gradio --share
67
+ ```
68
+
69
+ ### 2. CLI Inference
70
+
71
+ ```bash
72
+ # Run with flags
73
+ # Leaving --ref_text "" empty makes the ASR model transcribe the reference audio (extra GPU memory usage)
74
+ f5-tts_infer-cli \
75
+ --model "F5-TTS" \
76
+ --ref_audio "ref_audio.wav" \
77
+ --ref_text "The content, subtitle or transcription of reference audio." \
78
+ --gen_text "Some text you want TTS model generate for you."
79
+
80
+ # Run with default setting. src/f5_tts/infer/examples/basic/basic.toml
81
+ f5-tts_infer-cli
82
+ # Or with your own .toml file
83
+ f5-tts_infer-cli -c custom.toml
84
+
85
+ # Multi voice. See src/f5_tts/infer/README.md
86
+ f5-tts_infer-cli -c src/f5_tts/infer/examples/multi/story.toml
87
+ ```
88
+
89
+ ### 3. More instructions
90
+
91
+ - In order to have better generation results, take a moment to read [detailed guidance](src/f5_tts/infer).
92
+ - The [Issues](https://github.com/SWivid/F5-TTS/issues?q=is%3Aissue) are very useful; please try to find a solution by searching for keywords related to the problem you encountered. If no answer is found, feel free to open an issue.
93
+
94
+
95
+ ## Training
96
+
97
+ ### 1. Gradio App
98
+
99
+ Read [training & finetuning guidance](src/f5_tts/train) for more instructions.
100
+
101
+ ```bash
102
+ # Quick start with Gradio web interface
103
+ f5-tts_finetune-gradio
104
+ ```
105
+
106
+
107
+ ## [Evaluation](src/f5_tts/eval)
108
+
109
+
110
+ ## Development
111
+
112
+ Use pre-commit to ensure code quality (will run linters and formatters automatically)
113
+
114
+ ```bash
115
+ pip install pre-commit
116
+ pre-commit install
117
+ ```
118
+
119
+ When making a pull request, before each commit, run:
120
+
121
+ ```bash
122
+ pre-commit run --all-files
123
+ ```
124
+
125
+ Note: Some model components have linting exceptions for E722 to accommodate tensor notation
126
+
127
+
128
+ ## Acknowledgements
129
+
130
+ - [E2-TTS](https://arxiv.org/abs/2406.18009) brilliant work, simple and effective
131
+ - [Emilia](https://arxiv.org/abs/2407.05361), [WenetSpeech4TTS](https://arxiv.org/abs/2406.05763) valuable datasets
132
+ - [lucidrains](https://github.com/lucidrains) initial CFM structure with also [bfs18](https://github.com/bfs18) for discussion
133
+ - [SD3](https://arxiv.org/abs/2403.03206) & [Hugging Face diffusers](https://github.com/huggingface/diffusers) DiT and MMDiT code structure
134
+ - [torchdiffeq](https://github.com/rtqichen/torchdiffeq) as ODE solver, [Vocos](https://huggingface.co/charactr/vocos-mel-24khz) as vocoder
135
+ - [FunASR](https://github.com/modelscope/FunASR), [faster-whisper](https://github.com/SYSTRAN/faster-whisper), [UniSpeech](https://github.com/microsoft/UniSpeech) for evaluation tools
136
+ - [ctc-forced-aligner](https://github.com/MahmoudAshraf97/ctc-forced-aligner) for speech edit test
137
+ - [mrfakename](https://x.com/realmrfakename) huggingface space demo ~
138
+ - [f5-tts-mlx](https://github.com/lucasnewman/f5-tts-mlx/tree/main) Implementation with MLX framework by [Lucas Newman](https://github.com/lucasnewman)
139
+ - [F5-TTS-ONNX](https://github.com/DakeQQ/F5-TTS-ONNX) ONNX Runtime version by [DakeQQ](https://github.com/DakeQQ)
140
+
141
+ ## Citation
142
+ If our work and codebase are useful for you, please cite as:
143
+ ```
144
+ @article{chen-etal-2024-f5tts,
145
+ title={F5-TTS: A Fairytaler that Fakes Fluent and Faithful Speech with Flow Matching},
146
+ author={Yushen Chen and Zhikang Niu and Ziyang Ma and Keqi Deng and Chunhui Wang and Jian Zhao and Kai Yu and Xie Chen},
147
+ journal={arXiv preprint arXiv:2410.06885},
148
+ year={2024},
149
+ }
150
+ ```
151
+ ## License
152
+
153
+ Our code is released under MIT License. The pre-trained models are licensed under the CC-BY-NC license due to the training data Emilia, which is an in-the-wild dataset. Sorry for any inconvenience this may cause.
Spanish_F5.ipynb ADDED
@@ -0,0 +1,433 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "nbformat": 4,
3
+ "nbformat_minor": 0,
4
+ "metadata": {
5
+ "colab": {
6
+ "provenance": []
7
+ },
8
+ "kernelspec": {
9
+ "name": "python3",
10
+ "display_name": "Python 3"
11
+ },
12
+ "language_info": {
13
+ "name": "python"
14
+ }
15
+ },
16
+ "cells": [
17
+ {
18
+ "cell_type": "code",
19
+ "execution_count": 1,
20
+ "metadata": {
21
+ "colab": {
22
+ "base_uri": "https://localhost:8080/"
23
+ },
24
+ "id": "0-duLUr_Iema",
25
+ "outputId": "615d30a6-2a04-4859-ad9d-79edd6a3ffc1"
26
+ },
27
+ "outputs": [
28
+ {
29
+ "output_type": "stream",
30
+ "name": "stdout",
31
+ "text": [
32
+ "Collecting git+https://github.com/jpgallegoar/Spanish-F5.git\n",
33
+ " Cloning https://github.com/jpgallegoar/Spanish-F5.git to /tmp/pip-req-build-mupnta95\n",
34
+ " Running command git clone --filter=blob:none --quiet https://github.com/jpgallegoar/Spanish-F5.git /tmp/pip-req-build-mupnta95\n",
35
+ " Resolved https://github.com/jpgallegoar/Spanish-F5.git to commit 840d95016e3dd838ee3e7bbe30c64fdced73a7ef\n",
36
+ " Running command git submodule update --init --recursive -q\n",
37
+ " Installing build dependencies ... \u001b[?25l\u001b[?25hdone\n",
38
+ " Getting requirements to build wheel ... \u001b[?25l\u001b[?25hdone\n",
39
+ " Preparing metadata (pyproject.toml) ... \u001b[?25l\u001b[?25hdone\n",
40
+ "Requirement already satisfied: accelerate>=0.33.0 in /usr/local/lib/python3.10/dist-packages (from f5-tts==0.0.0) (0.34.2)\n",
41
+ "Collecting bitsandbytes>0.37.0 (from f5-tts==0.0.0)\n",
42
+ " Downloading bitsandbytes-0.44.1-py3-none-manylinux_2_24_x86_64.whl.metadata (3.5 kB)\n",
43
+ "Collecting cached-path (from f5-tts==0.0.0)\n",
44
+ " Downloading cached_path-1.6.3-py3-none-any.whl.metadata (19 kB)\n",
45
+ "Requirement already satisfied: click in /usr/local/lib/python3.10/dist-packages (from f5-tts==0.0.0) (8.1.7)\n",
46
+ "Collecting datasets (from f5-tts==0.0.0)\n",
47
+ " Downloading datasets-3.1.0-py3-none-any.whl.metadata (20 kB)\n",
48
+ "Collecting ema-pytorch>=0.5.2 (from f5-tts==0.0.0)\n",
49
+ " Downloading ema_pytorch-0.7.3-py3-none-any.whl.metadata (691 bytes)\n",
50
+ "Collecting gradio>=3.45.2 (from f5-tts==0.0.0)\n",
51
+ " Downloading gradio-5.4.0-py3-none-any.whl.metadata (16 kB)\n",
52
+ "Requirement already satisfied: jieba in /usr/local/lib/python3.10/dist-packages (from f5-tts==0.0.0) (0.42.1)\n",
53
+ "Requirement already satisfied: librosa in /usr/local/lib/python3.10/dist-packages (from f5-tts==0.0.0) (0.10.2.post1)\n",
54
+ "Requirement already satisfied: matplotlib in /usr/local/lib/python3.10/dist-packages (from f5-tts==0.0.0) (3.8.0)\n",
55
+ "Requirement already satisfied: numpy<=1.26.4 in /usr/local/lib/python3.10/dist-packages (from f5-tts==0.0.0) (1.26.4)\n",
56
+ "Collecting pydub (from f5-tts==0.0.0)\n",
57
+ " Downloading pydub-0.25.1-py2.py3-none-any.whl.metadata (1.4 kB)\n",
58
+ "Collecting pypinyin (from f5-tts==0.0.0)\n",
59
+ " Downloading pypinyin-0.53.0-py2.py3-none-any.whl.metadata (12 kB)\n",
60
+ "Requirement already satisfied: safetensors in /usr/local/lib/python3.10/dist-packages (from f5-tts==0.0.0) (0.4.5)\n",
61
+ "Requirement already satisfied: soundfile in /usr/local/lib/python3.10/dist-packages (from f5-tts==0.0.0) (0.12.1)\n",
62
+ "Requirement already satisfied: tomli in /usr/local/lib/python3.10/dist-packages (from f5-tts==0.0.0) (2.0.2)\n",
63
+ "Requirement already satisfied: torch>=2.0.0 in /usr/local/lib/python3.10/dist-packages (from f5-tts==0.0.0) (2.5.0+cu121)\n",
64
+ "Requirement already satisfied: torchaudio>=2.0.0 in /usr/local/lib/python3.10/dist-packages (from f5-tts==0.0.0) (2.5.0+cu121)\n",
65
+ "Collecting torchdiffeq (from f5-tts==0.0.0)\n",
66
+ " Downloading torchdiffeq-0.2.4-py3-none-any.whl.metadata (440 bytes)\n",
67
+ "Requirement already satisfied: tqdm>=4.65.0 in /usr/local/lib/python3.10/dist-packages (from f5-tts==0.0.0) (4.66.6)\n",
68
+ "Requirement already satisfied: transformers in /usr/local/lib/python3.10/dist-packages (from f5-tts==0.0.0) (4.44.2)\n",
69
+ "Collecting transformers-stream-generator (from f5-tts==0.0.0)\n",
70
+ " Downloading transformers-stream-generator-0.0.5.tar.gz (13 kB)\n",
71
+ " Preparing metadata (setup.py) ... \u001b[?25l\u001b[?25hdone\n",
72
+ "Collecting vocos (from f5-tts==0.0.0)\n",
73
+ " Downloading vocos-0.1.0-py3-none-any.whl.metadata (4.8 kB)\n",
74
+ "Requirement already satisfied: wandb in /usr/local/lib/python3.10/dist-packages (from f5-tts==0.0.0) (0.18.5)\n",
75
+ "Collecting x-transformers>=1.31.14 (from f5-tts==0.0.0)\n",
76
+ " Downloading x_transformers-1.42.5-py3-none-any.whl.metadata (689 bytes)\n",
77
+ "Requirement already satisfied: packaging>=20.0 in /usr/local/lib/python3.10/dist-packages (from accelerate>=0.33.0->f5-tts==0.0.0) (24.1)\n",
78
+ "Requirement already satisfied: psutil in /usr/local/lib/python3.10/dist-packages (from accelerate>=0.33.0->f5-tts==0.0.0) (5.9.5)\n",
79
+ "Requirement already satisfied: pyyaml in /usr/local/lib/python3.10/dist-packages (from accelerate>=0.33.0->f5-tts==0.0.0) (6.0.2)\n",
80
+ "Requirement already satisfied: huggingface-hub>=0.21.0 in /usr/local/lib/python3.10/dist-packages (from accelerate>=0.33.0->f5-tts==0.0.0) (0.24.7)\n",
81
+ "Collecting aiofiles<24.0,>=22.0 (from gradio>=3.45.2->f5-tts==0.0.0)\n",
82
+ " Downloading aiofiles-23.2.1-py3-none-any.whl.metadata (9.7 kB)\n",
83
+ "Requirement already satisfied: anyio<5.0,>=3.0 in /usr/local/lib/python3.10/dist-packages (from gradio>=3.45.2->f5-tts==0.0.0) (3.7.1)\n",
84
+ "Collecting fastapi<1.0,>=0.115.2 (from gradio>=3.45.2->f5-tts==0.0.0)\n",
85
+ " Downloading fastapi-0.115.4-py3-none-any.whl.metadata (27 kB)\n",
86
+ "Collecting ffmpy (from gradio>=3.45.2->f5-tts==0.0.0)\n",
87
+ " Downloading ffmpy-0.4.0-py3-none-any.whl.metadata (2.9 kB)\n",
88
+ "Collecting gradio-client==1.4.2 (from gradio>=3.45.2->f5-tts==0.0.0)\n",
89
+ " Downloading gradio_client-1.4.2-py3-none-any.whl.metadata (7.1 kB)\n",
90
+ "Requirement already satisfied: httpx>=0.24.1 in /usr/local/lib/python3.10/dist-packages (from gradio>=3.45.2->f5-tts==0.0.0) (0.27.2)\n",
91
+ "Collecting huggingface-hub>=0.21.0 (from accelerate>=0.33.0->f5-tts==0.0.0)\n",
92
+ " Downloading huggingface_hub-0.26.2-py3-none-any.whl.metadata (13 kB)\n",
93
+ "Requirement already satisfied: jinja2<4.0 in /usr/local/lib/python3.10/dist-packages (from gradio>=3.45.2->f5-tts==0.0.0) (3.1.4)\n",
94
+ "Collecting markupsafe~=2.0 (from gradio>=3.45.2->f5-tts==0.0.0)\n",
95
+ " Downloading MarkupSafe-2.1.5-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl.metadata (3.0 kB)\n",
96
+ "Requirement already satisfied: orjson~=3.0 in /usr/local/lib/python3.10/dist-packages (from gradio>=3.45.2->f5-tts==0.0.0) (3.10.10)\n",
97
+ "Requirement already satisfied: pandas<3.0,>=1.0 in /usr/local/lib/python3.10/dist-packages (from gradio>=3.45.2->f5-tts==0.0.0) (2.2.2)\n",
98
+ "Requirement already satisfied: pillow<12.0,>=8.0 in /usr/local/lib/python3.10/dist-packages (from gradio>=3.45.2->f5-tts==0.0.0) (10.4.0)\n",
99
+ "Requirement already satisfied: pydantic>=2.0 in /usr/local/lib/python3.10/dist-packages (from gradio>=3.45.2->f5-tts==0.0.0) (2.9.2)\n",
100
+ "Collecting python-multipart==0.0.12 (from gradio>=3.45.2->f5-tts==0.0.0)\n",
101
+ " Downloading python_multipart-0.0.12-py3-none-any.whl.metadata (1.9 kB)\n",
102
+ "Collecting ruff>=0.2.2 (from gradio>=3.45.2->f5-tts==0.0.0)\n",
103
+ " Downloading ruff-0.7.2-py3-none-manylinux_2_17_x86_64.manylinux2014_x86_64.whl.metadata (25 kB)\n",
104
+ "Collecting safehttpx<1.0,>=0.1.1 (from gradio>=3.45.2->f5-tts==0.0.0)\n",
105
+ " Downloading safehttpx-0.1.1-py3-none-any.whl.metadata (4.1 kB)\n",
106
+ "Collecting semantic-version~=2.0 (from gradio>=3.45.2->f5-tts==0.0.0)\n",
107
+ " Downloading semantic_version-2.10.0-py2.py3-none-any.whl.metadata (9.7 kB)\n",
108
+ "Collecting starlette<1.0,>=0.40.0 (from gradio>=3.45.2->f5-tts==0.0.0)\n",
109
+ " Downloading starlette-0.41.2-py3-none-any.whl.metadata (6.0 kB)\n",
110
+ "Collecting tomlkit==0.12.0 (from gradio>=3.45.2->f5-tts==0.0.0)\n",
111
+ " Downloading tomlkit-0.12.0-py3-none-any.whl.metadata (2.7 kB)\n",
112
+ "Requirement already satisfied: typer<1.0,>=0.12 in /usr/local/lib/python3.10/dist-packages (from gradio>=3.45.2->f5-tts==0.0.0) (0.12.5)\n",
113
+ "Requirement already satisfied: typing-extensions~=4.0 in /usr/local/lib/python3.10/dist-packages (from gradio>=3.45.2->f5-tts==0.0.0) (4.12.2)\n",
114
+ "Collecting uvicorn>=0.14.0 (from gradio>=3.45.2->f5-tts==0.0.0)\n",
115
+ " Downloading uvicorn-0.32.0-py3-none-any.whl.metadata (6.6 kB)\n",
116
+ "Requirement already satisfied: fsspec in /usr/local/lib/python3.10/dist-packages (from gradio-client==1.4.2->gradio>=3.45.2->f5-tts==0.0.0) (2024.10.0)\n",
117
+ "Collecting websockets<13.0,>=10.0 (from gradio-client==1.4.2->gradio>=3.45.2->f5-tts==0.0.0)\n",
118
+ " Downloading websockets-12.0-cp310-cp310-manylinux_2_5_x86_64.manylinux1_x86_64.manylinux_2_17_x86_64.manylinux2014_x86_64.whl.metadata (6.6 kB)\n",
119
+ "Requirement already satisfied: filelock in /usr/local/lib/python3.10/dist-packages (from torch>=2.0.0->f5-tts==0.0.0) (3.16.1)\n",
120
+ "Requirement already satisfied: networkx in /usr/local/lib/python3.10/dist-packages (from torch>=2.0.0->f5-tts==0.0.0) (3.4.2)\n",
121
+ "Requirement already satisfied: sympy==1.13.1 in /usr/local/lib/python3.10/dist-packages (from torch>=2.0.0->f5-tts==0.0.0) (1.13.1)\n",
122
+ "Requirement already satisfied: mpmath<1.4,>=1.1.0 in /usr/local/lib/python3.10/dist-packages (from sympy==1.13.1->torch>=2.0.0->f5-tts==0.0.0) (1.3.0)\n",
123
+ "Collecting einx>=0.3.0 (from x-transformers>=1.31.14->f5-tts==0.0.0)\n",
124
+ " Downloading einx-0.3.0-py3-none-any.whl.metadata (6.9 kB)\n",
125
+ "Requirement already satisfied: einops>=0.8.0 in /usr/local/lib/python3.10/dist-packages (from x-transformers>=1.31.14->f5-tts==0.0.0) (0.8.0)\n",
126
+ "Requirement already satisfied: requests<3.0,>=2.0 in /usr/local/lib/python3.10/dist-packages (from cached-path->f5-tts==0.0.0) (2.32.3)\n",
127
+ "Requirement already satisfied: rich<14.0,>=12.1 in /usr/local/lib/python3.10/dist-packages (from cached-path->f5-tts==0.0.0) (13.9.3)\n",
128
+ "Collecting filelock (from torch>=2.0.0->f5-tts==0.0.0)\n",
129
+ " Downloading filelock-3.13.4-py3-none-any.whl.metadata (2.8 kB)\n",
130
+ "Collecting boto3<2.0,>=1.0 (from cached-path->f5-tts==0.0.0)\n",
131
+ " Downloading boto3-1.35.54-py3-none-any.whl.metadata (6.7 kB)\n",
132
+ "Requirement already satisfied: google-cloud-storage<3.0,>=1.32.0 in /usr/local/lib/python3.10/dist-packages (from cached-path->f5-tts==0.0.0) (2.8.0)\n",
133
+ "INFO: pip is looking at multiple versions of cached-path to determine which version is compatible with other requirements. This could take a while.\n",
134
+ "Collecting cached-path (from f5-tts==0.0.0)\n",
135
+ " Downloading cached_path-1.6.2-py3-none-any.whl.metadata (19 kB)\n",
136
+ " Downloading cached_path-1.6.0-py3-none-any.whl.metadata (19 kB)\n",
137
+ " Downloading cached_path-1.5.1-py3-none-any.whl.metadata (19 kB)\n",
138
+ "Collecting filelock (from torch>=2.0.0->f5-tts==0.0.0)\n",
139
+ " Downloading filelock-3.12.4-py3-none-any.whl.metadata (2.8 kB)\n",
140
+ "Collecting cached-path (from f5-tts==0.0.0)\n",
141
+ " Downloading cached_path-1.5.0-py3-none-any.whl.metadata (19 kB)\n",
142
+ " Downloading cached_path-1.4.0-py3-none-any.whl.metadata (6.3 kB)\n",
143
+ " Downloading cached_path-1.3.5-py3-none-any.whl.metadata (6.3 kB)\n",
144
+ " Downloading cached_path-1.3.4-py3-none-any.whl.metadata (6.3 kB)\n",
145
+ "Collecting filelock (from torch>=2.0.0->f5-tts==0.0.0)\n",
146
+ " Downloading filelock-3.9.1-py3-none-any.whl.metadata (2.4 kB)\n",
147
+ "INFO: pip is still looking at multiple versions of cached-path to determine which version is compatible with other requirements. This could take a while.\n",
148
+ "Collecting cached-path (from f5-tts==0.0.0)\n",
149
+ " Downloading cached_path-1.3.3-py3-none-any.whl.metadata (6.3 kB)\n",
150
+ " Downloading cached_path-1.3.2-py3-none-any.whl.metadata (6.3 kB)\n",
151
+ " Downloading cached_path-1.3.1-py3-none-any.whl.metadata (6.3 kB)\n",
152
+ " Downloading cached_path-1.3.0-py3-none-any.whl.metadata (6.3 kB)\n",
153
+ " Downloading cached_path-1.2.0-py3-none-any.whl.metadata (6.0 kB)\n",
154
+ "INFO: This is taking longer than usual. You might need to provide the dependency resolver with stricter constraints to reduce runtime. See https://pip.pypa.io/warnings/backtracking for guidance. If you want to abort this run, press Ctrl + C.\n",
155
+ " Downloading cached_path-1.1.6-py3-none-any.whl.metadata (6.0 kB)\n",
156
+ "Collecting rich<13.0,>=12.1 (from cached-path->f5-tts==0.0.0)\n",
157
+ " Downloading rich-12.6.0-py3-none-any.whl.metadata (18 kB)\n",
158
+ "Collecting filelock (from torch>=2.0.0->f5-tts==0.0.0)\n",
159
+ " Downloading filelock-3.8.2-py3-none-any.whl.metadata (2.3 kB)\n",
160
+ "Collecting cached-path (from f5-tts==0.0.0)\n",
161
+ " Downloading cached_path-1.1.5-py3-none-any.whl.metadata (6.0 kB)\n",
162
+ "Collecting filelock (from torch>=2.0.0->f5-tts==0.0.0)\n",
163
+ " Downloading filelock-3.7.1-py3-none-any.whl.metadata (2.5 kB)\n",
164
+ "Collecting cached-path (from f5-tts==0.0.0)\n",
165
+ " Downloading cached_path-1.1.4-py3-none-any.whl.metadata (6.0 kB)\n",
166
+ " Downloading cached_path-1.1.3-py3-none-any.whl.metadata (6.0 kB)\n",
167
+ " Downloading cached_path-1.1.2-py3-none-any.whl.metadata (6.0 kB)\n",
168
+ " Downloading cached_path-1.1.1-py3-none-any.whl.metadata (6.0 kB)\n",
169
+ " Downloading cached_path-1.1.0-py3-none-any.whl.metadata (6.0 kB)\n",
170
+ " Downloading cached_path-1.0.2-py3-none-any.whl.metadata (6.0 kB)\n",
171
+ " Downloading cached_path-1.0.1-py3-none-any.whl.metadata (5.9 kB)\n",
172
+ " Downloading cached_path-1.0.0-py3-none-any.whl.metadata (5.9 kB)\n",
173
+ " Downloading cached_path-0.3.4-py3-none-any.whl.metadata (6.0 kB)\n",
174
+ " Downloading cached_path-0.3.3-py3-none-any.whl.metadata (6.0 kB)\n",
175
+ " Downloading cached_path-0.3.2-py3-none-any.whl.metadata (6.0 kB)\n",
176
+ " Downloading cached_path-0.3.1-py3-none-any.whl.metadata (5.1 kB)\n",
177
+ " Downloading cached_path-0.3.0-py3-none-any.whl.metadata (4.1 kB)\n",
178
+ "Collecting google-cloud-storage<2.0,>=1.0 (from cached-path->f5-tts==0.0.0)\n",
179
+ " Downloading google_cloud_storage-1.44.0-py2.py3-none-any.whl.metadata (5.9 kB)\n",
180
+ "Collecting overrides<6.2,>=3.1 (from cached-path->f5-tts==0.0.0)\n",
181
+ " Downloading overrides-6.1.0-py3-none-any.whl.metadata (5.0 kB)\n",
182
+ "Collecting cached-path (from f5-tts==0.0.0)\n",
183
+ " Downloading cached_path-0.2.0-py3-none-any.whl.metadata (4.1 kB)\n",
184
+ " Downloading cached_path-0.1.0-py3-none-any.whl.metadata (3.4 kB)\n",
185
+ "Collecting overrides==3.1.0 (from cached-path->f5-tts==0.0.0)\n",
186
+ " Downloading overrides-3.1.0.tar.gz (11 kB)\n",
187
+ " Preparing metadata (setup.py) ... \u001b[?25l\u001b[?25hdone\n",
188
+ "Collecting gradio>=3.45.2 (from f5-tts==0.0.0)\n",
189
+ " Downloading gradio-5.3.0-py3-none-any.whl.metadata (15 kB)\n",
190
+ "Collecting python-multipart>=0.0.9 (from gradio>=3.45.2->f5-tts==0.0.0)\n",
191
+ " Downloading python_multipart-0.0.17-py3-none-any.whl.metadata (1.8 kB)\n",
192
+ "Collecting gradio>=3.45.2 (from f5-tts==0.0.0)\n",
193
+ " Downloading gradio-5.1.0-py3-none-any.whl.metadata (15 kB)\n",
194
+ "Collecting gradio-client==1.4.0 (from gradio>=3.45.2->f5-tts==0.0.0)\n",
195
+ " Downloading gradio_client-1.4.0-py3-none-any.whl.metadata (7.1 kB)\n",
196
+ "Collecting gradio>=3.45.2 (from f5-tts==0.0.0)\n",
197
+ " Downloading gradio-5.0.2-py3-none-any.whl.metadata (15 kB)\n",
198
+ " Downloading gradio-5.0.1-py3-none-any.whl.metadata (15 kB)\n",
199
+ " Downloading gradio-5.0.0-py3-none-any.whl.metadata (15 kB)\n",
200
+ " Downloading gradio-4.44.1-py3-none-any.whl.metadata (15 kB)\n",
201
+ "Collecting gradio-client==1.3.0 (from gradio>=3.45.2->f5-tts==0.0.0)\n",
202
+ " Downloading gradio_client-1.3.0-py3-none-any.whl.metadata (7.1 kB)\n",
203
+ "Requirement already satisfied: importlib-resources<7.0,>=1.3 in /usr/local/lib/python3.10/dist-packages (from gradio>=3.45.2->f5-tts==0.0.0) (6.4.5)\n",
204
+ "Requirement already satisfied: urllib3~=2.0 in /usr/local/lib/python3.10/dist-packages (from gradio>=3.45.2->f5-tts==0.0.0) (2.2.3)\n",
205
+ "Collecting huggingface-hub>=0.21.0 (from accelerate>=0.33.0->f5-tts==0.0.0)\n",
206
+ " Downloading huggingface_hub-0.23.5-py3-none-any.whl.metadata (12 kB)\n",
207
+ "Requirement already satisfied: contourpy>=1.0.1 in /usr/local/lib/python3.10/dist-packages (from matplotlib->f5-tts==0.0.0) (1.3.0)\n",
208
+ "Requirement already satisfied: cycler>=0.10 in /usr/local/lib/python3.10/dist-packages (from matplotlib->f5-tts==0.0.0) (0.12.1)\n",
209
+ "Requirement already satisfied: fonttools>=4.22.0 in /usr/local/lib/python3.10/dist-packages (from matplotlib->f5-tts==0.0.0) (4.54.1)\n",
210
+ "Requirement already satisfied: kiwisolver>=1.0.1 in /usr/local/lib/python3.10/dist-packages (from matplotlib->f5-tts==0.0.0) (1.4.7)\n",
211
+ "Requirement already satisfied: pyparsing>=2.3.1 in /usr/local/lib/python3.10/dist-packages (from matplotlib->f5-tts==0.0.0) (3.2.0)\n",
212
+ "Requirement already satisfied: python-dateutil>=2.7 in /usr/local/lib/python3.10/dist-packages (from matplotlib->f5-tts==0.0.0) (2.8.2)\n",
213
+ "Requirement already satisfied: pyarrow>=15.0.0 in /usr/local/lib/python3.10/dist-packages (from datasets->f5-tts==0.0.0) (17.0.0)\n",
214
+ "Collecting dill<0.3.9,>=0.3.0 (from datasets->f5-tts==0.0.0)\n",
215
+ " Downloading dill-0.3.8-py3-none-any.whl.metadata (10 kB)\n",
216
+ "Collecting xxhash (from datasets->f5-tts==0.0.0)\n",
217
+ " Downloading xxhash-3.5.0-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl.metadata (12 kB)\n",
218
+ "Collecting multiprocess<0.70.17 (from datasets->f5-tts==0.0.0)\n",
219
+ " Downloading multiprocess-0.70.16-py310-none-any.whl.metadata (7.2 kB)\n",
220
+ "Collecting fsspec (from gradio-client==1.3.0->gradio>=3.45.2->f5-tts==0.0.0)\n",
221
+ " Downloading fsspec-2024.9.0-py3-none-any.whl.metadata (11 kB)\n",
222
+ "Requirement already satisfied: aiohttp in /usr/local/lib/python3.10/dist-packages (from datasets->f5-tts==0.0.0) (3.10.10)\n",
223
+ "Requirement already satisfied: audioread>=2.1.9 in /usr/local/lib/python3.10/dist-packages (from librosa->f5-tts==0.0.0) (3.0.1)\n",
224
+ "Requirement already satisfied: scipy>=1.2.0 in /usr/local/lib/python3.10/dist-packages (from librosa->f5-tts==0.0.0) (1.13.1)\n",
225
+ "Requirement already satisfied: scikit-learn>=0.20.0 in /usr/local/lib/python3.10/dist-packages (from librosa->f5-tts==0.0.0) (1.5.2)\n",
226
+ "Requirement already satisfied: joblib>=0.14 in /usr/local/lib/python3.10/dist-packages (from librosa->f5-tts==0.0.0) (1.4.2)\n",
227
+ "Requirement already satisfied: decorator>=4.3.0 in /usr/local/lib/python3.10/dist-packages (from librosa->f5-tts==0.0.0) (4.4.2)\n",
228
+ "Requirement already satisfied: numba>=0.51.0 in /usr/local/lib/python3.10/dist-packages (from librosa->f5-tts==0.0.0) (0.60.0)\n",
229
+ "Requirement already satisfied: pooch>=1.1 in /usr/local/lib/python3.10/dist-packages (from librosa->f5-tts==0.0.0) (1.8.2)\n",
230
+ "Requirement already satisfied: soxr>=0.3.2 in /usr/local/lib/python3.10/dist-packages (from librosa->f5-tts==0.0.0) (0.5.0.post1)\n",
231
+ "Requirement already satisfied: lazy-loader>=0.1 in /usr/local/lib/python3.10/dist-packages (from librosa->f5-tts==0.0.0) (0.4)\n",
232
+ "Requirement already satisfied: msgpack>=1.0 in /usr/local/lib/python3.10/dist-packages (from librosa->f5-tts==0.0.0) (1.1.0)\n",
233
+ "Requirement already satisfied: cffi>=1.0 in /usr/local/lib/python3.10/dist-packages (from soundfile->f5-tts==0.0.0) (1.17.1)\n",
234
+ "Requirement already satisfied: regex!=2019.12.17 in /usr/local/lib/python3.10/dist-packages (from transformers->f5-tts==0.0.0) (2024.9.11)\n",
235
+ "Requirement already satisfied: tokenizers<0.20,>=0.19 in /usr/local/lib/python3.10/dist-packages (from transformers->f5-tts==0.0.0) (0.19.1)\n",
236
+ "Collecting encodec==0.1.1 (from vocos->f5-tts==0.0.0)\n",
237
+ " Downloading encodec-0.1.1.tar.gz (3.7 MB)\n",
238
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m3.7/3.7 MB\u001b[0m \u001b[31m32.5 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
239
+ "\u001b[?25h Preparing metadata (setup.py) ... \u001b[?25l\u001b[?25hdone\n",
240
+ "Requirement already satisfied: docker-pycreds>=0.4.0 in /usr/local/lib/python3.10/dist-packages (from wandb->f5-tts==0.0.0) (0.4.0)\n",
241
+ "Requirement already satisfied: gitpython!=3.1.29,>=1.0.0 in /usr/local/lib/python3.10/dist-packages (from wandb->f5-tts==0.0.0) (3.1.43)\n",
242
+ "Requirement already satisfied: platformdirs in /usr/local/lib/python3.10/dist-packages (from wandb->f5-tts==0.0.0) (4.3.6)\n",
243
+ "Requirement already satisfied: protobuf!=4.21.0,!=5.28.0,<6,>=3.19.0 in /usr/local/lib/python3.10/dist-packages (from wandb->f5-tts==0.0.0) (3.20.3)\n",
244
+ "Requirement already satisfied: sentry-sdk>=2.0.0 in /usr/local/lib/python3.10/dist-packages (from wandb->f5-tts==0.0.0) (2.17.0)\n",
245
+ "Requirement already satisfied: setproctitle in /usr/local/lib/python3.10/dist-packages (from wandb->f5-tts==0.0.0) (1.3.3)\n",
246
+ "Requirement already satisfied: setuptools in /usr/local/lib/python3.10/dist-packages (from wandb->f5-tts==0.0.0) (75.1.0)\n",
247
+ "Requirement already satisfied: idna>=2.8 in /usr/local/lib/python3.10/dist-packages (from anyio<5.0,>=3.0->gradio>=3.45.2->f5-tts==0.0.0) (3.10)\n",
248
+ "Requirement already satisfied: sniffio>=1.1 in /usr/local/lib/python3.10/dist-packages (from anyio<5.0,>=3.0->gradio>=3.45.2->f5-tts==0.0.0) (1.3.1)\n",
249
+ "Requirement already satisfied: exceptiongroup in /usr/local/lib/python3.10/dist-packages (from anyio<5.0,>=3.0->gradio>=3.45.2->f5-tts==0.0.0) (1.2.2)\n",
250
+ "Collecting botocore<1.36.0,>=1.35.54 (from boto3<2.0,>=1.0->cached-path->f5-tts==0.0.0)\n",
251
+ " Downloading botocore-1.35.54-py3-none-any.whl.metadata (5.7 kB)\n",
252
+ "Collecting jmespath<2.0.0,>=0.7.1 (from boto3<2.0,>=1.0->cached-path->f5-tts==0.0.0)\n",
253
+ " Downloading jmespath-1.0.1-py3-none-any.whl.metadata (7.6 kB)\n",
254
+ "Collecting s3transfer<0.11.0,>=0.10.0 (from boto3<2.0,>=1.0->cached-path->f5-tts==0.0.0)\n",
255
+ " Downloading s3transfer-0.10.3-py3-none-any.whl.metadata (1.7 kB)\n",
256
+ "Requirement already satisfied: pycparser in /usr/local/lib/python3.10/dist-packages (from cffi>=1.0->soundfile->f5-tts==0.0.0) (2.22)\n",
257
+ "Requirement already satisfied: six>=1.4.0 in /usr/local/lib/python3.10/dist-packages (from docker-pycreds>=0.4.0->wandb->f5-tts==0.0.0) (1.16.0)\n",
258
+ "Requirement already satisfied: frozendict in /usr/local/lib/python3.10/dist-packages (from einx>=0.3.0->x-transformers>=1.31.14->f5-tts==0.0.0) (2.4.6)\n",
259
+ "Requirement already satisfied: aiohappyeyeballs>=2.3.0 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets->f5-tts==0.0.0) (2.4.3)\n",
260
+ "Requirement already satisfied: aiosignal>=1.1.2 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets->f5-tts==0.0.0) (1.3.1)\n",
261
+ "Requirement already satisfied: attrs>=17.3.0 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets->f5-tts==0.0.0) (24.2.0)\n",
262
+ "Requirement already satisfied: frozenlist>=1.1.1 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets->f5-tts==0.0.0) (1.5.0)\n",
263
+ "Requirement already satisfied: multidict<7.0,>=4.5 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets->f5-tts==0.0.0) (6.1.0)\n",
264
+ "Requirement already satisfied: yarl<2.0,>=1.12.0 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets->f5-tts==0.0.0) (1.17.0)\n",
265
+ "Requirement already satisfied: async-timeout<5.0,>=4.0 in /usr/local/lib/python3.10/dist-packages (from aiohttp->datasets->f5-tts==0.0.0) (4.0.3)\n",
266
+ "Requirement already satisfied: gitdb<5,>=4.0.1 in /usr/local/lib/python3.10/dist-packages (from gitpython!=3.1.29,>=1.0.0->wandb->f5-tts==0.0.0) (4.0.11)\n",
267
+ "Requirement already satisfied: google-auth<3.0dev,>=1.25.0 in /usr/local/lib/python3.10/dist-packages (from google-cloud-storage<3.0,>=1.32.0->cached-path->f5-tts==0.0.0) (2.27.0)\n",
268
+ "Requirement already satisfied: google-api-core!=2.0.*,!=2.1.*,!=2.2.*,!=2.3.0,<3.0.0dev,>=1.31.5 in /usr/local/lib/python3.10/dist-packages (from google-cloud-storage<3.0,>=1.32.0->cached-path->f5-tts==0.0.0) (2.19.2)\n",
269
+ "Requirement already satisfied: google-cloud-core<3.0dev,>=2.3.0 in /usr/local/lib/python3.10/dist-packages (from google-cloud-storage<3.0,>=1.32.0->cached-path->f5-tts==0.0.0) (2.4.1)\n",
270
+ "Requirement already satisfied: google-resumable-media>=2.3.2 in /usr/local/lib/python3.10/dist-packages (from google-cloud-storage<3.0,>=1.32.0->cached-path->f5-tts==0.0.0) (2.7.2)\n",
271
+ "Requirement already satisfied: certifi in /usr/local/lib/python3.10/dist-packages (from httpx>=0.24.1->gradio>=3.45.2->f5-tts==0.0.0) (2024.8.30)\n",
272
+ "Requirement already satisfied: httpcore==1.* in /usr/local/lib/python3.10/dist-packages (from httpx>=0.24.1->gradio>=3.45.2->f5-tts==0.0.0) (1.0.6)\n",
273
+ "Requirement already satisfied: h11<0.15,>=0.13 in /usr/local/lib/python3.10/dist-packages (from httpcore==1.*->httpx>=0.24.1->gradio>=3.45.2->f5-tts==0.0.0) (0.14.0)\n",
274
+ "Requirement already satisfied: llvmlite<0.44,>=0.43.0dev0 in /usr/local/lib/python3.10/dist-packages (from numba>=0.51.0->librosa->f5-tts==0.0.0) (0.43.0)\n",
275
+ "Requirement already satisfied: pytz>=2020.1 in /usr/local/lib/python3.10/dist-packages (from pandas<3.0,>=1.0->gradio>=3.45.2->f5-tts==0.0.0) (2024.2)\n",
276
+ "Requirement already satisfied: tzdata>=2022.7 in /usr/local/lib/python3.10/dist-packages (from pandas<3.0,>=1.0->gradio>=3.45.2->f5-tts==0.0.0) (2024.2)\n",
277
+ "Requirement already satisfied: annotated-types>=0.6.0 in /usr/local/lib/python3.10/dist-packages (from pydantic>=2.0->gradio>=3.45.2->f5-tts==0.0.0) (0.7.0)\n",
278
+ "Requirement already satisfied: pydantic-core==2.23.4 in /usr/local/lib/python3.10/dist-packages (from pydantic>=2.0->gradio>=3.45.2->f5-tts==0.0.0) (2.23.4)\n",
279
+ "Requirement already satisfied: charset-normalizer<4,>=2 in /usr/local/lib/python3.10/dist-packages (from requests<3.0,>=2.0->cached-path->f5-tts==0.0.0) (3.4.0)\n",
280
+ "Requirement already satisfied: markdown-it-py>=2.2.0 in /usr/local/lib/python3.10/dist-packages (from rich<14.0,>=12.1->cached-path->f5-tts==0.0.0) (3.0.0)\n",
281
+ "Requirement already satisfied: pygments<3.0.0,>=2.13.0 in /usr/local/lib/python3.10/dist-packages (from rich<14.0,>=12.1->cached-path->f5-tts==0.0.0) (2.18.0)\n",
282
+ "Requirement already satisfied: threadpoolctl>=3.1.0 in /usr/local/lib/python3.10/dist-packages (from scikit-learn>=0.20.0->librosa->f5-tts==0.0.0) (3.5.0)\n",
283
+ "Requirement already satisfied: shellingham>=1.3.0 in /usr/local/lib/python3.10/dist-packages (from typer<1.0,>=0.12->gradio>=3.45.2->f5-tts==0.0.0) (1.5.4)\n",
284
+ "Requirement already satisfied: smmap<6,>=3.0.1 in /usr/local/lib/python3.10/dist-packages (from gitdb<5,>=4.0.1->gitpython!=3.1.29,>=1.0.0->wandb->f5-tts==0.0.0) (5.0.1)\n",
285
+ "Requirement already satisfied: googleapis-common-protos<2.0.dev0,>=1.56.2 in /usr/local/lib/python3.10/dist-packages (from google-api-core!=2.0.*,!=2.1.*,!=2.2.*,!=2.3.0,<3.0.0dev,>=1.31.5->google-cloud-storage<3.0,>=1.32.0->cached-path->f5-tts==0.0.0) (1.65.0)\n",
286
+ "Requirement already satisfied: proto-plus<2.0.0dev,>=1.22.3 in /usr/local/lib/python3.10/dist-packages (from google-api-core!=2.0.*,!=2.1.*,!=2.2.*,!=2.3.0,<3.0.0dev,>=1.31.5->google-cloud-storage<3.0,>=1.32.0->cached-path->f5-tts==0.0.0) (1.25.0)\n",
287
+ "Requirement already satisfied: cachetools<6.0,>=2.0.0 in /usr/local/lib/python3.10/dist-packages (from google-auth<3.0dev,>=1.25.0->google-cloud-storage<3.0,>=1.32.0->cached-path->f5-tts==0.0.0) (5.5.0)\n",
288
+ "Requirement already satisfied: pyasn1-modules>=0.2.1 in /usr/local/lib/python3.10/dist-packages (from google-auth<3.0dev,>=1.25.0->google-cloud-storage<3.0,>=1.32.0->cached-path->f5-tts==0.0.0) (0.4.1)\n",
289
+ "Requirement already satisfied: rsa<5,>=3.1.4 in /usr/local/lib/python3.10/dist-packages (from google-auth<3.0dev,>=1.25.0->google-cloud-storage<3.0,>=1.32.0->cached-path->f5-tts==0.0.0) (4.9)\n",
290
+ "Requirement already satisfied: google-crc32c<2.0dev,>=1.0 in /usr/local/lib/python3.10/dist-packages (from google-resumable-media>=2.3.2->google-cloud-storage<3.0,>=1.32.0->cached-path->f5-tts==0.0.0) (1.6.0)\n",
291
+ "Requirement already satisfied: mdurl~=0.1 in /usr/local/lib/python3.10/dist-packages (from markdown-it-py>=2.2.0->rich<14.0,>=12.1->cached-path->f5-tts==0.0.0) (0.1.2)\n",
292
+ "Requirement already satisfied: propcache>=0.2.0 in /usr/local/lib/python3.10/dist-packages (from yarl<2.0,>=1.12.0->aiohttp->datasets->f5-tts==0.0.0) (0.2.0)\n",
293
+ "Requirement already satisfied: pyasn1<0.7.0,>=0.4.6 in /usr/local/lib/python3.10/dist-packages (from pyasn1-modules>=0.2.1->google-auth<3.0dev,>=1.25.0->google-cloud-storage<3.0,>=1.32.0->cached-path->f5-tts==0.0.0) (0.6.1)\n",
294
+ "Downloading bitsandbytes-0.44.1-py3-none-manylinux_2_24_x86_64.whl (122.4 MB)\n",
295
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m122.4/122.4 MB\u001b[0m \u001b[31m6.5 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
296
+ "\u001b[?25hDownloading ema_pytorch-0.7.3-py3-none-any.whl (9.6 kB)\n",
297
+ "Downloading gradio-4.44.1-py3-none-any.whl (18.1 MB)\n",
298
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m18.1/18.1 MB\u001b[0m \u001b[31m53.8 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
299
+ "\u001b[?25hDownloading gradio_client-1.3.0-py3-none-any.whl (318 kB)\n",
300
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m318.7/318.7 kB\u001b[0m \u001b[31m17.5 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
301
+ "\u001b[?25hDownloading tomlkit-0.12.0-py3-none-any.whl (37 kB)\n",
302
+ "Downloading cached_path-1.6.3-py3-none-any.whl (35 kB)\n",
303
+ "Downloading huggingface_hub-0.23.5-py3-none-any.whl (402 kB)\n",
304
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m402.8/402.8 kB\u001b[0m \u001b[31m20.1 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
305
+ "\u001b[?25hDownloading x_transformers-1.42.5-py3-none-any.whl (47 kB)\n",
306
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m47.5/47.5 kB\u001b[0m \u001b[31m3.0 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
307
+ "\u001b[?25hDownloading datasets-3.1.0-py3-none-any.whl (480 kB)\n",
308
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m480.6/480.6 kB\u001b[0m \u001b[31m23.5 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
309
+ "\u001b[?25hDownloading pydub-0.25.1-py2.py3-none-any.whl (32 kB)\n",
310
+ "Downloading pypinyin-0.53.0-py2.py3-none-any.whl (834 kB)\n",
311
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m834.7/834.7 kB\u001b[0m \u001b[31m32.8 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
312
+ "\u001b[?25hDownloading torchdiffeq-0.2.4-py3-none-any.whl (32 kB)\n",
313
+ "Downloading vocos-0.1.0-py3-none-any.whl (24 kB)\n",
314
+ "Downloading aiofiles-23.2.1-py3-none-any.whl (15 kB)\n",
315
+ "Downloading boto3-1.35.54-py3-none-any.whl (139 kB)\n",
316
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m139.2/139.2 kB\u001b[0m \u001b[31m9.8 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
317
+ "\u001b[?25hDownloading dill-0.3.8-py3-none-any.whl (116 kB)\n",
318
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m116.3/116.3 kB\u001b[0m \u001b[31m7.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
319
+ "\u001b[?25hDownloading einx-0.3.0-py3-none-any.whl (102 kB)\n",
320
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m103.0/103.0 kB\u001b[0m \u001b[31m5.0 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
321
+ "\u001b[?25hDownloading fastapi-0.115.4-py3-none-any.whl (94 kB)\n",
322
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m94.7/94.7 kB\u001b[0m \u001b[31m4.8 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
323
+ "\u001b[?25hDownloading filelock-3.13.4-py3-none-any.whl (11 kB)\n",
324
+ "Downloading fsspec-2024.9.0-py3-none-any.whl (179 kB)\n",
325
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m179.3/179.3 kB\u001b[0m \u001b[31m9.6 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
326
+ "\u001b[?25hDownloading MarkupSafe-2.1.5-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (25 kB)\n",
327
+ "Downloading multiprocess-0.70.16-py310-none-any.whl (134 kB)\n",
328
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m134.8/134.8 kB\u001b[0m \u001b[31m9.0 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
329
+ "\u001b[?25hDownloading python_multipart-0.0.17-py3-none-any.whl (24 kB)\n",
330
+ "Downloading ruff-0.7.2-py3-none-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (11.0 MB)\n",
331
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m11.0/11.0 MB\u001b[0m \u001b[31m90.8 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
332
+ "\u001b[?25hDownloading semantic_version-2.10.0-py2.py3-none-any.whl (15 kB)\n",
333
+ "Downloading uvicorn-0.32.0-py3-none-any.whl (63 kB)\n",
334
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m63.7/63.7 kB\u001b[0m \u001b[31m4.6 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
335
+ "\u001b[?25hDownloading ffmpy-0.4.0-py3-none-any.whl (5.8 kB)\n",
336
+ "Downloading xxhash-3.5.0-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (194 kB)\n",
337
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m194.1/194.1 kB\u001b[0m \u001b[31m12.6 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
338
+ "\u001b[?25hDownloading botocore-1.35.54-py3-none-any.whl (12.7 MB)\n",
339
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m12.7/12.7 MB\u001b[0m \u001b[31m78.8 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
340
+ "\u001b[?25hDownloading jmespath-1.0.1-py3-none-any.whl (20 kB)\n",
341
+ "Downloading s3transfer-0.10.3-py3-none-any.whl (82 kB)\n",
342
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m82.6/82.6 kB\u001b[0m \u001b[31m5.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
343
+ "\u001b[?25hDownloading starlette-0.41.2-py3-none-any.whl (73 kB)\n",
344
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m73.3/73.3 kB\u001b[0m \u001b[31m5.1 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
345
+ "\u001b[?25hDownloading websockets-12.0-cp310-cp310-manylinux_2_5_x86_64.manylinux1_x86_64.manylinux_2_17_x86_64.manylinux2014_x86_64.whl (130 kB)\n",
346
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m130.2/130.2 kB\u001b[0m \u001b[31m6.5 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
347
+ "\u001b[?25hBuilding wheels for collected packages: f5-tts, transformers-stream-generator, encodec\n",
348
+ " Building wheel for f5-tts (pyproject.toml) ... \u001b[?25l\u001b[?25hdone\n",
349
+ " Created wheel for f5-tts: filename=f5_tts-0.0.0-py3-none-any.whl size=1280758 sha256=b900d02175b3eccb21dec0d1801d9bffc4fd30451509a67ef45a6f0653580c7c\n",
350
+ " Stored in directory: /tmp/pip-ephem-wheel-cache-3_lciyxv/wheels/63/43/c5/fb04687e74a83e9bc15bb575c33e53b6aca4bf7a2fb32982f2\n",
351
+ " Building wheel for transformers-stream-generator (setup.py) ... \u001b[?25l\u001b[?25hdone\n",
352
+ " Created wheel for transformers-stream-generator: filename=transformers_stream_generator-0.0.5-py3-none-any.whl size=12425 sha256=0e9f6ab066ff4bcfa59962bd47464e4dc82ea27afed7086565aad6d86b0b6e5b\n",
353
+ " Stored in directory: /root/.cache/pip/wheels/95/4a/90/140f7b67d125906f6a165f38aad212ecb4a695ad0d87582437\n",
354
+ " Building wheel for encodec (setup.py) ... \u001b[?25l\u001b[?25hdone\n",
355
+ " Created wheel for encodec: filename=encodec-0.1.1-py3-none-any.whl size=45760 sha256=bccc14b58f86cf341371dda33deedf0bd6ef90e06649662b5337eb0e9e785a92\n",
356
+ " Stored in directory: /root/.cache/pip/wheels/fc/36/cb/81af8b985a5f5e0815312d5e52b41263237af07b977e6bcbf3\n",
357
+ "Successfully built f5-tts transformers-stream-generator encodec\n",
358
+ "Installing collected packages: pydub, xxhash, websockets, uvicorn, tomlkit, semantic-version, ruff, python-multipart, pypinyin, markupsafe, jmespath, fsspec, filelock, ffmpy, dill, aiofiles, starlette, multiprocess, huggingface-hub, einx, botocore, s3transfer, gradio-client, fastapi, x-transformers, torchdiffeq, gradio, ema-pytorch, boto3, bitsandbytes, transformers-stream-generator, encodec, datasets, vocos, cached-path, f5-tts\n",
359
+ " Attempting uninstall: markupsafe\n",
360
+ " Found existing installation: MarkupSafe 3.0.2\n",
361
+ " Uninstalling MarkupSafe-3.0.2:\n",
362
+ " Successfully uninstalled MarkupSafe-3.0.2\n",
363
+ " Attempting uninstall: fsspec\n",
364
+ " Found existing installation: fsspec 2024.10.0\n",
365
+ " Uninstalling fsspec-2024.10.0:\n",
366
+ " Successfully uninstalled fsspec-2024.10.0\n",
367
+ " Attempting uninstall: filelock\n",
368
+ " Found existing installation: filelock 3.16.1\n",
369
+ " Uninstalling filelock-3.16.1:\n",
370
+ " Successfully uninstalled filelock-3.16.1\n",
371
+ " Attempting uninstall: huggingface-hub\n",
372
+ " Found existing installation: huggingface-hub 0.24.7\n",
373
+ " Uninstalling huggingface-hub-0.24.7:\n",
374
+ " Successfully uninstalled huggingface-hub-0.24.7\n",
375
+ "\u001b[31mERROR: pip's dependency resolver does not currently take into account all the packages that are installed. This behaviour is the source of the following dependency conflicts.\n",
376
+ "gcsfs 2024.10.0 requires fsspec==2024.10.0, but you have fsspec 2024.9.0 which is incompatible.\n",
377
+ "pytensor 2.25.5 requires filelock>=3.15, but you have filelock 3.13.4 which is incompatible.\u001b[0m\u001b[31m\n",
378
+ "\u001b[0mSuccessfully installed aiofiles-23.2.1 bitsandbytes-0.44.1 boto3-1.35.54 botocore-1.35.54 cached-path-1.6.3 datasets-3.1.0 dill-0.3.8 einx-0.3.0 ema-pytorch-0.7.3 encodec-0.1.1 f5-tts-0.0.0 fastapi-0.115.4 ffmpy-0.4.0 filelock-3.13.4 fsspec-2024.9.0 gradio-4.44.1 gradio-client-1.3.0 huggingface-hub-0.23.5 jmespath-1.0.1 markupsafe-2.1.5 multiprocess-0.70.16 pydub-0.25.1 pypinyin-0.53.0 python-multipart-0.0.17 ruff-0.7.2 s3transfer-0.10.3 semantic-version-2.10.0 starlette-0.41.2 tomlkit-0.12.0 torchdiffeq-0.2.4 transformers-stream-generator-0.0.5 uvicorn-0.32.0 vocos-0.1.0 websockets-12.0 x-transformers-1.42.5 xxhash-3.5.0\n"
379
+ ]
380
+ }
381
+ ],
382
+ "source": [
383
+ "pip install git+https://github.com/jpgallegoar/Spanish-F5.git"
384
+ ]
385
+ },
386
+ {
387
+ "cell_type": "code",
388
+ "source": [
389
+ "!f5-tts_infer-gradio"
390
+ ],
391
+ "metadata": {
392
+ "colab": {
393
+ "base_uri": "https://localhost:8080/"
394
+ },
395
+ "id": "a2LYVge6IhOh",
396
+ "outputId": "be4d8d64-c020-4c97-eb57-ed0ceced7fba"
397
+ },
398
+ "execution_count": null,
399
+ "outputs": [
400
+ {
401
+ "output_type": "stream",
402
+ "name": "stdout",
403
+ "text": [
404
+ "2024-11-04 17:05:51.302161: E external/local_xla/xla/stream_executor/cuda/cuda_fft.cc:485] Unable to register cuFFT factory: Attempting to register factory for plugin cuFFT when one has already been registered\n",
405
+ "2024-11-04 17:05:51.328444: E external/local_xla/xla/stream_executor/cuda/cuda_dnn.cc:8454] Unable to register cuDNN factory: Attempting to register factory for plugin cuDNN when one has already been registered\n",
406
+ "2024-11-04 17:05:51.335942: E external/local_xla/xla/stream_executor/cuda/cuda_blas.cc:1452] Unable to register cuBLAS factory: Attempting to register factory for plugin cuBLAS when one has already been registered\n",
407
+ "2024-11-04 17:05:51.354757: I tensorflow/core/platform/cpu_feature_guard.cc:210] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
408
+ "To enable the following instructions: AVX2 FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
409
+ "2024-11-04 17:05:52.875946: W tensorflow/compiler/tf2tensorrt/utils/py_utils.cc:38] TF-TRT Warning: Could not find TensorRT\n",
410
+ "Download Vocos from huggingface charactr/vocos-mel-24khz\n",
411
+ "config.yaml: 100% 461/461 [00:00<00:00, 2.61MB/s]\n",
412
+ "pytorch_model.bin: 100% 54.4M/54.4M [00:00<00:00, 139MB/s]\n",
413
+ "/usr/local/lib/python3.10/dist-packages/vocos/pretrained.py:70: FutureWarning: You are using `torch.load` with `weights_only=False` (the current default value), which uses the default pickle module implicitly. It is possible to construct malicious pickle data which will execute arbitrary code during unpickling (See https://github.com/pytorch/pytorch/blob/main/SECURITY.md#untrusted-models for more details). In a future release, the default value for `weights_only` will be flipped to `True`. This limits the functions that could be executed during unpickling. Arbitrary objects will no longer be allowed to be loaded via this mode unless they are explicitly allowlisted by the user via `torch.serialization.add_safe_globals`. We recommend you start setting `weights_only=True` for any use case where you don't have full control of the loaded file. Please open an issue on GitHub for any issues related to this experimental feature.\n",
414
+ " state_dict = torch.load(model_path, map_location=\"cpu\")\n",
415
+ "model_1200000.safetensors: 100% 1.35G/1.35G [02:09<00:00, 10.4MB/s]\n",
416
+ "\n",
417
+ "vocab : /usr/local/lib/python3.10/dist-packages/f5_tts/infer/examples/vocab.txt\n",
418
+ "tokenizer : custom\n",
419
+ "model : /root/.cache/huggingface/hub/models--jpgallegoar--F5-Spanish/snapshots/120ddcfa7813b928325a787b9ad2bf038d2c32df/model_1200000.safetensors \n",
420
+ "\n",
421
+ "Starting app...\n",
422
+ "Running on local URL: http://127.0.0.1:7860\n",
423
+ "Running on public URL: https://dd1c9f211495273ff6.gradio.live\n",
424
+ "\n",
425
+ "This share link expires in 72 hours. For free permanent hosting and GPU upgrades, run `gradio deploy` from Terminal to deploy to Spaces (https://huggingface.co/spaces)\n",
426
+ "config.json: 100% 1.26k/1.26k [00:00<00:00, 1.89MB/s]\n",
427
+ "model.safetensors: 21% 336M/1.62G [00:32<02:03, 10.4MB/s]"
428
+ ]
429
+ }
430
+ ]
431
+ }
432
+ ]
433
+ }
pyproject.toml ADDED
@@ -0,0 +1,62 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [build-system]
2
+ requires = ["setuptools >= 61.0", "setuptools-scm>=8.0"]
3
+ build-backend = "setuptools.build_meta"
4
+
5
+ [project]
6
+ name = "f5-tts"
7
+ dynamic = ["version"]
8
+ description = "F5-TTS: A Fairytaler that Fakes Fluent and Faithful Speech with Flow Matching"
9
+ readme = "README.md"
10
+ license = {text = "MIT License"}
11
+ classifiers = [
12
+ "License :: OSI Approved :: MIT License",
13
+ "Operating System :: OS Independent",
14
+ "Programming Language :: Python :: 3",
15
+ ]
16
+ dependencies = [
17
+ "accelerate>=0.33.0",
18
+ "bitsandbytes==0.44.1",
19
+ "cached_path",
20
+ "click",
21
+ "datasets",
22
+ "ema_pytorch>=0.5.2",
23
+ "gradio>=3.45.2",
24
+ "jieba",
25
+ "librosa",
26
+ "matplotlib",
27
+ "numpy<=1.26.4",
28
+ "pydub",
29
+ "pypinyin",
30
+ "safetensors",
31
+ "soundfile",
32
+ "tomli",
33
+ "torch>=2.0.0",
34
+ "torchaudio>=2.0.0",
35
+ "torchdiffeq",
36
+ "tqdm>=4.65.0",
37
+ "transformers",
38
+ "transformers_stream_generator",
39
+ "vocos",
40
+ "wandb",
41
+ "x_transformers>=1.31.14",
42
+ "num2words",
43
+ ]
44
+
45
+ [project.optional-dependencies]
46
+ eval = [
47
+ "faster_whisper==0.10.1",
48
+ "funasr",
49
+ "jiwer",
50
+ "modelscope",
51
+ "zhconv",
52
+ "zhon",
53
+ ]
54
+
55
+ [project.urls]
56
+ Homepage = "https://github.com/SWivid/F5-TTS"
57
+
58
+ [project.scripts]
59
+ "f5-tts_infer-cli" = "f5_tts.infer.infer_cli:main"
60
+ "f5-tts_infer-gradio" = "f5_tts.infer.infer_gradio:main"
61
+ "f5-tts_finetune-cli" = "f5_tts.train.finetune_cli:main"
62
+ "f5-tts_finetune-gradio" = "f5_tts.train.finetune_gradio:main"
ruff.toml ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ line-length = 120
2
+ target-version = "py310"
3
+
4
+ [lint]
5
+ # Treat only variables whose names start with "_" as dummy (intentionally unused) variables.
6
+ dummy-variable-rgx = "^_.*$"
7
+
8
+ [lint.isort]
9
+ force-single-line = true
10
+ lines-after-imports = 2