1 year ago · b6dd699bd6
--- a/ChatTTS/Dockerfile.cpu
+++ b/ChatTTS/Dockerfile.cpu
@@ -0,0 +1,7 @@
 
															+FROM pytorch/torchserve:0.11.0-cpu AS builder
														
 
															+# Application files live under /app; docker-compose.cpu.yaml bind-mounts the project over this path.
														
 
															+WORKDIR /app
														
 
															+# NOTE(review): the whole context is copied before installing, so any source change re-runs pip install.
														
 
															+COPY . ./
														
 
															+# --no-cache-dir keeps pip's download cache out of the layer; -i selects the Tsinghua PyPI mirror.
														
 
															+RUN pip install --no-cache-dir -r requirements.txt -i https://pypi.tuna.tsinghua.edu.cn/simple
														
--- a/ChatTTS/README.md
+++ b/ChatTTS/README.md
@@ -0,0 +1,10 @@
 
															+# ChatTTS
														
 
															+
														
 
															+文本转语音
														
 
															+
														
 
															+
														
 
															+
														
 
															+
														
 
															+
														
 
															+[2noise/ChatTTS: A generative speech model for daily dialogue.](https://github.com/2noise/ChatTTS)
														
 
															+
														
--- a/ChatTTS/docker-compose.cpu.yaml
+++ b/ChatTTS/docker-compose.cpu.yaml
@@ -0,0 +1,16 @@
 
															+services:
														
 
															+  chat-tts-ui:  # ChatTTS web UI, built from the CPU Dockerfile
														
 
															+    build:
														
 
															+      context: .
														
 
															+      dockerfile: Dockerfile.cpu
														
 
															+    container_name: chat-tts-ui
														
 
															+    restart: always
														
 
															+    volumes:
														
 
															+      - "./:/app"  # bind-mounts this directory over the image's /app
														
 
															+    ports:
														
 
															+      - "9966:9966"  # quoted so YAML always reads the mapping as a string
														
 
															+    user: "${UID:-1000}:${GID:-1000}"  # falls back to 1000:1000 when UID/GID are not set in the environment
														
 
															+    environment:
														
 
															+      LOG_LEVEL: DEBUG
														
 
															+      WEB_ADDRESS: 0.0.0.0:9966  # port matches the published mapping above
														
 
															+    command: python3 app.py
														
--- a/README.md
+++ b/README.md
@@ -1,2 +1,57 @@
 
															 # TTS
														
 
															+文字转语音，语音clone
														
 
															+
														
 
															+
														
 
															+
														
 
															+## XTTS
														
 
															+
														
 
															+
														
 
															+
														
 
															+## VoiceCraft2
														
 
															+
														
 
															+语音编辑和零样本文本转语音（TTS），包括有声书、互联网视频和播客。VoiceCraft只需要几秒钟的参考语音就能克隆声音。
														
 
															+
														
 
															+<https://github.com/jasonppy/VoiceCraft>
														
 
															+
														
 
															+
														
 
															+
														
 
															+## ChatTTS
														
 
															+
														
 
															+<https://github.com/2noise/ChatTTS>
														
 
															+
														
 
															+[2Noise/ChatTTS · Hugging Face](https://huggingface.co/2Noise/ChatTTS)
														
 
															+
														
 
															+
														
 
															+
														
 
															+## TTS
														
 
															+
														
 
															+
														
 
															+
														
 
															+ <https://github.com/coqui-ai/TTS>
														
 
															+
														
 
															+
														
 
															+
														
 
															+## GPT-SoVITS
														
 
															+
														
 
															+
														
 
															+
														
 
															+[RVC-Boss/GPT-SoVITS: 1 min voice data can also be used to train a good TTS model! (few shot voice cloning)](https://github.com/RVC-Boss/GPT-SoVITS)
														
 
															+
														
 
															+
														
 
															+
														
 
															+[GPT-SoVITS · Studios](https://www.modelscope.cn/studios/xzjosh/GPT-SoVITS/)
														
 
															+
														
 
															+
														
 
															+
														
 
															+
														
 
															+
														
 
															+## Reference
														
 
															+
														
 
															+
														
 
															+
														
 
															+https://fish.audio/zh-CN/
														
 
															+
														
 
															+
														
 
															+
														
 
															+[ChatTTS: Text-to-Speech For Chat](https://chattts.com/)
														
--- a/VoiceCraft/README.md
+++ b/VoiceCraft/README.md
@@ -0,0 +1,67 @@
 
															+# VoiceCraft
														
 
															+语音编辑和零样本文本转语音（TTS），包括有声书、互联网视频和播客。VoiceCraft只需要几秒钟的参考语音就能克隆声音。
														
 
															+
														
 
															+## Usage
														
 
															+
														
 
															+项目：
														
 
															+https://github.com/jasonppy/VoiceCraft
														
 
															+
														
 
															+模型：
														
 
															+https://huggingface.co/pyp1/VoiceCraft/tree/main
														
 
															+
														
 
															+演示页面:
														
 
															+https://jasonppy.github.io/VoiceCraft_web/
														
 
															+
														
 
															+```bash
														
 
															+conda create -n voicecraft python=3.9.16
														
 
															+conda activate voicecraft
														
 
															+
														
 
															+pip install -e git+https://github.com/facebookresearch/audiocraft.git@c5157b5bf14bf83449c17ea1eeb66c19fb4bc7f0#egg=audiocraft
														
 
															+pip install xformers==0.0.22
														
 
															+pip install torchaudio==2.0.2 torch==2.0.1 # this assumes your system is compatible with CUDA 11.7, otherwise checkout https://pytorch.org/get-started/previous-versions/#v201
														
 
															+apt-get install ffmpeg # if you don't already have ffmpeg installed
														
 
															+apt-get install espeak-ng # backend for the phonemizer installed below
														
 
															+pip install tensorboard==2.16.2
														
 
															+pip install phonemizer==3.2.1
														
 
															+pip install datasets==2.16.0
														
 
															+pip install torchmetrics==0.11.1
														
 
															+# install MFA for getting forced-alignment, this could take a few minutes
														
 
															+conda install -c conda-forge montreal-forced-aligner=2.2.17 openfst=1.8.2 kaldi=5.5.1068
														
 
															+# conda install pocl # the command above gives a warning about installing pocl; not sure if this is really needed
														
 
															+
														
 
															+# to run ipynb
														
 
															+conda install -n voicecraft ipykernel --no-deps --force-reinstall
														
 
															+
														
 
															+
														
 
															+
														
 
															+# 1. clone the repo in a directory on a drive with plenty of free space
														
 
															+git clone git@github.com:jasonppy/VoiceCraft.git
														
 
															+cd VoiceCraft
														
 
															+
														
 
															+# 2. assumes you have docker installed with the nvidia container-toolkit (windows has this built into the driver)
														
 
															+# https://docs.nvidia.com/datacenter/cloud-native/container-toolkit/1.13.5/install-guide.html
														
 
															+# sudo apt-get install -y nvidia-container-toolkit-base || yay -Syu nvidia-container-toolkit || echo etc...
														
 
															+
														
 
															+# 3. Try to start an existing container otherwise create a new one passing in all GPUs
														
 
															+./start-jupyter.sh  # linux
														
 
															+start-jupyter.bat   # windows
														
 
															+
														
 
															+# 4. now open a webpage on the host box to the URL shown at the bottom of:
														
 
															+docker logs jupyter
														
 
															+
														
 
															+# 5. optionally look inside from another terminal
														
 
															+docker exec -it jupyter /bin/bash
														
 
															+export USER=(your_linux_username_used_above)
														
 
															+export HOME=/home/$USER
														
 
															+sudo apt-get update
														
 
															+
														
 
															+# 6. confirm video card(s) are visible inside container
														
 
															+nvidia-smi
														
 
															+
														
 
															+# 7. Now in browser, open inference_tts.ipynb and work through one cell at a time
														
 
															+echo GOOD LUCK
														
 
															+```
														
 
															+
														
 
															+推理和训练：
														
 
															+
														
 
															+查看inference_speech_editing.ipynb和inference_tts.ipynb。