Skip to content

Commit

Permalink
Update README.md
Browse files Browse the repository at this point in the history
  • Loading branch information
MaxMax2016 committed Sep 16, 2022
1 parent 902ff61 commit f5ba74b
Showing 1 changed file with 47 additions and 46 deletions.
93 changes: 47 additions & 46 deletions README.md
Original file line number Diff line number Diff line change
Expand Up @@ -6,77 +6,78 @@ https://github.com/mozilla/TTS/tree/master/TTS/speaker_encoder

pip install coqpit

# download model,or get it at **release**
# download the model:
https://github.com/mozilla/TTS/wiki/Released-Models

Speaker-Encoder by @mueller91 LibriTTS + VCTK + VoxCeleb + CommonVoice

# please read the config
https://drive.google.com/drive/folders/15oeBYf6Qn1edONkVLXe82MzdIi3O_9m3

Or get it from the release page: **saved_models.zip**

# usage
python vi_speaker_single.py ./saved_models/best_model.pth.tar ./saved_models/config.json -s TEST.wav -t TEST.npy

# batch use
python vi_speaker_batch.py ./saved_models/best_model.pth.tar ./saved_models/config.json ./data/waves ./speaker_embedding

data/
└── waves
data/
└── waves
├── spk1
│   ├── 000002.wav
│   ├── 000006.wav
│   └── 000038.wav
└── spk2
    ├── 000040.wav
    ├── 000044.wav
    └── 000077.wav

speaker_embedding/
├── spk1
│   ├── 000002.wav
│   ├── 000006.wav
│   └── 000038.wav
│   ├── 000002.npy
│   ├── 000006.npy
│   └── 000038.npy
└── spk2
    ├── 000040.wav
    ├── 000044.wav
    └── 000077.wav

speaker_embedding/
├── spk1
│   ├── 000002.npy
│   ├── 000006.npy
│   └── 000038.npy
└── spk2
    ├── 000040.npy
    ├── 000044.npy
    └── 000077.npy
    ├── 000040.npy
    ├── 000044.npy
    └── 000077.npy

# compute speaker center
input path = speaker_embedding, output path = speaker_embedding_center

python vi_speaker_center.py

speaker_embedding_center/
├── spk1.npy
└── spk2.npy
speaker_embedding_center/
├── spk1.npy
└── spk2.npy


# for VI-SVC
mv speaker_embedding_center data/spkid

data/
├── waves
│   ├── 10001
│   ├── 20400
│   │   ├── 20400_001.wav
│   │   ├── 20456_019.wav
│   │  
├── phone
│   ├── 10001
│   ├── 20400
│   │   ├── 20400_001.npy
│   │   ├── 20456_019.npy
│   │  
├── lable
│   ├── 10001
│   ├── 20400
│   │   ├── 20400_001.npy
│   │   ├── 20456_019.npy
│   │  
├── spkid
│   ├── 10001.npy
│   ├── 20400.npy
│   │  
data/
├── waves
│   ├── 10001
│   ├── 20400
│   │   ├── 20400_001.wav
│   │   ├── 20456_019.wav
│   │  
├── phone
│   ├── 10001
│   ├── 20400
│   │   ├── 20400_001.npy
│   │   ├── 20456_019.npy
│   │  
├── lable
│   ├── 10001
│   ├── 20400
│   │   ├── 20400_001.npy
│   │   ├── 20456_019.npy
│   │  
├── spkid
│   ├── 10001.npy
│   ├── 20400.npy
│   │  



0 comments on commit f5ba74b

Please sign in to comment.