This commit is contained in:
enhuiz 2023-01-13 01:04:48 +08:00
parent 1903d7bb4e
commit 02ed659d2b

View File

@@ -1,5 +1,3 @@
![Image from VALL-E paper.](https://valle-demo.github.io/pics/Overview.jpg)
# VALL-E
An unofficial PyTorch implementation of [VALL-E](https://valle-demo.github.io/), based on the [EnCodec](https://github.com/facebookresearch/encodec) tokenizer.
@@ -50,7 +48,7 @@ python -m vall_e.train yaml=config/your_data/ar_or_nar.yml
## Citations
-```
+```bibtex
@article{wang2023neural,
title={Neural Codec Language Models are Zero-Shot Text to Speech Synthesizers},
author={Wang, Chengyi and Chen, Sanyuan and Wu, Yu and Zhang, Ziqiang and Zhou, Long and Liu, Shujie and Chen, Zhuo and Liu, Yanqing and Wang, Huaming and Li, Jinyu and others},
@@ -59,7 +57,7 @@ python -m vall_e.train yaml=config/your_data/ar_or_nar.yml
}
```
-```
+```bibtex
@article{defossez2022highfi,
title={High Fidelity Neural Audio Compression},
author={Défossez, Alexandre and Copet, Jade and Synnaeve, Gabriel and Adi, Yossi},