forked from mrq/tortoise-tts
read.py combines all candidates
If candidates where greater than 1 on in read.py, only the fist candidate clips would be combined. This adds a bit of code to make a combined file for every candidate.
This commit is contained in:
parent
480f7e37d9
commit
2477a4f763
|
@ -72,6 +72,7 @@ if __name__ == '__main__':
|
||||||
gen = gen[0].squeeze(0).cpu()
|
gen = gen[0].squeeze(0).cpu()
|
||||||
all_parts.append(gen)
|
all_parts.append(gen)
|
||||||
|
|
||||||
|
if args.candidates == 1:
|
||||||
full_audio = torch.cat(all_parts, dim=-1)
|
full_audio = torch.cat(all_parts, dim=-1)
|
||||||
torchaudio.save(os.path.join(voice_outpath, 'combined.wav'), full_audio, 24000)
|
torchaudio.save(os.path.join(voice_outpath, 'combined.wav'), full_audio, 24000)
|
||||||
|
|
||||||
|
@ -80,3 +81,13 @@ if __name__ == '__main__':
|
||||||
dbg_state = (seed, texts, voice_samples, conditioning_latents)
|
dbg_state = (seed, texts, voice_samples, conditioning_latents)
|
||||||
torch.save(dbg_state, f'debug_states/read_debug_{selected_voice}.pth')
|
torch.save(dbg_state, f'debug_states/read_debug_{selected_voice}.pth')
|
||||||
|
|
||||||
|
# Combine each candidate's audio clips.
|
||||||
|
if args.candidates > 1:
|
||||||
|
audio_clips = []
|
||||||
|
for candidate in range(args.candidates):
|
||||||
|
for line in range(len(texts)):
|
||||||
|
wav_file = os.path.join(voice_outpath, str(line), f"{candidate}.wav")
|
||||||
|
audio_clips.append(load_audio(wav_file, 24000))
|
||||||
|
audio_clips = torch.cat(audio_clips, dim=-1)
|
||||||
|
torchaudio.save(os.path.join(voice_outpath, f"combined_{candidate:02d}.wav"), audio_clips, 24000)
|
||||||
|
audio_clips = []
|
Loading…
Reference in New Issue
Block a user