From b721e395b5b7d41ecd8e4b2858f4c49a456d4ae2 Mon Sep 17 00:00:00 2001 From: mrq Date: Wed, 15 Feb 2023 04:44:14 +0000 Subject: [PATCH] modified conversion scripts to not give a shit about bitrate and formats since torchaudio.load handles all of that anyways, and it all gets resampled anyways --- README.md | 1 + convert/convert.bat | 2 +- convert/convert.sh | 2 +- 3 files changed, 3 insertions(+), 2 deletions(-) mode change 100644 => 100755 convert/convert.sh diff --git a/README.md b/README.md index 478a851..e5c9da2 100755 --- a/README.md +++ b/README.md @@ -195,6 +195,7 @@ You'll be presented with a bunch of options in the default `Generate` tab, but d - this is a very tricky setting to suggest, as there's not necessarily a go-to solution + some samples seem to work best if it's just one whole chunk + other voices seem to work better if i split it up more + + I'm *very* sure the best way to go about it is for it to compute latents per sentence, then average, but that's tedious. - the best advice is to just play around with it a bit; pick the lowest chunk size you can make, and if a voice doesn't quite replicate right, increase the chunk count. * `(Re)Compute Voice Latents`: regenerates a voice's cached latents. diff --git a/convert/convert.bat b/convert/convert.bat index adb1742..4ccfd61 100755 --- a/convert/convert.bat +++ b/convert/convert.bat @@ -1,4 +1,4 @@ @echo off rm .\in\.gitkeep rm .\out\.gitkeep -for %%a in (".\in\*.*") do ffmpeg -i "%%a" -ar 22050 -ac 1 -c:a pcm_f32le ".\out\%%~na.wav" \ No newline at end of file +for %%a in (".\in\*.*") do ffmpeg -i "%%a" -ac 1 ".\out\%%~na.wav" \ No newline at end of file diff --git a/convert/convert.sh b/convert/convert.sh old mode 100644 new mode 100755 index f1e4092..24a29c0 --- a/convert/convert.sh +++ b/convert/convert.sh @@ -1 +1 @@ -for a in $(find "in/" -maxdepth 1 -not -name '.gitkeep' -type f); do ffmpeg -i "$a" -ar 22050 -ac 1 -c:a pcm_f32le "out/$(basename $a).wav"; done \ No newline at end of file +for a in $(find "in/" -maxdepth 1 -not -name '.gitkeep' -type f); do ffmpeg -i "$a" -ac 1 "out/$(basename $a).wav"; done \ No newline at end of file