|
|
@ -1201,6 +1201,10 @@ def prepare_dataset( files, outdir, language=None, skip_existings=False, progres
|
|
|
|
unload_whisper()
|
|
|
|
unload_whisper()
|
|
|
|
|
|
|
|
|
|
|
|
joined = "\n".join(transcription)
|
|
|
|
joined = "\n".join(transcription)
|
|
|
|
|
|
|
|
if not skip_existings:
|
|
|
|
|
|
|
|
with open(f'{outdir}/train.txt', 'w', encoding="utf-8") as f:
|
|
|
|
|
|
|
|
f.write(joined)
|
|
|
|
|
|
|
|
|
|
|
|
return f"Processed dataset to: {outdir}\n{joined}"
|
|
|
|
return f"Processed dataset to: {outdir}\n{joined}"
|
|
|
|
|
|
|
|
|
|
|
|
def calc_iterations( epochs, lines, batch_size ):
|
|
|
|
def calc_iterations( epochs, lines, batch_size ):
|
|
|
|