1
0
Fork 0

some cleanup

master
mrq 2023-03-09 06:20:05 +07:00
parent 5460e191b0
commit 2f6dd9c076
1 changed files with 21 additions and 11 deletions

@ -171,8 +171,14 @@ def read_generate_settings_proxy(file, saveAs='.temp'):
gr.update(visible=j is not None),
)
def prepare_dataset_proxy( voice, language, skip_existings, progress=gr.Progress(track_tqdm=True) ):
return prepare_dataset( get_voices(load_latents=False)[voice], outdir=f"./training/{voice}/", language=language, skip_existings=skip_existings, progress=progress )
def prepare_dataset_proxy( voice, language, validation_size, skip_existings, progress=gr.Progress(track_tqdm=True) ):
messages = []
message = prepare_dataset( get_voices(load_latents=False)[voice], outdir=f"./training/{voice}/", language=language, skip_existings=skip_existings, progress=progress )
messages.append(message)
if validation_size > 0:
message = prepare_validation_dataset( voice, text_length=validation_size )
messages.append(message)
return "\n".join(messages)
def update_args_proxy( *args ):
kwargs = {}
@ -377,14 +383,18 @@ def setup_gradio():
with gr.Tab("Prepare Dataset"):
with gr.Row():
with gr.Column():
dataset_settings = [
gr.Dropdown( choices=voice_list, label="Dataset Source", type="value", value=voice_list[0] if len(voice_list) > 0 else "" ),
gr.Textbox(label="Language", value="en"),
gr.Checkbox(label="Skip Already Transcribed", value=False)
]
transcribe_button = gr.Button(value="Transcribe")
validation_text_cull_size = gr.Number(label="Validation Text Length Cull Size", value=12, precision=0)
prepare_validation_button = gr.Button(value="Prepare Validation")
DATASET_SETTINGS = {}
DATASET_SETTINGS['voice'] = gr.Dropdown( choices=voice_list, label="Dataset Source", type="value", value=voice_list[0] if len(voice_list) > 0 else "" )
with gr.Row():
DATASET_SETTINGS['language'] = gr.Textbox(label="Language", value="en")
DATASET_SETTINGS['validation_size'] = gr.Number(label="Validation Text Length Cull Size", value=12, precision=0)
DATASET_SETTINGS['skip'] = gr.Checkbox(label="Skip Already Transcribed", value=False)
with gr.Row():
transcribe_button = gr.Button(value="Transcribe")
prepare_validation_button = gr.Button(value="Prepare Validation")
dataset_settings = list(DATASET_SETTINGS.values())
with gr.Column():
prepare_dataset_output = gr.TextArea(label="Console Output", interactive=False, max_lines=8)
with gr.Tab("Generate Configuration"):
@ -692,7 +702,7 @@ def setup_gradio():
prepare_validation_dataset,
inputs=[
dataset_settings[0],
validation_text_cull_size,
DATASET_SETTINGS['validation_size'],
],
outputs=prepare_dataset_output #console_output
)