forked from camenduru/ai-voice-cloning
added the mysterious tortoise_compat flag mentioned in DLAS repo
This commit is contained in:
parent
3b4f4500d1
commit
b8867a5fb0
2
dlas
2
dlas
|
@ -1 +1 @@
|
||||||
Subproject commit 0ee0f46596158aa1d6b8f95b1e7637785c616ee3
|
Subproject commit 84c8196da5686995e0632a0e0f5539f5549bbdd8
|
|
@ -95,7 +95,7 @@ steps:
|
||||||
networks:
|
networks:
|
||||||
gpt:
|
gpt:
|
||||||
type: generator
|
type: generator
|
||||||
which_model_G: unified_voice2 # none of the unified_voice*.py files actually match the tortoise inference code... 4 and 3 have "alignment_head" (wtf is that?), 2 lacks the types=1 parameter.
|
which_model_G: unified_voice2
|
||||||
kwargs:
|
kwargs:
|
||||||
layers: 30 # originally: 8
|
layers: 30 # originally: 8
|
||||||
model_dim: 1024 # originally: 512
|
model_dim: 1024 # originally: 512
|
||||||
|
@ -112,8 +112,8 @@ networks:
|
||||||
train_solo_embeddings: False # missing in uv3/4
|
train_solo_embeddings: False # missing in uv3/4
|
||||||
use_mel_codes_as_input: True # ditto
|
use_mel_codes_as_input: True # ditto
|
||||||
checkpointing: True
|
checkpointing: True
|
||||||
#types: 1 # this is MISSING, but in my analysis 1 is equivalent to not having it.
|
tortoise_compat: True
|
||||||
#only_alignment_head: False # uv3/4
|
# freeze_everything_but_position_embeddings: True
|
||||||
|
|
||||||
path:
|
path:
|
||||||
strict_load: true
|
strict_load: true
|
||||||
|
|
Loading…
Reference in New Issue
Block a user