forked from mrq/DL-Art-School
fast_paired
This commit is contained in:
parent
1d30d79e34
commit
b6190e96b2
|
@ -37,6 +37,7 @@ class FastPairedVoiceDataset(torch.utils.data.Dataset):
|
||||||
|
|
||||||
In practice, this means two things:
|
In practice, this means two things:
|
||||||
1) Index {i} of this dataset means nothing: fetching from the same index will almost always return different data.
|
1) Index {i} of this dataset means nothing: fetching from the same index will almost always return different data.
|
||||||
|
As a result, this dataset should not be used for validation or test runs.
|
||||||
2) This dataset has a slight bias for items with longer text or longer filenames.
|
2) This dataset has a slight bias for items with longer text or longer filenames.
|
||||||
|
|
||||||
The upshot is that this dataset loads extremely quickly and consumes almost no system memory.
|
The upshot is that this dataset loads extremely quickly and consumes almost no system memory.
|
||||||
|
@ -172,7 +173,7 @@ if __name__ == '__main__':
|
||||||
batch_sz = 16
|
batch_sz = 16
|
||||||
params = {
|
params = {
|
||||||
'mode': 'fast_paired_voice_audio',
|
'mode': 'fast_paired_voice_audio',
|
||||||
'path': ['Y:\\clips\\books1\\transcribed-w2v.tsv'],
|
'path': ['Y:\\libritts\\train-clean-360\\transcribed-w2v.tsv', 'Y:\\clips\\books1\\transcribed-w2v.tsv'],
|
||||||
'phase': 'train',
|
'phase': 'train',
|
||||||
'n_workers': 0,
|
'n_workers': 0,
|
||||||
'batch_size': batch_sz,
|
'batch_size': batch_sz,
|
||||||
|
@ -200,7 +201,7 @@ if __name__ == '__main__':
|
||||||
for i, b in tqdm(enumerate(dl)):
|
for i, b in tqdm(enumerate(dl)):
|
||||||
for ib in range(batch_sz):
|
for ib in range(batch_sz):
|
||||||
print(f'{i} {ib} {b["real_text"][ib]}')
|
print(f'{i} {ib} {b["real_text"][ib]}')
|
||||||
#save(b, i, ib, 'wav')
|
save(b, i, ib, 'wav')
|
||||||
#if i > 5:
|
if i > 5:
|
||||||
# break
|
break
|
||||||
|
|
||||||
|
|
Loading…
Reference in New Issue
Block a user