under bark, properly use transcribed audio if the audio wasn't actually sliced (oops)

2023-07-11 14:53:32 +00:00 · 2023-07-11 14:53:32 +00:00 · e2a6dc1c0a
commit e2a6dc1c0a
parent a325496661
1 changed files with 24 additions and 1 deletions
--- a/src/utils.py
+++ b/src/utils.py
@ -192,13 +192,36 @@ if BARK_ENABLED:
 			candidates = []
 			for file in transcriptions:
 				result = transcriptions[file]
+				added = 0
+
 				for segment in result['segments']:
+					path = file.replace(".wav", f"_{pad(segment['id'], 4)}.wav")
+					# check if the slice actually exists
+					if not os.path.exists(f'./training/{voice}/audio/{path}'):
+						continue
+
 					entry = (
-						file.replace(".wav", f"_{pad(segment['id'], 4)}.wav"),
+						path,
 						segment['end'] - segment['start'],
 						segment['text']
 					)
 					candidates.append(entry)
+					added = added + 1
+
+				# if nothing got added (assuming because nothign was sliced), use the master file
+				if added == 0: # added < len(result['segments']):
+					start = 0
+					end = 0
+					for segment in result['segments']:
+						start = max( start, segment['start'] )
+						end = max( end, segment['end'] )
+
+					entry = (
+						file,
+						end - start,
+						result['text']
+					)
+					candidates.append(entry)

 			candidates.sort(key=lambda x: x[1])
 			candidate = random.choice(candidates)