Skip to content

Commit 9c024b0

Browse files
author
nonstoptimm
committed
bug fix for transcription
1 parent 891903a commit 9c024b0

File tree

2 files changed

+4
-3
lines changed

2 files changed

+4
-3
lines changed

src/glue.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -76,7 +76,7 @@
76 76
logging.info('[INFO] - Starting with speech-to-text conversion')
77 77
stt_results = stt.main(f'{audio_files}/', f'{output_folder}/{case}')
78 78
df_transcription = pd.DataFrame(list(stt_results), columns=['audio', 'rec'])
79-
logging.debug(transcription)
79+
logging.debug(df_transcription)
80 80
df_transcription.to_csv(f'{output_folder}/{case}/stt_transcriptions.txt', sep = '\t', header = None, index=False)
81 81
# Merge reference transcriptions with recognition on audio file names
82 82
if 'audio' in list(df_reference.columns):

src/tts.py

Lines changed: 3 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -181,8 +181,9 @@ def main(df, output_directory, custom=True, telephone=True):
181 181
fname = "nan"
182 182
audio_synth.append(fname)
183 183
df['audio_synth'] = audio_synth
184-
df['text_clean'] = df.text.apply(remove_tags)
184+
df['text_ssml'] = df['text'].copy()
185+
df['text'] = df['text_ssml'].apply(remove_tags)
185 186
return df
186 187

187 188
if __name__ == '__main__':
188-
main(pd.DataFrame({'text': ['Ich möchte diesen Teppicht nicht kaufen', 'Was geht los da rein?']}), "output/test")
189+
main(pd.DataFrame({'text': ['This is a test', 'And this is another test!']}), "output/test")

0 commit comments

Comments
 (0)