drewThomasson committed on
Commit
a58e968
·
verified ·
1 Parent(s): 7c8f8d8

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +4 -0
app.py CHANGED
@@ -576,6 +576,8 @@ def convert_chapters_to_audio_custom_model(chapters_dir, output_audio_dir, targe
576
  print(f"Generating fragment: {fragment}...")
577
  fragment_file_path = os.path.join(temp_audio_directory, f"{temp_count}.wav")
578
  if custom_model:
 
 
579
  out = model.inference(fragment, language, gpt_cond_latent, speaker_embedding, temperature=0.7)
580
  torchaudio.save(fragment_file_path, torch.tensor(out["wav"]).unsqueeze(0), 24000)
581
  else:
@@ -624,6 +626,8 @@ def convert_chapters_to_audio_standard_model(chapters_dir, output_audio_dir, tar
624
  fragment_file_path = os.path.join(temp_audio_directory, f"{temp_count}.wav")
625
  speaker_wav_path = target_voice_path if target_voice_path else default_target_voice_path
626
  language_code = language if language else default_language_code
 
 
627
  tts.tts_to_file(text=fragment, file_path=fragment_file_path, speaker_wav=speaker_wav_path, language=language_code)
628
  temp_count += 1
629
 
 
576
  print(f"Generating fragment: {fragment}...")
577
  fragment_file_path = os.path.join(temp_audio_directory, f"{temp_count}.wav")
578
  if custom_model:
579
+ print(f"The TTS language code given is: {language}")
580
+ print(f"The TTS text chunk is: {fragment} ")
581
  out = model.inference(fragment, language, gpt_cond_latent, speaker_embedding, temperature=0.7)
582
  torchaudio.save(fragment_file_path, torch.tensor(out["wav"]).unsqueeze(0), 24000)
583
  else:
 
626
  fragment_file_path = os.path.join(temp_audio_directory, f"{temp_count}.wav")
627
  speaker_wav_path = target_voice_path if target_voice_path else default_target_voice_path
628
  language_code = language if language else default_language_code
629
+ print(f"The TTS language code given is: {language_code}")
630
+ print(f"The TTS text chunk is: {fragment} ")
631
  tts.tts_to_file(text=fragment, file_path=fragment_file_path, speaker_wav=speaker_wav_path, language=language_code)
632
  temp_count += 1
633