Browse Source

dimension increases for pretssel model output (#164)

Yilin Yang 1 year ago
parent
commit
cd280d5245
1 changed file with 1 addition and 1 deletion
  1. 1 1
      src/seamless_communication/streaming/agents/pretssel_vocoder.py

+ 1 - 1
src/seamless_communication/streaming/agents/pretssel_vocoder.py

@@ -95,7 +95,7 @@ class PretsselVocoderAgent(NoUpdateTargetMixin, TextToSpeechAgent):
 
         return WriteAction(
             SpeechSegment(
-                content=wav[0][0].tolist(),
+                content=wav[0][0][0].tolist(),
                 finished=states.source_finished,
                 sample_rate=self.vocoder_sample_rate,
                 tgt_lang=tgt_lang,