Эх сурвалжийг харах

dimension increases for pretssel model output (#164)

Yilin Yang 1 жил өмнө
parent
commit
cd280d5245

+ 1 - 1
src/seamless_communication/streaming/agents/pretssel_vocoder.py

@@ -95,7 +95,7 @@ class PretsselVocoderAgent(NoUpdateTargetMixin, TextToSpeechAgent):
 
         return WriteAction(
             SpeechSegment(
-                content=wav[0][0].tolist(),
+                content=wav[0][0][0].tolist(),
                 finished=states.source_finished,
                 sample_rate=self.vocoder_sample_rate,
                 tgt_lang=tgt_lang,