Procházet zdrojové kódy

update paths to s3 (#195)

* update paths to s3

* gated models

* revert unnecessary changes
Ning před 1 rokem
rodič
revize
c287c1a4d1

+ 2 - 2
src/seamless_communication/cards/nar_t2u_aligner.yaml

@@ -5,10 +5,10 @@
 # LICENSE file in the root directory of this source tree.
 
 name: nar_t2u_aligner
-char_tokenizer: "file:///checkpoint/krs/unity2/spm_char_lang38_tc.model"
+char_tokenizer: "https://dl.fbaipublicfiles.com/seamless/models/spm_char_lang38_tc.model"
 model_type: unity2_aligner
 model_arch: nar_t2u_aligner
-checkpoint: "file:///large_experiments/seamless/ust/krs/fairseq2_checkpoints/unity2_aligner.pt"
+checkpoint: "https://dl.fbaipublicfiles.com/seamless/models/unity2_aligner.pt"
 num_units: 10000
 unit_langs:
   - arb

+ 2 - 2
src/seamless_communication/cards/seamlessM4T_v2_large.yaml

@@ -7,8 +7,8 @@
 name: seamlessM4T_v2_large
 base: unity_nllb-100
 model_arch: base_v2
-char_tokenizer: "file:///checkpoint/krs/unity2/spm_char_lang38_tc.model"
-checkpoint: "file:///large_experiments/seamless/ust/krs/fairseq2_checkpoints/seamlessM4T_v2_large.pt"
+char_tokenizer: "https://dl.fbaipublicfiles.com/seamless/models/spm_char_lang38_tc.model"
+checkpoint: "https://dl.fbaipublicfiles.com/seamless/models/seamlessM4T_v2_large.pt"
 num_units: 10000
 unit_langs:
   - arb

+ 2 - 2
src/seamless_communication/cards/seamless_expressivity.yaml

@@ -7,8 +7,8 @@
 name: seamless_expressivity
 base: unity_nllb-100
 model_arch: expressivity_v2
-char_tokenizer: "file:///checkpoint/krs/unity2/spm_char_lang38_tc.model"
-checkpoint: "file:///large_experiments/seamless/workstream/expressivity/oss/checkpoints/m2m_expressive_unity.pt"
+char_tokenizer: "https://dl.fbaipublicfiles.com/seamless/models/spm_char_lang38_tc.model"
+checkpoint: "https://github.com/facebookresearch/seamless_communication;gated=true"
 num_units: 10000
 unit_langs:
   - arb

+ 1 - 1
src/seamless_communication/cards/seamless_streaming_monotonic_decoder.yaml

@@ -7,4 +7,4 @@
 name: seamless_streaming_monotonic_decoder
 model_type: monotonic_decoder
 model_arch: dense_1b
-checkpoint: "file:///large_experiments/seamless/ust/krs/fairseq2_checkpoints/seamless_streaming_monotonic_decoder.pt"
+checkpoint: "https://dl.fbaipublicfiles.com/seamless/models/seamless_streaming_monotonic_decoder.pt"

+ 2 - 2
src/seamless_communication/cards/seamless_streaming_unity.yaml

@@ -7,8 +7,8 @@
 name: seamless_streaming_unity
 base: unity_nllb-100
 model_arch: base_v2
-char_tokenizer: "file:///checkpoint/krs/unity2/spm_char_lang38_tc.model"
-checkpoint: "file:///large_experiments/seamless/ust/krs/fairseq2_checkpoints/seamless_streaming_unity.pt"
+char_tokenizer: "https://dl.fbaipublicfiles.com/seamless/models/spm_char_lang38_tc.model"
+checkpoint: "https://dl.fbaipublicfiles.com/seamless/models/seamless_streaming_unity.pt"
 num_units: 10000
 unit_langs:
   - arb

+ 1 - 1
src/seamless_communication/cards/vocoder_pretssel.yaml

@@ -7,7 +7,7 @@
 name: vocoder_pretssel
 model_type: vocoder_pretssel
 model_arch: 24khz
-checkpoint: "file:///large_experiments/seamless/workstream/expressivity/oss/checkpoints/pretssel_melhifigan_wm-final.pt"
+checkpoint: "https://github.com/facebookresearch/seamless_communication;gated=true"
 sample_rate: 24000
 model_config:
   langs:

+ 1 - 1
src/seamless_communication/cards/vocoder_pretssel_16khz.yaml

@@ -7,7 +7,7 @@
 name: vocoder_pretssel_16khz
 model_type: vocoder_pretssel
 model_arch: 16khz
-checkpoint: "file:///large_experiments/seamless/workstream/expressivity/oss/checkpoints/pretssel_melhifigan_wm-16khz.pt"
+checkpoint: "https://github.com/facebookresearch/seamless_communication;gated=true"
 sample_rate: 16000
 model_config:
   langs:

+ 1 - 1
src/seamless_communication/cards/vocoder_v2.yaml

@@ -7,7 +7,7 @@
 name: vocoder_v2
 model_type: vocoder_code_hifigan
 model_arch: base
-checkpoint: "file:///large_experiments/seamless/ust/krs/fairseq2_checkpoints/vocoder_v2.pt"
+checkpoint: "https://dl.fbaipublicfiles.com/seamless/models/vocoder_v2.pt"
 model_config: {
   "lang_spkr_idx_map": {
       "multilingual": {