Kaynağa Gözat

Fix potential issue with downloading Gigaspeech (#458)

Alisamar Husain 1 yıl önce
ebeveyn
işleme
0b89c34ecc

+ 1 - 1
src/seamless_communication/cli/m4t/finetune/dataset.py

@@ -158,7 +158,7 @@ def download_fleurs(
 
 
 def download_gigaspeech(subset: str, huggingface_token: str, save_directory: str):
-    ds = load_dataset("speechcolab/gigaspeech", subset, cache_dir=f"gigaspeech/{subset}", token=huggingface_token)
+    ds = load_dataset("speechcolab/gigaspeech", subset, cache_dir=save_directory, token=huggingface_token)
     for split in ds:
         manifest_path = os.path.join(save_directory, f"{subset}_{split}_manifest.json")
         logger.info(f"Preparing {split} split...")