1 an în urmă · 2110c89993
--- a/.gitignore
+++ b/.gitignore
@@ -147,3 +147,4 @@ seamless_communication
 
				 !*/seamless_communication
			
 
				 m4t_scripts
			
 
				 /ggml/test_data/
			
 
				+/ggml/dot/
			
--- a/ggml/requirements.txt
+++ b/ggml/requirements.txt
@@ -4,4 +4,5 @@ sentencepiece==0.1.98
 
				 torch==2.0.1
			
 
				 torchaudio==2.0.2
			
 
				 torchvision==0.15.2
			
 
				-transformers==4.29.2
			
 
				+transformers==4.29.2
			
 
				+func_argparse
			
--- a/ggml/test_unity_cpp.py
+++ b/ggml/test_unity_cpp.py
@@ -6,27 +6,27 @@
 
				 
			
 
				 import ctypes
			
 
				 import functools
			
 
				+import shutil
			
 
				 from ctypes import c_void_p
			
 
				 from pathlib import Path
			
 
				-from typing import Any, Iterator, List, Tuple
			
 
				-
			
 
				-import ggml
			
 
				+from typing import Any, Iterator, Tuple
			
 
				 
			
 
				 import fairseq2.nn
			
 
				 import fairseq2.nn.transformer
			
 
				 import numpy as np
			
 
				 import pytest
			
 
				+import requests  # type: ignore
			
 
				 import torch
			
 
				-import torchaudio
			
 
				+import torchaudio  # type: ignore
			
 
				+from ctypes_utils import NULLPTR, Ptr
			
 
				 from fairseq2.data.audio import WaveformToFbankConverter
			
 
				-from seamless_communication.inference.generator import SequenceGeneratorOptions
			
 
				 from fairseq2.models.wav2vec2.feature_extractor import Wav2Vec2FbankFeatureExtractor
			
 
				-from seamless_communication.inference.translator import Modality, Translator
			
 
				+from ggml_convert import convert_model, read_layer_config
			
 
				 
			
 
				-from ctypes_utils import NULLPTR, Ptr
			
 
				+import ggml
			
 
				 from ggml import NativeObj
			
 
				-from ggml_convert import convert_model, read_layer_config
			
 
				-import requests
			
 
				+from seamless_communication.inference.generator import SequenceGeneratorOptions
			
 
				+from seamless_communication.inference.translator import Modality, Translator
			
 
				 
			
 
				 Ctx = ggml.ggml_context_p
			
 
				 
			
@@ -57,6 +57,10 @@ def _ctx() -> Iterator[Ctx]:
 
				                 no_alloc=True,
			
 
				             )
			
 
				         )
			
 
				+
			
 
				+        # Create 'dot' folder for temporary dump of ggml graphs
			
 
				+        (Path(__file__).parent / "dot").mkdir(exist_ok=True)
			
 
				+
			
 
				         with torch.inference_mode():
			
 
				             yield ctx
			
 
				     finally:
			
@@ -88,6 +92,7 @@ def load_pt_model() -> Any:
 
				 
			
 
				 
			
 
				 def download_sample_audio() -> Any:
			
 
				+    Path(DATA).mkdir(exist_ok=True)
			
 
				     response = requests.get(TEST_AUDIO_SAMPLE_URL, stream=True)
			
 
				     with open(DATA / "LJ037-0171_sr16k.wav", "wb") as file:
			
 
				         for chunk in response.iter_content(chunk_size=1024):
			
@@ -159,7 +164,7 @@ def test_Linear_forward(ctx: Ctx, g_model: c_void_p) -> None:
 
				     y_exp = pt_model.text_encoder.layers[0].ffn.inner_proj(x).numpy()
			
 
				     gx = ggml.from_numpy(ctx, x)
			
 
				     gy = ggml.forward("Linear", g_model, "text_encoder.layers.0.ffn.inner_proj", gx)
			
 
				-    gf = ggml.build_and_compute(ctx, gy, dump="dot/test_Linear_forward.dot")
			
 
				+    ggml.build_and_compute(ctx, gy, dump="dot/test_Linear_forward.dot")
			
 
				 
			
 
				     y = ggml.to_numpy(gy)
			
 
				     assert np.allclose(y_exp, y, atol=1e-5)
			
@@ -592,7 +597,7 @@ def test_PositionalEmbedding_forward_with_cache(ctx: Ctx, g_model: c_void_p) ->
 
				                 "text_decoder_frontend.pos_encoder",
			
 
				                 gseq,
			
 
				             )
			
 
				-            gf = ggml.build_and_compute(ctx, gy, dump=t == 1)
			
 
				+            ggml.build_and_compute(ctx, gy, dump=t == 1)
			
 
				             y = ggml.to_numpy(gy)
			
 
				 
			
 
				             y_exp = pos_encoder(seq[:, t : t + 1, :], None, state_bag=state_bag).numpy()