Răsfoiți Sursa

_almost_contiguous

Guillaume Wenzek 1 an în urmă
părinte
comite
f7d2c90ceb
2 fișiere modificate cu 41 adăugiri și 11 ștergeri
  1. 25 1
      ggml/ggml.py
  2. 16 10
      ggml/test_ggml_integration.py

+ 25 - 1
ggml/ggml.py

@@ -59,6 +59,11 @@ def nb(tensor: Union[ggml_tensor, ggml_tensor_p]) -> Tuple[int, ...]:
         tensor = tensor.contents
     return tuple([tensor.nb[i] for i in range(4)])
 
+def ne(tensor: Union[ggml_tensor, ggml_tensor_p]) -> Tuple[int, ...]:
+    if isinstance(tensor, ctypes._Pointer):
+        tensor = tensor.contents
+    return tuple([tensor.ne[i] for i in range(4)])
+
 
 def strides(tensor: Union[ggml_tensor, ggml_tensor_p]) -> Tuple[int, ...]:
     if isinstance(tensor, ctypes._Pointer):
@@ -71,7 +76,8 @@ def strides(tensor: Union[ggml_tensor, ggml_tensor_p]) -> Tuple[int, ...]:
 
 def to_numpy(tensor_p: ggml_tensor_p) -> np.ndarray:
     if not ggml_is_contiguous(tensor_p):
-        return _strided_to_numpy(tensor_p)
+        if not _almost_contiguous(tensor_p):
+            return _strided_to_numpy(tensor_p)
     tensor = tensor_p.contents
 
     res = _void_p_to_np_array(tensor.data, shape(tensor), numpy_dtype(tensor.type))
@@ -83,6 +89,24 @@ def to_numpy(tensor_p: ggml_tensor_p) -> np.ndarray:
     return res
 
 
+def _almost_contiguous(tensor_p: ggml_tensor_p) -> bool:
+    """Return True if the tensor is only a permuted (e.g. transposed) view of contiguous memory, False if it is fully strided."""
+    tensor = tensor_p.contents
+    num_bytes = nb(tensor)
+    num_elem = ne(tensor)
+
+    # Sort the axes by their stride ('num_bytes'), smallest first
+    nbe = sorted(zip(num_bytes, num_elem))
+    itemsize = ggml_type_size(tensor.type)
+    stride_exp = itemsize
+    for stride, e in nbe:
+        if stride != stride_exp:
+            return False
+        stride_exp *= e
+
+    return True
+
+
 def _strided_to_numpy(tensor_p: ggml_tensor_p) -> np.ndarray:
     if ggml_is_transposed(tensor_p):
         raise NotImplementedError(

+ 16 - 10
ggml/test_ggml_integration.py

@@ -227,12 +227,7 @@ def test_to_numpy_works_with_transposed(ctx: Ctx) -> None:
     a[...] = np.arange(50).reshape(5, 10).astype(dtype=np.float32)
 
     gat = ggml.ggml_transpose(ctx, ga)
-
-    gf = ggml.ggml_build_forward(ga)
-    ggml.ggml_graph_compute_with_ctx(ctx, ctypes.pointer(gf), 1)
-
     at = ggml.to_numpy(gat)
-
     assert np.allclose(a.T, at)
 
 
@@ -242,19 +237,30 @@ def test_ggml_slice(ctx: Ctx) -> None:
     a[...] = np.arange(50).reshape(5, 10).astype(dtype=np.float32)
 
     gs0 = ggml.ggml_slice(ctx, ga, 0, 3, 7)
-    gf = ggml.ggml_build_forward(ga)
-    ggml.ggml_graph_compute_with_ctx(ctx, ctypes.pointer(gf), 1)
     s0 = ggml.to_numpy(gs0)
-
     assert np.allclose(a[:, 3:7], s0)
 
     gs1 = ggml.ggml_slice(ctx, ga, 1, 2, 5)
-    gf = ggml.ggml_build_forward(ga)
-    ggml.ggml_graph_compute_with_ctx(ctx, ctypes.pointer(gf), 1)
     s1 = ggml.to_numpy(gs1)
     assert np.allclose(a[2:5, :], s1)
 
 
+@pytest.mark.xfail(reason="not implemented")
+def test_ggml_transpose_and_slice(ctx: Ctx) -> None:
+    ga = ggml.ggml_new_tensor_2d(ctx, ggml.GGML_TYPE_F32, 10, 5)
+    a = ggml.to_numpy(ga)
+    a[...] = np.arange(50).reshape(5, 10).astype(dtype=np.float32)
+
+    gat = ggml.ggml_transpose(ctx, ga)
+    gs0 = ggml.ggml_slice(ctx, gat, 0, 2, 5)
+    s0 = ggml.to_numpy(gs0)
+    assert np.allclose(a.T[:, 2:5], s0)
+
+    gs1 = ggml.ggml_slice(ctx, gat, 1, 3, 7)
+    s1 = ggml.to_numpy(gs1)
+    assert np.allclose(a.T[3:7, :], s1)
+
+
 def test_numpy_mul_mat(ctx: Ctx) -> None:
     slen, d_in, d_out = (5, 4, 2)
     # torch.nn and fairseq2.nn assumes (seq_len, dim) to represent inputs,