2 роки тому · d6425f84b3
--- a/ggml/examples/unity/convert-pt-to-ggml.py
+++ b/ggml/examples/unity/convert-pt-to-ggml.py
@@ -1,22 +1,23 @@
 
															 # Convert UnitY model from PyTorch to ggml format
														
 
															 #
														
 
															 # Usage: python3.8 /private/home/dnn/ggml/ggml/examples/unity/convert-pt-to-ggml.py /large_experiments/seamless/ust/dnn/unity_large_audio_enc.pt /private/home/dnn/ggml/ggml/examples/unity/models/unity-large
														
 
															-# 
														
 
															+#
														
 
															 import io
														
 
															-import sys
														
 
															 import struct
														
 
															-import torch
														
 
															-import numpy as np
														
 
															+import sys
														
 
															 from pathlib import Path
														
 
															-from convert_pt_states import generate_mapping
														
 
															+import numpy as np
														
 
															+import torch
														
 
															+
														
 
															+from convert_pt_states import generate_mapping
														
 
															 if len(sys.argv) < 3:
														
 
															     print("Usage: convert-pt-to-ggml.py model.pt dir-output [use-f32]\n")
														
 
															     sys.exit(1)
														
 
															-fname_inp   = Path(sys.argv[1])
														
 
															-dir_out     = Path(sys.argv[2])
														
 
															+fname_inp = Path(sys.argv[1])
														
 
															+dir_out = Path(sys.argv[2])
														
 
															 # try to load PyTorch binary data
														
 
															 try:
														
@@ -24,10 +25,17 @@ try:
 
															     with io.BytesIO(model_bytes) as fp:
														
 
															         checkpoint = torch.load(fp, map_location="cpu")
														
 
															 except Exception:
														
 
															-    print("Error: failed to load PyTorch model file:" , fname_inp)
														
 
															+    print("Error: failed to load PyTorch model file:", fname_inp)
														
 
															     sys.exit(1)
														
 
															-hparams = {"n_text_vocab": 256064, "n_audio_enc_dim": 1024, "n_audio_enc_ffn_dim": 4096, "n_audio_enc_feat_dim": 160, "n_audio_enc_layer": 24, "n_audio_enc_head": 16}
														
 
															+hparams = {
														
 
															+    "n_text_vocab": 256064,
														
 
															+    "n_audio_enc_dim": 1024,
														
 
															+    "n_audio_enc_ffn_dim": 4096,
														
 
															+    "n_audio_enc_feat_dim": 160,
														
 
															+    "n_audio_enc_layer": 24,
														
 
															+    "n_audio_enc_head": 16,
														
 
															+}
														
 
															 print("hparams:", hparams)
														
 
															 list_vars = checkpoint["model"]
														
@@ -44,19 +52,27 @@ if len(sys.argv) > 4:
 
															 fout = fname_out.open("wb")
														
 
															-fout.write(struct.pack("i", 0x67676d6c)) # magic: ggml in hex
														
 
															+fout.write(struct.pack("i", 0x67676D6C))  # magic: ggml in hex
														
 
															 for key in hparams.keys():
														
 
															     fout.write(struct.pack("i", hparams[key]))
														
 
															 fout.write(struct.pack("i", use_f16))
														
 
															 exclude_list = []
														
 
															-exclude_list += [f"encoder.w2v_encoder.w2v_model.encoder.layers.{i}.conv_module.batch_norm.num_batches_tracked" for i in range(24)]
														
 
															+exclude_list += [
														
 
															+    f"encoder.w2v_encoder.w2v_model.encoder.layers.{i}.conv_module.batch_norm.num_batches_tracked"
														
 
															+    for i in range(24)
														
 
															+]
														
 
															 for name in list_vars.keys():
														
 
															-    if list_vars[name] is None or name in exclude_list or "adaptor" in name or "mask_emb" in name:
														
 
															+    if (
														
 
															+        list_vars[name] is None
														
 
															+        or name in exclude_list
														
 
															+        or "adaptor" in name
														
 
															+        or "mask_emb" in name
														
 
															+    ):
														
 
															         continue
														
 
															     data = list_vars[name].squeeze().numpy()
														
 
															-    print("Processing variable: " , name ,  " with shape: ", data.shape)
														
 
															+    print("Processing variable: ", name, " with shape: ", data.shape)
														
 
															     n_dims = len(data.shape)
														
@@ -68,12 +84,12 @@ for name in list_vars.keys():
 
															     # if 'pos_bias' in name:
														
 
															     #     import pdb; pdb.set_trace()
														
 
															     #     print(data.shape)
														
 
															-    str_ = state_map[name].encode('utf-8')
														
 
															+    str_ = state_map[name].encode("utf-8")
														
 
															     fout.write(struct.pack("iii", n_dims, len(str_), ftype))
														
 
															     for i in range(n_dims):
														
 
															-        if '.layer_norm.weight' in name:
														
 
															+        if ".layer_norm.weight" in name:
														
 
															             print(data.shape)
														
 
															-        fout.write(struct.pack("i", data.shape[n_dims-1-i]))
														
 
															+        fout.write(struct.pack("i", data.shape[n_dims - 1 - i]))
														
 
															     fout.write(str_)
														
 
															     # data
														
@@ -81,6 +97,5 @@ for name in list_vars.keys():
 
															 fout.close()
														
 
															-print("Done. Output file: " , fname_out)
														
 
															+print("Done. Output file: ", fname_out)
														
 
															 print("")
														
 
															-
														
--- a/ggml/examples/unity/convert_pt_states.py
+++ b/ggml/examples/unity/convert_pt_states.py
@@ -1,37 +1,46 @@
 
															 import torch
														
 
															+
														
 
															+
														
 
															 def map_state_key(pytorch_key, layer_idx=None):
														
 
															     # Replace the layer index first
														
 
															     if layer_idx is not None:
														
 
															         pytorch_key = pytorch_key.replace(f".layers.{layer_idx}.", "/")
														
 
															-    
														
 
															+
														
 
															     # Replace common patterns in the state key
														
 
															     translation_dict = {
														
 
															         ".weight": "/w",
														
 
															         ".bias": "/b",
														
 
															-        ".running_mean": "/m", # /running_mean doesn't work
														
 
															+        ".running_mean": "/m",  # /running_mean doesn't work
														
 
															         ".running_var": "/v",
														
 
															         ".num_batches_tracked": "/n",
														
 
															         "self_attn.": "self_attn_",
														
 
															         "conv_module.": "conv_",
														
 
															         "ffn1.": "ffn1_",
														
 
															         "ffn2.": "ffn2_",
														
 
															-        "pos_conv.0": "pos_conv"
														
 
															+        "pos_conv.0": "pos_conv",
														
 
															     }
														
 
															-    
														
 
															-    
														
 
															+
														
 
															     # Special mapping for pos_bias_u and pos_bias_v
														
 
															     if "self_attn.pos_bias_u" in pytorch_key:
														
 
															-        pytorch_key = pytorch_key.replace("self_attn.pos_bias_u", "self_attn_pos_bias/u")
														
 
															+        pytorch_key = pytorch_key.replace(
														
 
															+            "self_attn.pos_bias_u", "self_attn_pos_bias/u"
														
 
															+        )
														
 
															     elif "self_attn.pos_bias_v" in pytorch_key:
														
 
															-        pytorch_key = pytorch_key.replace("self_attn.pos_bias_v", "self_attn_pos_bias/v")
														
 
															+        pytorch_key = pytorch_key.replace(
														
 
															+            "self_attn.pos_bias_v", "self_attn_pos_bias/v"
														
 
															+        )
														
 
															     for pytorch_pattern, model_pattern in translation_dict.items():
														
 
															         pytorch_key = pytorch_key.replace(pytorch_pattern, model_pattern)
														
 
															-    
														
 
															+
														
 
															     # Replace the leading pattern and add layer index
														
 
															     if layer_idx is not None:
														
 
															-        pytorch_key = pytorch_key.replace("encoder.w2v_encoder.w2v_model.encoder/", f"model/enc/h{layer_idx}/")
														
 
															+        pytorch_key = pytorch_key.replace(
														
 
															+            "encoder.w2v_encoder.w2v_model.encoder/", f"model/enc/h{layer_idx}/"
														
 
															+        )
														
 
															     else:
														
 
															-        pytorch_key = pytorch_key.replace("encoder.w2v_encoder.w2v_model.encoder.", f"model/enc/")
														
 
															+        pytorch_key = pytorch_key.replace(
														
 
															+            "encoder.w2v_encoder.w2v_model.encoder.", f"model/enc/"
														
 
															+        )
														
 
															     pytorch_key = pytorch_key.replace("encoder.w2v_encoder.w2v_model.", f"model/")
														
 
															     return pytorch_key
														
@@ -49,12 +58,12 @@ def generate_mapping(state_dict):
 
															 # Testing
														
 
															-ckpt = torch.load('/large_experiments/seamless/ust/dnn/unity_large_audio_enc.pt')
														
 
															+ckpt = torch.load("/large_experiments/seamless/ust/dnn/unity_large_audio_enc.pt")
														
 
															 state_dict = {}
														
 
															-for key in ckpt['model']:
														
 
															-    if ckpt['model'][key] is not None:
														
 
															-        state_dict[key] = ckpt['model'][key]
														
 
															+for key in ckpt["model"]:
														
 
															+    if ckpt["model"][key] is not None:
														
 
															+        state_dict[key] = ckpt["model"][key]
														
 
															 mapped_keys = generate_mapping(state_dict)
														
 
															 for old_key, new_key in mapped_keys.items():
														
 
															-    print(old_key, "=>", new_key)
														
 
															+    print(old_key, "=>", new_key)