Feature: support baichuan serial models, by now, including Baichuan-7… by jameswu2014 · Pull Request #3009 · ggml-org/llama.cpp

Merged · 9 commits · Sep 14, 2023
fix W_pack for-loop
jameswu2014 committed Sep 11, 2023
commit 306d71be42f5cbac0208d17720b8161a90d7f836
convert-baichuan-hf-to-gguf.py: 1 addition & 1 deletion
@@ -232,7 +232,7 @@ def parse_args() -> argparse.Namespace:
     model_part = torch.load(f"{dir_model}/{part_name}", map_location="cpu")

     tmp=model_part
-    for i in itertools.count():
+    for i in range(block_count):
         if f"model.layers.{i}.self_attn.W_pack.weight" in model_part:
             print(f"Unpacking and permuting layer {i}")
             tmp[f"model.layers.{i}.self_attn.q_proj.weight"]=reverse_hf_permute_part(model_part[f"model.layers.{i}.self_attn.W_pack.weight"],0,head_count,head_count)
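For context on the fix: itertools.count() yields 0, 1, 2, … without end, so once i passed the model's last layer, the W_pack membership test never matched again and the loop spun forever. Bounding the iteration with range(block_count) ties it to the model's actual layer count. Below is a minimal sketch of the unpacking logic under this fix; split_w_pack and unpack_layers are hypothetical helpers for illustration (block_count and model_part mirror names from the script), and the sketch omits the reverse HF permutation that the real converter applies via reverse_hf_permute_part before writing GGUF.

import torch

def split_w_pack(w_pack: torch.Tensor) -> tuple[torch.Tensor, torch.Tensor, torch.Tensor]:
    # Baichuan fuses the q, k and v projection weights into a single
    # W_pack tensor stacked along dim 0, so each projection is one
    # third of its rows.
    n = w_pack.shape[0] // 3
    return w_pack[:n], w_pack[n:2 * n], w_pack[2 * n:]

def unpack_layers(model_part: dict, block_count: int) -> None:
    # range(block_count) is bounded by the layer count; the previous
    # itertools.count() version never terminated, because past the last
    # layer the membership test below was always false and the loop
    # had no other exit.
    for i in range(block_count):
        key = f"model.layers.{i}.self_attn.W_pack.weight"
        if key in model_part:
            q, k, v = split_w_pack(model_part[key])
            model_part[f"model.layers.{i}.self_attn.q_proj.weight"] = q
            model_part[f"model.layers.{i}.self_attn.k_proj.weight"] = k
            model_part[f"model.layers.{i}.self_attn.v_proj.weight"] = v
            del model_part[key]

A guard only against missing keys (the if test) is still useful with the bounded loop, since sharded checkpoints may not contain every layer in every part file.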