Fix missing head_dim in llama config from gguf model (#33526)

fix missing head_dim in llama config from gguf
Isotr0py 2024-09-18 21:46:12 +08:00 committed by GitHub
parent db72894b48
commit 9f2b8cc45a

@@ -120,7 +120,8 @@ GGUF_CONFIG_MAPPING = {
         "block_count": "num_hidden_layers",
         "feed_forward_length": "intermediate_size",
         "embedding_length": "hidden_size",
-        "rope.dimension_count": None,
+        # NOTE: rope.dimension_count==head_dim only suitable for llama/mistral
+        "rope.dimension_count": "head_dim",
         "rope.freq_base": "rope_theta",
         "attention.head_count": "num_attention_heads",
         "attention.head_count_kv": "num_key_value_heads",
@@ -132,7 +133,8 @@ GGUF_CONFIG_MAPPING = {
         "block_count": "num_hidden_layers",
         "feed_forward_length": "intermediate_size",
         "embedding_length": "hidden_size",
-        "rope.dimension_count": None,
+        # NOTE: rope.dimension_count==head_dim only suitable for llama/mistral
+        "rope.dimension_count": "head_dim",
         "rope.freq_base": "rope_theta",
         "attention.head_count": "num_attention_heads",
         "attention.head_count_kv": "num_key_value_heads",