Fix loading Llama-3_3-Nemotron-Super-49B-v1 and similar models (closes #7012)

2025-06-07 14:17:09 -04:00 · 2025-05-25 17:19:26 -07:00 · 2025-05-25 17:19:26 -07:00 · bae1aa34aa
commit bae1aa34aa
parent 7f6579ab20
1 changed files with 1 additions and 1 deletions
--- a/modules/models_settings.py
+++ b/modules/models_settings.py
@ -335,7 +335,7 @@ def estimate_vram(gguf_file, gpu_layers, ctx_size, cache_type):
        if key.endswith('.block_count'):
            n_layers = value
        elif key.endswith('.attention.head_count_kv'):
-            n_kv_heads = value
+            n_kv_heads = max(value) if isinstance(value, list) else value
        elif key.endswith('.embedding_length'):
            embedding_dim = value