llama-model : add Glm4Model implementation for GLM-4-0414 (#12867)

* GLM-4-0414 * use original one * Using with tensor map * fix bug * change order * change order * format with flake8
2025-04-11 18:10:10 +08:00 · 2025-04-11 18:10:10 +08:00 · 06bb53ad9b
commit 06bb53ad9b
parent 0c50923944
9 changed files with 273 additions and 4 deletions
--- a/convert_hf_to_gguf_update.py
+++ b/convert_hf_to_gguf_update.py
@@ -114,6 +114,7 @@ models = [
    {"name": "trillion",         "tokt": TOKENIZER_TYPE.BPE, "repo": "https://huggingface.co/trillionlabs/Trillion-7B-preview", },
    {"name": "bailingmoe",       "tokt": TOKENIZER_TYPE.BPE, "repo": "https://huggingface.co/inclusionAI/Ling-lite", },
    {"name": "llama4",           "tokt": TOKENIZER_TYPE.BPE, "repo": "https://huggingface.co/meta-llama/Llama-4-Scout-17B-16E-Instruct", },
+    {"name": "glm4",             "tokt": TOKENIZER_TYPE.BPE, "repo": "https://huggingface.co/THUDM/glm-4-9b-hf", },
 ]