warnold-nv committed 9 days ago

Commit

ed14abf

verified ·

1 Parent(s): a95f37e

Add files using upload-large-folder tool

Browse files

This view is limited to 50 files because it contains too many changes. See raw diff

Files changed (50) hide show

.gitattributes +2 -0
chat_template.jinja +86 -0
config.json +77 -0
generation_config.json +11 -0
hf_quant_config.json +14 -0
model-00001-of-00071.safetensors +3 -0
model-00002-of-00071.safetensors +3 -0
model-00003-of-00071.safetensors +3 -0
model-00004-of-00071.safetensors +3 -0
model-00006-of-00071.safetensors +3 -0
model-00007-of-00071.safetensors +3 -0
model-00010-of-00071.safetensors +3 -0
model-00011-of-00071.safetensors +3 -0
model-00012-of-00071.safetensors +3 -0
model-00014-of-00071.safetensors +3 -0
model-00015-of-00071.safetensors +3 -0
model-00016-of-00071.safetensors +3 -0
model-00018-of-00071.safetensors +3 -0
model-00019-of-00071.safetensors +3 -0
model-00021-of-00071.safetensors +3 -0
model-00022-of-00071.safetensors +3 -0
model-00023-of-00071.safetensors +3 -0
model-00026-of-00071.safetensors +3 -0
model-00027-of-00071.safetensors +3 -0
model-00028-of-00071.safetensors +3 -0
model-00029-of-00071.safetensors +3 -0
model-00031-of-00071.safetensors +3 -0
model-00032-of-00071.safetensors +3 -0
model-00036-of-00071.safetensors +3 -0
model-00038-of-00071.safetensors +3 -0
model-00039-of-00071.safetensors +3 -0
model-00040-of-00071.safetensors +3 -0
model-00044-of-00071.safetensors +3 -0
model-00046-of-00071.safetensors +3 -0
model-00047-of-00071.safetensors +3 -0
model-00048-of-00071.safetensors +3 -0
model-00049-of-00071.safetensors +3 -0
model-00051-of-00071.safetensors +3 -0
model-00052-of-00071.safetensors +3 -0
model-00054-of-00071.safetensors +3 -0
model-00056-of-00071.safetensors +3 -0
model-00059-of-00071.safetensors +3 -0
model-00062-of-00071.safetensors +3 -0
model-00064-of-00071.safetensors +3 -0
model-00067-of-00071.safetensors +3 -0
model-00069-of-00071.safetensors +3 -0
model-00071-of-00071.safetensors +3 -0
model.safetensors.index.json +3 -0
special_tokens_map.json +34 -0
tokenizer.json +3 -0

.gitattributes CHANGED Viewed

@@ -33,3 +33,5 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text

 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+model.safetensors.index.json filter=lfs diff=lfs merge=lfs -text
+tokenizer.json filter=lfs diff=lfs merge=lfs -text

chat_template.jinja ADDED Viewed

	@@ -0,0 +1,86 @@

+[gMASK]<sop>
+{%- if tools -%}{#- When tools are supplied, emit a system turn that lists each tool as one JSON line inside <tools> tags and then describes the XML tool-call format the model must produce. -#}
+<|system|>
+# Tools
+You may call one or more functions to assist with the user query.
+You are provided with function signatures within <tools></tools> XML tags:
+<tools>
+{% for tool in tools %}
+{{ tool | tojson(ensure_ascii=False) }}
+{% endfor %}
+</tools>
+For each function call, output the function name and arguments within the following XML format:
+<tool_call>{function-name}<arg_key>{arg-key-1}</arg_key><arg_value>{arg-value-1}</arg_value><arg_key>{arg-key-2}</arg_key><arg_value>{arg-value-2}</arg_value>...</tool_call>{%- endif -%}
+{%- macro visible_text(content) -%}{#- Render a message's content as plain text. Strings pass through unchanged; for a non-mapping iterable, the text of every item is concatenated; any other value is emitted as-is. -#}
+    {%- if content is string -%}{#- Tested first because a string also satisfies the 'iterable' test. -#}
+        {{- content }}
+    {%- elif content is iterable and content is not mapping -%}
+        {%- for item in content -%}{#- Only mapping items with type == 'text' and bare string items contribute; every other item is skipped. -#}
+            {%- if item is mapping and item.type == 'text' -%}
+                {{- item.text }}
+            {%- elif item is string -%}
+                {{- item }}
+            {%- endif -%}
+        {%- endfor -%}
+    {%- else -%}
+        {{- content }}
+    {%- endif -%}
+{%- endmacro -%}
+{%- set ns = namespace(last_user_index=-1) %}{# Find the zero-based index of the last user message (stays -1 when there is none). A namespace object is used because a plain variable set inside a for loop does not persist after the loop. The main loop compares each assistant turn's index against this value. #}
+{%- for m in messages %}
+    {%- if m.role == 'user' %}
+        {% set ns.last_user_index = loop.index0 -%}
+    {%- endif %}
+{%- endfor %}
+{% for m in messages %}
+{%- if m.role == 'user' -%}<|user|>{{ visible_text(m.content) }}
+{%- elif m.role == 'assistant' -%}{#- Assistant turn: a thinking section first, then the visible content, then any tool calls. -#}
+<|assistant|>
+{%- set reasoning_content = '' %}
+{%- set content = visible_text(m.content) %}
+{%- if m.reasoning_content is string %}
+    {%- set reasoning_content = m.reasoning_content %}
+{%- else %}{# No separate reasoning_content string: if the content contains a closing think tag, split the reasoning out of the content and keep only what follows the tag as the visible content. #}
+    {%- if '</think>' in content %}
+        {%- set reasoning_content = content.split('</think>')[0].rstrip('\n').split('<think>')[-1].lstrip('\n') %}
+        {%- set content = content.split('</think>')[-1].lstrip('\n') %}
+    {%- endif %}
+{%- endif %}
+{%- if ((clear_thinking is defined and not clear_thinking) or loop.index0 > ns.last_user_index) and reasoning_content -%}{#- Reasoning is kept only when it is non-empty and either this turn comes after the last user message or clear_thinking is defined and false; in every other case only a bare closing think tag is emitted. -#}
+{{ '<think>' + reasoning_content.strip() +  '</think>'}}
+{%- else -%}
+{{ '</think>' }}
+{%- endif -%}
+{%- if content.strip() -%}
+{{ content.strip() }}
+{%- endif -%}
+{% if m.tool_calls %}
+{% for tc in m.tool_calls %}
+{%- if tc.function %}{# A tool call that carries a 'function' entry is unwrapped to that entry; otherwise tc itself supplies name and arguments. #}
+    {%- set tc = tc.function %}
+{%- endif %}
+{{- '<tool_call>' + tc.name -}}{#- The arguments value must be a mapping because .items() is called on it; string values are written verbatim and all other values are JSON-encoded. -#}
+{% set _args = tc.arguments %}{% for k, v in _args.items() %}<arg_key>{{ k }}</arg_key><arg_value>{{ v | tojson(ensure_ascii=False) if v is not string else v }}</arg_value>{% endfor %}</tool_call>{% endfor %}
+{% endif %}
+{%- elif m.role == 'tool' -%}{#- Tool results. String content is wrapped in one tool_response element, and the observation marker is emitted only when the previous message was not also a tool message. Non-string content is iterated, emitting the marker once and one tool_response per item (using item.output when defined). -#}
+{%- if m.content is string -%}
+{%- if loop.first or (messages[loop.index0 - 1].role != "tool") %}
+    {{- '<|observation|>' }}
+{%- endif %}
+{{- '<tool_response>' }}
+{{- m.content }}
+{{- '</tool_response>' }}
+{%- else -%}
+<|observation|>{% for tr in m.content %}
+<tool_response>{{ tr.output if tr.output is defined else tr }}</tool_response>{% endfor -%}
+{% endif -%}
+{%- elif m.role == 'system' -%}
+<|system|>{{ visible_text(m.content) }}
+{%- endif -%}
+{%- endfor -%}
+{%- if add_generation_prompt -%}{#- Open a new assistant turn. It starts with an opening think tag by default, and with a closing think tag when enable_thinking is defined and false. -#}
+    <|assistant|>{{- '</think>' if (enable_thinking is defined and not enable_thinking) else '<think>' -}}
+{%- endif -%}

config.json ADDED Viewed

	@@ -0,0 +1,77 @@

+{
+    "architectures": [
+        "Glm4MoeForCausalLM"
+    ],
+    "attention_bias": true,
+    "attention_dropout": 0.0,
+    "dtype": "bfloat16",
+    "eos_token_id": [
+        151329,
+        151336,
+        151338
+    ],
+    "first_k_dense_replace": 3,
+    "head_dim": 128,
+    "hidden_act": "silu",
+    "hidden_size": 5120,
+    "initializer_range": 0.02,
+    "intermediate_size": 12288,
+    "max_position_embeddings": 202752,
+    "model_type": "glm4_moe",
+    "moe_intermediate_size": 1536,
+    "n_group": 1,
+    "n_routed_experts": 160,
+    "n_shared_experts": 1,
+    "norm_topk_prob": true,
+    "num_attention_heads": 96,
+    "num_experts_per_tok": 8,
+    "num_hidden_layers": 92,
+    "num_key_value_heads": 8,
+    "num_nextn_predict_layers": 1,
+    "pad_token_id": 151329,
+    "partial_rotary_factor": 0.5,
+    "rms_norm_eps": 1e-05,
+    "rope_scaling": null,
+    "rope_theta": 1000000,
+    "routed_scaling_factor": 2.5,
+    "tie_word_embeddings": false,
+    "topk_group": 1,
+    "transformers_version": "4.57.1",
+    "use_cache": true,
+    "use_qk_norm": true,
+    "vocab_size": 151552,
+    "quantization_config": {
+        "config_groups": {
+            "group_0": {
+                "input_activations": {
+                    "dynamic": false,
+                    "num_bits": 8,
+                    "type": "float"
+                },
+                "weights": {
+                    "dynamic": false,
+                    "num_bits": 8,
+                    "type": "float"
+                },
+                "targets": [
+                    "Linear"
+                ]
+            }
+        },
+        "ignore": [
+            "lm_head",
+            "model.layers.92*"
+        ],
+        "quant_algo": "FP8",
+        "kv_cache_scheme": {
+            "dynamic": false,
+            "num_bits": 8,
+            "type": "float"
+        },
+        "producer": {
+            "name": "modelopt",
+            "version": "0.42.0rc1.dev9+ge53ca61b7"
+        },
+        "quant_method": "modelopt"
+    }
+}

generation_config.json ADDED Viewed

	@@ -0,0 +1,11 @@

+{
+  "_from_model_config": true,
+  "eos_token_id": [
+    151329,
+    151336,
+    151338
+  ],
+  "pad_token_id": 151329,
+  "temperature": 1.0,
+  "transformers_version": "4.56.2"
+}

hf_quant_config.json ADDED Viewed

	@@ -0,0 +1,14 @@

+{
+    "producer": {
+        "name": "modelopt",
+        "version": "0.42.0rc1.dev9+ge53ca61b7"
+    },
+    "quantization": {
+        "quant_algo": "FP8",
+        "kv_cache_quant_algo": "FP8",
+        "exclude_modules": [
+            "lm_head",
+            "model.layers.92*"
+        ]
+    }
+}

model-00001-of-00071.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9a9fe7e2a9f7ae1423b3c67f1038d4484437628a9df0e85091894b1428966cc0
+size 4999379848

model-00002-of-00071.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c4399dba86b3ffbcf79f757eabc381ac08525119ebc31cbb733da44542fcdb12
+size 4998372816

model-00003-of-00071.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c4906e51155ec8aeacd93d6bef0eb7b170fd403cb42fbae1b4d907b098083c1a
+size 4994814792

model-00004-of-00071.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2ea6fcf69bfe7893f2d72f20524b22829ca7a534a02ee9e1c06f5d49134d1791
+size 4998372416

model-00006-of-00071.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:86ed4fd8fc5777b046e58bdeffa91375547ba3f0e275d58fb8b030ab5e16d420
+size 4998372824

model-00007-of-00071.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:11c762199b9941a2d014ceb111826b9a66aab16217f04f6d8eee3d3b5fa20abd
+size 4994816176

model-00010-of-00071.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7e4162684af6e7d33b55fa66fdced487ed64298a4095df4752953b6d7b54c037
+size 4994816648

model-00011-of-00071.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:266af5abb658587ca21d23f0b50dc6752471d47ed489cda75b4e68849844adc3
+size 4998374232

model-00012-of-00071.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:883202738bd8fecb14b45512d1446cb40c00f035e17744aede260e52cce028e6
+size 4998374296

model-00014-of-00071.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cb0266602d75db7623b31d9b30b1a36a795ce5992fa59e3a43916fb3711dc278
+size 4994816624

model-00015-of-00071.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:216561e9da7eee80b5b3c82d78eb1867bb884508892c7bb308b015848a79b88b
+size 4998374296

model-00016-of-00071.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d3012980b56037e8e12fed54950a2eb7292ba3a2781eeb8c145e55b4fd634761
+size 4998374352

model-00018-of-00071.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:29db1d88854a27bc49c66d9c9291d12d34bc0940d9f56c32dd974452ed6a835a
+size 4994816584

model-00019-of-00071.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3acb093da248844c1b9c9e7eec982b736bd4e1257ecdf629896dc69aaa0cf2cc
+size 4998374296

model-00021-of-00071.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:faf87add52cb1541dffd20ff3344fdd99bf82148afd83487648e189738c3d659
+size 4997437536

model-00022-of-00071.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:30d08374366e5c697acb051012afa496cc9ba94ac1c1537cb2e9ea0a187ca005
+size 4995753328

model-00023-of-00071.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4473d5c2515c242b9c8de85761e1f5d812e762b00c7453c32d3eb874b2b12412
+size 4998374296

model-00026-of-00071.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a7bf1bc4d39100c765a6d0c1d9f9ce98ad48687a37ef448d0710c484e8aaf2e4
+size 4998374296

model-00027-of-00071.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ae074a7acf90cd8c9dc35854f48739c0d740be9f441927926904abe49f72e999
+size 4998374296

model-00028-of-00071.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:fceaecdfa64394c356c50647a85b0c8f798ecbc8c014651cbcf658e421c149c7
+size 4998374704

model-00029-of-00071.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1d64e3e16181650d3f1a46eea53128afd47d0182a88e6e5a79c7500402ed67c1
+size 4994816640

model-00031-of-00071.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c860a25818818aefc4257636bcaaf9692180d378a76216417722edc4185f98c0
+size 4998374416

model-00032-of-00071.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cafb9af43f6c4ada1d7c2ee60ca3b605c4813824a679ccf8c55aa972465852f0
+size 4998374704

model-00036-of-00071.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a427937253b67463803fd8b30ac7495e6e1c30b371497bdcc8a39bed28628a3e
+size 4994816640

model-00038-of-00071.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2b5402bbdef41082d482f1c7732405960cd439912971e748e2c13bb28ff2fd44
+size 4998374296

model-00039-of-00071.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:93f3ebebbff23b22b6917add391de145f487f2d7dc586e4561119f27b0b20bf8
+size 4998374648

model-00040-of-00071.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ae146b2d626da2845b00f9d5f000c01d4696ffccfbec2d76d29a0a9da02641cb
+size 4994816624

model-00044-of-00071.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:002012b1650bbbf60d4fe4751cfa99df40eb4e1a1cbf85517bd0007608d16d87
+size 4994816576

model-00046-of-00071.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8e35484cb15b5113f7ff0d5e04fd322b0f0faa525e6f61058d49229020fd463b
+size 4998374480

model-00047-of-00071.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:54a97c1f908a8c00eab808d9d0dd09a41939038c67945f360b6d8905f2b06d9f
+size 4979088880

model-00048-of-00071.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ffe37928357d318e71754917de561c15a0c72dcb1dd9dface0b6f571535b5dc1
+size 4998372632

model-00049-of-00071.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:42bd5f042706ad310d6e4526526f89b51f27528538927465247be0bd813caabb
+size 4998374296

model-00051-of-00071.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ca7169513b1dbb516f8ef2b4bc6c232000f40be01299bc83d8538af21b9b9fb3
+size 4994816600

model-00052-of-00071.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:907a3ebf2e569e5a8683a883bd1ac9b158632acfbdad61c4023787d7c6eebe51
+size 4998374296

model-00054-of-00071.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:dc4abeb456d790a1475ea5686a45f2d561e07dabc6c4b1675b089ad7e0128420
+size 4998374704

model-00056-of-00071.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:22bd5ad18875cde1ca6a121b21841f73ec8fff1bd55e346500065e95089d4fd4
+size 4998374296

model-00059-of-00071.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:18c8fb4a3d47a93ce939c17c7390a5eb63c6d3e5a5a2a3387509856540aa217c
+size 4994816552

model-00062-of-00071.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2997a08af88d306c48cf920873b6433f024d22405896db70ca5909e4ce041e57
+size 4994816640

model-00064-of-00071.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ed2ab2adb49308624499a80f277d544db4a94453de97b1b773ec737b68a78fda
+size 4998374296

model-00067-of-00071.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:eaeaacb52dc313f87381a2a6f32d81d010d0cfd3474bd372fef4ca4216c5b9be
+size 4998374296

model-00069-of-00071.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8393832ef0dd10d3b3b84073efb418ae04a0c449a063ba2e0c2b821a8fd4b01e
+size 4998374704

model-00071-of-00071.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9609ec3031885825c96641830314c5212c6310a55f2f11e63125a6c55d82f5d7
+size 4636515144

model.safetensors.index.json ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:067adab1d9864371e6693f328183cd792d07aac46b07731d2aa8d2fcc8e8615f
+size 12337281

special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,34 @@

+{
+  "additional_special_tokens": [
+    "<|endoftext|>",
+    "[MASK]",
+    "[gMASK]",
+    "[sMASK]",
+    "<sop>",
+    "<eop>",
+    "<|system|>",
+    "<|user|>",
+    "<|assistant|>",
+    "<|observation|>",
+    "<|begin_of_image|>",
+    "<|end_of_image|>",
+    "<|begin_of_video|>",
+    "<|end_of_video|>",
+    "<|begin_of_audio|>",
+    "<|end_of_audio|>",
+    "<|begin_of_transcription|>",
+    "<|end_of_transcription|>",
+    "<|code_prefix|>",
+    "<|code_middle|>",
+    "<|code_suffix|>",
+    "/nothink"
+  ],
+  "eos_token": {
+    "content": "<|endoftext|>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "pad_token": "<|endoftext|>"
+}

tokenizer.json ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:bda8e2146c3bb7b7e0fc96dcc4f0aeff041c6c27952e3ace0665663ebff346ba
+size 19970700