Add files using upload-large-folder tool
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +2 -0
- chat_template.jinja +86 -0
- config.json +77 -0
- generation_config.json +11 -0
- hf_quant_config.json +14 -0
- model-00001-of-00071.safetensors +3 -0
- model-00002-of-00071.safetensors +3 -0
- model-00003-of-00071.safetensors +3 -0
- model-00004-of-00071.safetensors +3 -0
- model-00006-of-00071.safetensors +3 -0
- model-00007-of-00071.safetensors +3 -0
- model-00010-of-00071.safetensors +3 -0
- model-00011-of-00071.safetensors +3 -0
- model-00012-of-00071.safetensors +3 -0
- model-00014-of-00071.safetensors +3 -0
- model-00015-of-00071.safetensors +3 -0
- model-00016-of-00071.safetensors +3 -0
- model-00018-of-00071.safetensors +3 -0
- model-00019-of-00071.safetensors +3 -0
- model-00021-of-00071.safetensors +3 -0
- model-00022-of-00071.safetensors +3 -0
- model-00023-of-00071.safetensors +3 -0
- model-00026-of-00071.safetensors +3 -0
- model-00027-of-00071.safetensors +3 -0
- model-00028-of-00071.safetensors +3 -0
- model-00029-of-00071.safetensors +3 -0
- model-00031-of-00071.safetensors +3 -0
- model-00032-of-00071.safetensors +3 -0
- model-00036-of-00071.safetensors +3 -0
- model-00038-of-00071.safetensors +3 -0
- model-00039-of-00071.safetensors +3 -0
- model-00040-of-00071.safetensors +3 -0
- model-00044-of-00071.safetensors +3 -0
- model-00046-of-00071.safetensors +3 -0
- model-00047-of-00071.safetensors +3 -0
- model-00048-of-00071.safetensors +3 -0
- model-00049-of-00071.safetensors +3 -0
- model-00051-of-00071.safetensors +3 -0
- model-00052-of-00071.safetensors +3 -0
- model-00054-of-00071.safetensors +3 -0
- model-00056-of-00071.safetensors +3 -0
- model-00059-of-00071.safetensors +3 -0
- model-00062-of-00071.safetensors +3 -0
- model-00064-of-00071.safetensors +3 -0
- model-00067-of-00071.safetensors +3 -0
- model-00069-of-00071.safetensors +3 -0
- model-00071-of-00071.safetensors +3 -0
- model.safetensors.index.json +3 -0
- special_tokens_map.json +34 -0
- tokenizer.json +3 -0
.gitattributes
CHANGED
|
@@ -33,3 +33,5 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 36 |
+
model.safetensors.index.json filter=lfs diff=lfs merge=lfs -text
|
| 37 |
+
tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
chat_template.jinja
ADDED
|
@@ -0,0 +1,86 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[gMASK]<sop>
|
| 2 |
+
{%- if tools -%}
|
| 3 |
+
<|system|>
|
| 4 |
+
# Tools
|
| 5 |
+
|
| 6 |
+
You may call one or more functions to assist with the user query.
|
| 7 |
+
|
| 8 |
+
You are provided with function signatures within <tools></tools> XML tags:
|
| 9 |
+
<tools>
|
| 10 |
+
{% for tool in tools %}
|
| 11 |
+
{{ tool | tojson(ensure_ascii=False) }}
|
| 12 |
+
{% endfor %}
|
| 13 |
+
</tools>
|
| 14 |
+
|
| 15 |
+
For each function call, output the function name and arguments within the following XML format:
|
| 16 |
+
<tool_call>{function-name}<arg_key>{arg-key-1}</arg_key><arg_value>{arg-value-1}</arg_value><arg_key>{arg-key-2}</arg_key><arg_value>{arg-value-2}</arg_value>...</tool_call>{%- endif -%}
|
| 17 |
+
{%- macro visible_text(content) -%}
|
| 18 |
+
{%- if content is string -%}
|
| 19 |
+
{{- content }}
|
| 20 |
+
{%- elif content is iterable and content is not mapping -%}
|
| 21 |
+
{%- for item in content -%}
|
| 22 |
+
{%- if item is mapping and item.type == 'text' -%}
|
| 23 |
+
{{- item.text }}
|
| 24 |
+
{%- elif item is string -%}
|
| 25 |
+
{{- item }}
|
| 26 |
+
{%- endif -%}
|
| 27 |
+
{%- endfor -%}
|
| 28 |
+
{%- else -%}
|
| 29 |
+
{{- content }}
|
| 30 |
+
{%- endif -%}
|
| 31 |
+
{%- endmacro -%}
|
| 32 |
+
{%- set ns = namespace(last_user_index=-1) %}
|
| 33 |
+
{%- for m in messages %}
|
| 34 |
+
{%- if m.role == 'user' %}
|
| 35 |
+
{% set ns.last_user_index = loop.index0 -%}
|
| 36 |
+
{%- endif %}
|
| 37 |
+
{%- endfor %}
|
| 38 |
+
{% for m in messages %}
|
| 39 |
+
{%- if m.role == 'user' -%}<|user|>{{ visible_text(m.content) }}
|
| 40 |
+
{%- elif m.role == 'assistant' -%}
|
| 41 |
+
<|assistant|>
|
| 42 |
+
{%- set reasoning_content = '' %}
|
| 43 |
+
{%- set content = visible_text(m.content) %}
|
| 44 |
+
{%- if m.reasoning_content is string %}
|
| 45 |
+
{%- set reasoning_content = m.reasoning_content %}
|
| 46 |
+
{%- else %}
|
| 47 |
+
{%- if '</think>' in content %}
|
| 48 |
+
{%- set reasoning_content = content.split('</think>')[0].rstrip('\n').split('<think>')[-1].lstrip('\n') %}
|
| 49 |
+
{%- set content = content.split('</think>')[-1].lstrip('\n') %}
|
| 50 |
+
{%- endif %}
|
| 51 |
+
{%- endif %}
|
| 52 |
+
{%- if ((clear_thinking is defined and not clear_thinking) or loop.index0 > ns.last_user_index) and reasoning_content -%}
|
| 53 |
+
{{ '<think>' + reasoning_content.strip() + '</think>'}}
|
| 54 |
+
{%- else -%}
|
| 55 |
+
{{ '</think>' }}
|
| 56 |
+
{%- endif -%}
|
| 57 |
+
{%- if content.strip() -%}
|
| 58 |
+
{{ content.strip() }}
|
| 59 |
+
{%- endif -%}
|
| 60 |
+
{% if m.tool_calls %}
|
| 61 |
+
{% for tc in m.tool_calls %}
|
| 62 |
+
{%- if tc.function %}
|
| 63 |
+
{%- set tc = tc.function %}
|
| 64 |
+
{%- endif %}
|
| 65 |
+
{{- '<tool_call>' + tc.name -}}
|
| 66 |
+
{% set _args = tc.arguments %}{% for k, v in _args.items() %}<arg_key>{{ k }}</arg_key><arg_value>{{ v | tojson(ensure_ascii=False) if v is not string else v }}</arg_value>{% endfor %}</tool_call>{% endfor %}
|
| 67 |
+
{% endif %}
|
| 68 |
+
{%- elif m.role == 'tool' -%}
|
| 69 |
+
{%- if m.content is string -%}
|
| 70 |
+
{%- if loop.first or (messages[loop.index0 - 1].role != "tool") %}
|
| 71 |
+
{{- '<|observation|>' }}
|
| 72 |
+
{%- endif %}
|
| 73 |
+
{{- '<tool_response>' }}
|
| 74 |
+
{{- m.content }}
|
| 75 |
+
{{- '</tool_response>' }}
|
| 76 |
+
{%- else -%}
|
| 77 |
+
<|observation|>{% for tr in m.content %}
|
| 78 |
+
<tool_response>{{ tr.output if tr.output is defined else tr }}</tool_response>{% endfor -%}
|
| 79 |
+
{% endif -%}
|
| 80 |
+
{%- elif m.role == 'system' -%}
|
| 81 |
+
<|system|>{{ visible_text(m.content) }}
|
| 82 |
+
{%- endif -%}
|
| 83 |
+
{%- endfor -%}
|
| 84 |
+
{%- if add_generation_prompt -%}
|
| 85 |
+
<|assistant|>{{- '</think>' if (enable_thinking is defined and not enable_thinking) else '<think>' -}}
|
| 86 |
+
{%- endif -%}
|
config.json
ADDED
|
@@ -0,0 +1,77 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"architectures": [
|
| 3 |
+
"Glm4MoeForCausalLM"
|
| 4 |
+
],
|
| 5 |
+
"attention_bias": true,
|
| 6 |
+
"attention_dropout": 0.0,
|
| 7 |
+
"dtype": "bfloat16",
|
| 8 |
+
"eos_token_id": [
|
| 9 |
+
151329,
|
| 10 |
+
151336,
|
| 11 |
+
151338
|
| 12 |
+
],
|
| 13 |
+
"first_k_dense_replace": 3,
|
| 14 |
+
"head_dim": 128,
|
| 15 |
+
"hidden_act": "silu",
|
| 16 |
+
"hidden_size": 5120,
|
| 17 |
+
"initializer_range": 0.02,
|
| 18 |
+
"intermediate_size": 12288,
|
| 19 |
+
"max_position_embeddings": 202752,
|
| 20 |
+
"model_type": "glm4_moe",
|
| 21 |
+
"moe_intermediate_size": 1536,
|
| 22 |
+
"n_group": 1,
|
| 23 |
+
"n_routed_experts": 160,
|
| 24 |
+
"n_shared_experts": 1,
|
| 25 |
+
"norm_topk_prob": true,
|
| 26 |
+
"num_attention_heads": 96,
|
| 27 |
+
"num_experts_per_tok": 8,
|
| 28 |
+
"num_hidden_layers": 92,
|
| 29 |
+
"num_key_value_heads": 8,
|
| 30 |
+
"num_nextn_predict_layers": 1,
|
| 31 |
+
"pad_token_id": 151329,
|
| 32 |
+
"partial_rotary_factor": 0.5,
|
| 33 |
+
"rms_norm_eps": 1e-05,
|
| 34 |
+
"rope_scaling": null,
|
| 35 |
+
"rope_theta": 1000000,
|
| 36 |
+
"routed_scaling_factor": 2.5,
|
| 37 |
+
"tie_word_embeddings": false,
|
| 38 |
+
"topk_group": 1,
|
| 39 |
+
"transformers_version": "4.57.1",
|
| 40 |
+
"use_cache": true,
|
| 41 |
+
"use_qk_norm": true,
|
| 42 |
+
"vocab_size": 151552,
|
| 43 |
+
"quantization_config": {
|
| 44 |
+
"config_groups": {
|
| 45 |
+
"group_0": {
|
| 46 |
+
"input_activations": {
|
| 47 |
+
"dynamic": false,
|
| 48 |
+
"num_bits": 8,
|
| 49 |
+
"type": "float"
|
| 50 |
+
},
|
| 51 |
+
"weights": {
|
| 52 |
+
"dynamic": false,
|
| 53 |
+
"num_bits": 8,
|
| 54 |
+
"type": "float"
|
| 55 |
+
},
|
| 56 |
+
"targets": [
|
| 57 |
+
"Linear"
|
| 58 |
+
]
|
| 59 |
+
}
|
| 60 |
+
},
|
| 61 |
+
"ignore": [
|
| 62 |
+
"lm_head",
|
| 63 |
+
"model.layers.92*"
|
| 64 |
+
],
|
| 65 |
+
"quant_algo": "FP8",
|
| 66 |
+
"kv_cache_scheme": {
|
| 67 |
+
"dynamic": false,
|
| 68 |
+
"num_bits": 8,
|
| 69 |
+
"type": "float"
|
| 70 |
+
},
|
| 71 |
+
"producer": {
|
| 72 |
+
"name": "modelopt",
|
| 73 |
+
"version": "0.42.0rc1.dev9+ge53ca61b7"
|
| 74 |
+
},
|
| 75 |
+
"quant_method": "modelopt"
|
| 76 |
+
}
|
| 77 |
+
}
|
generation_config.json
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_from_model_config": true,
|
| 3 |
+
"eos_token_id": [
|
| 4 |
+
151329,
|
| 5 |
+
151336,
|
| 6 |
+
151338
|
| 7 |
+
],
|
| 8 |
+
"pad_token_id": 151329,
|
| 9 |
+
"temperature": 1.0,
|
| 10 |
+
"transformers_version": "4.56.2"
|
| 11 |
+
}
|
hf_quant_config.json
ADDED
|
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"producer": {
|
| 3 |
+
"name": "modelopt",
|
| 4 |
+
"version": "0.42.0rc1.dev9+ge53ca61b7"
|
| 5 |
+
},
|
| 6 |
+
"quantization": {
|
| 7 |
+
"quant_algo": "FP8",
|
| 8 |
+
"kv_cache_quant_algo": "FP8",
|
| 9 |
+
"exclude_modules": [
|
| 10 |
+
"lm_head",
|
| 11 |
+
"model.layers.92*"
|
| 12 |
+
]
|
| 13 |
+
}
|
| 14 |
+
}
|
model-00001-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9a9fe7e2a9f7ae1423b3c67f1038d4484437628a9df0e85091894b1428966cc0
|
| 3 |
+
size 4999379848
|
model-00002-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c4399dba86b3ffbcf79f757eabc381ac08525119ebc31cbb733da44542fcdb12
|
| 3 |
+
size 4998372816
|
model-00003-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c4906e51155ec8aeacd93d6bef0eb7b170fd403cb42fbae1b4d907b098083c1a
|
| 3 |
+
size 4994814792
|
model-00004-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2ea6fcf69bfe7893f2d72f20524b22829ca7a534a02ee9e1c06f5d49134d1791
|
| 3 |
+
size 4998372416
|
model-00006-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:86ed4fd8fc5777b046e58bdeffa91375547ba3f0e275d58fb8b030ab5e16d420
|
| 3 |
+
size 4998372824
|
model-00007-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:11c762199b9941a2d014ceb111826b9a66aab16217f04f6d8eee3d3b5fa20abd
|
| 3 |
+
size 4994816176
|
model-00010-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7e4162684af6e7d33b55fa66fdced487ed64298a4095df4752953b6d7b54c037
|
| 3 |
+
size 4994816648
|
model-00011-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:266af5abb658587ca21d23f0b50dc6752471d47ed489cda75b4e68849844adc3
|
| 3 |
+
size 4998374232
|
model-00012-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:883202738bd8fecb14b45512d1446cb40c00f035e17744aede260e52cce028e6
|
| 3 |
+
size 4998374296
|
model-00014-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cb0266602d75db7623b31d9b30b1a36a795ce5992fa59e3a43916fb3711dc278
|
| 3 |
+
size 4994816624
|
model-00015-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:216561e9da7eee80b5b3c82d78eb1867bb884508892c7bb308b015848a79b88b
|
| 3 |
+
size 4998374296
|
model-00016-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d3012980b56037e8e12fed54950a2eb7292ba3a2781eeb8c145e55b4fd634761
|
| 3 |
+
size 4998374352
|
model-00018-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:29db1d88854a27bc49c66d9c9291d12d34bc0940d9f56c32dd974452ed6a835a
|
| 3 |
+
size 4994816584
|
model-00019-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3acb093da248844c1b9c9e7eec982b736bd4e1257ecdf629896dc69aaa0cf2cc
|
| 3 |
+
size 4998374296
|
model-00021-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:faf87add52cb1541dffd20ff3344fdd99bf82148afd83487648e189738c3d659
|
| 3 |
+
size 4997437536
|
model-00022-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:30d08374366e5c697acb051012afa496cc9ba94ac1c1537cb2e9ea0a187ca005
|
| 3 |
+
size 4995753328
|
model-00023-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4473d5c2515c242b9c8de85761e1f5d812e762b00c7453c32d3eb874b2b12412
|
| 3 |
+
size 4998374296
|
model-00026-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a7bf1bc4d39100c765a6d0c1d9f9ce98ad48687a37ef448d0710c484e8aaf2e4
|
| 3 |
+
size 4998374296
|
model-00027-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ae074a7acf90cd8c9dc35854f48739c0d740be9f441927926904abe49f72e999
|
| 3 |
+
size 4998374296
|
model-00028-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fceaecdfa64394c356c50647a85b0c8f798ecbc8c014651cbcf658e421c149c7
|
| 3 |
+
size 4998374704
|
model-00029-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1d64e3e16181650d3f1a46eea53128afd47d0182a88e6e5a79c7500402ed67c1
|
| 3 |
+
size 4994816640
|
model-00031-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c860a25818818aefc4257636bcaaf9692180d378a76216417722edc4185f98c0
|
| 3 |
+
size 4998374416
|
model-00032-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cafb9af43f6c4ada1d7c2ee60ca3b605c4813824a679ccf8c55aa972465852f0
|
| 3 |
+
size 4998374704
|
model-00036-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a427937253b67463803fd8b30ac7495e6e1c30b371497bdcc8a39bed28628a3e
|
| 3 |
+
size 4994816640
|
model-00038-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2b5402bbdef41082d482f1c7732405960cd439912971e748e2c13bb28ff2fd44
|
| 3 |
+
size 4998374296
|
model-00039-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:93f3ebebbff23b22b6917add391de145f487f2d7dc586e4561119f27b0b20bf8
|
| 3 |
+
size 4998374648
|
model-00040-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ae146b2d626da2845b00f9d5f000c01d4696ffccfbec2d76d29a0a9da02641cb
|
| 3 |
+
size 4994816624
|
model-00044-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:002012b1650bbbf60d4fe4751cfa99df40eb4e1a1cbf85517bd0007608d16d87
|
| 3 |
+
size 4994816576
|
model-00046-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8e35484cb15b5113f7ff0d5e04fd322b0f0faa525e6f61058d49229020fd463b
|
| 3 |
+
size 4998374480
|
model-00047-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:54a97c1f908a8c00eab808d9d0dd09a41939038c67945f360b6d8905f2b06d9f
|
| 3 |
+
size 4979088880
|
model-00048-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ffe37928357d318e71754917de561c15a0c72dcb1dd9dface0b6f571535b5dc1
|
| 3 |
+
size 4998372632
|
model-00049-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:42bd5f042706ad310d6e4526526f89b51f27528538927465247be0bd813caabb
|
| 3 |
+
size 4998374296
|
model-00051-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ca7169513b1dbb516f8ef2b4bc6c232000f40be01299bc83d8538af21b9b9fb3
|
| 3 |
+
size 4994816600
|
model-00052-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:907a3ebf2e569e5a8683a883bd1ac9b158632acfbdad61c4023787d7c6eebe51
|
| 3 |
+
size 4998374296
|
model-00054-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dc4abeb456d790a1475ea5686a45f2d561e07dabc6c4b1675b089ad7e0128420
|
| 3 |
+
size 4998374704
|
model-00056-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:22bd5ad18875cde1ca6a121b21841f73ec8fff1bd55e346500065e95089d4fd4
|
| 3 |
+
size 4998374296
|
model-00059-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:18c8fb4a3d47a93ce939c17c7390a5eb63c6d3e5a5a2a3387509856540aa217c
|
| 3 |
+
size 4994816552
|
model-00062-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2997a08af88d306c48cf920873b6433f024d22405896db70ca5909e4ce041e57
|
| 3 |
+
size 4994816640
|
model-00064-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ed2ab2adb49308624499a80f277d544db4a94453de97b1b773ec737b68a78fda
|
| 3 |
+
size 4998374296
|
model-00067-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:eaeaacb52dc313f87381a2a6f32d81d010d0cfd3474bd372fef4ca4216c5b9be
|
| 3 |
+
size 4998374296
|
model-00069-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8393832ef0dd10d3b3b84073efb418ae04a0c449a063ba2e0c2b821a8fd4b01e
|
| 3 |
+
size 4998374704
|
model-00071-of-00071.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9609ec3031885825c96641830314c5212c6310a55f2f11e63125a6c55d82f5d7
|
| 3 |
+
size 4636515144
|
model.safetensors.index.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:067adab1d9864371e6693f328183cd792d07aac46b07731d2aa8d2fcc8e8615f
|
| 3 |
+
size 12337281
|
special_tokens_map.json
ADDED
|
@@ -0,0 +1,34 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"additional_special_tokens": [
|
| 3 |
+
"<|endoftext|>",
|
| 4 |
+
"[MASK]",
|
| 5 |
+
"[gMASK]",
|
| 6 |
+
"[sMASK]",
|
| 7 |
+
"<sop>",
|
| 8 |
+
"<eop>",
|
| 9 |
+
"<|system|>",
|
| 10 |
+
"<|user|>",
|
| 11 |
+
"<|assistant|>",
|
| 12 |
+
"<|observation|>",
|
| 13 |
+
"<|begin_of_image|>",
|
| 14 |
+
"<|end_of_image|>",
|
| 15 |
+
"<|begin_of_video|>",
|
| 16 |
+
"<|end_of_video|>",
|
| 17 |
+
"<|begin_of_audio|>",
|
| 18 |
+
"<|end_of_audio|>",
|
| 19 |
+
"<|begin_of_transcription|>",
|
| 20 |
+
"<|end_of_transcription|>",
|
| 21 |
+
"<|code_prefix|>",
|
| 22 |
+
"<|code_middle|>",
|
| 23 |
+
"<|code_suffix|>",
|
| 24 |
+
"/nothink"
|
| 25 |
+
],
|
| 26 |
+
"eos_token": {
|
| 27 |
+
"content": "<|endoftext|>",
|
| 28 |
+
"lstrip": false,
|
| 29 |
+
"normalized": false,
|
| 30 |
+
"rstrip": false,
|
| 31 |
+
"single_word": false
|
| 32 |
+
},
|
| 33 |
+
"pad_token": "<|endoftext|>"
|
| 34 |
+
}
|
tokenizer.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bda8e2146c3bb7b7e0fc96dcc4f0aeff041c6c27952e3ace0665663ebff346ba
|
| 3 |
+
size 19970700
|