Upload folder using huggingface_hub
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +1 -0
- tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/config.json +39 -0
- tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/generation_config.json +12 -0
- tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00001-of-00062.safetensors +3 -0
- tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00002-of-00062.safetensors +3 -0
- tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00003-of-00062.safetensors +3 -0
- tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00004-of-00062.safetensors +3 -0
- tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00005-of-00062.safetensors +3 -0
- tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00006-of-00062.safetensors +3 -0
- tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00007-of-00062.safetensors +3 -0
- tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00008-of-00062.safetensors +3 -0
- tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00009-of-00062.safetensors +3 -0
- tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00010-of-00062.safetensors +3 -0
- tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00011-of-00062.safetensors +3 -0
- tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00012-of-00062.safetensors +3 -0
- tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00013-of-00062.safetensors +3 -0
- tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00014-of-00062.safetensors +3 -0
- tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00015-of-00062.safetensors +3 -0
- tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00016-of-00062.safetensors +3 -0
- tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00017-of-00062.safetensors +3 -0
- tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00018-of-00062.safetensors +3 -0
- tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00019-of-00062.safetensors +3 -0
- tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00020-of-00062.safetensors +3 -0
- tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00021-of-00062.safetensors +3 -0
- tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00022-of-00062.safetensors +3 -0
- tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00023-of-00062.safetensors +3 -0
- tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00024-of-00062.safetensors +3 -0
- tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00025-of-00062.safetensors +3 -0
- tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00026-of-00062.safetensors +3 -0
- tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00027-of-00062.safetensors +3 -0
- tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00028-of-00062.safetensors +3 -0
- tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00029-of-00062.safetensors +3 -0
- tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00030-of-00062.safetensors +3 -0
- tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00031-of-00062.safetensors +3 -0
- tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00032-of-00062.safetensors +3 -0
- tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00033-of-00062.safetensors +3 -0
- tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00034-of-00062.safetensors +3 -0
- tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00035-of-00062.safetensors +3 -0
- tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00036-of-00062.safetensors +3 -0
- tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00037-of-00062.safetensors +3 -0
- tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00038-of-00062.safetensors +3 -0
- tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00039-of-00062.safetensors +3 -0
- tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00040-of-00062.safetensors +3 -0
- tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00041-of-00062.safetensors +3 -0
- tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00042-of-00062.safetensors +3 -0
- tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00043-of-00062.safetensors +3 -0
- tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00044-of-00062.safetensors +3 -0
- tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00045-of-00062.safetensors +3 -0
- tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00046-of-00062.safetensors +3 -0
- tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00047-of-00062.safetensors +3 -0
.gitattributes
CHANGED
|
@@ -150,3 +150,4 @@ kud-llama3.3-70b_biology_leaf_relearn_klr_gdr_biology_1_512_2e-5/checkpoint-1/to
|
|
| 150 |
kud-llama3.3-70b_biology_leaf_relearn_klr_gdr_biology_1_512_2e-5/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 151 |
kud-llama3.3-70b_biology_leaf_relearn_klr_gdr_biology_10_512_2e-5/checkpoint-1/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 152 |
kud-llama3.3-70b_biology_leaf_relearn_klr_gdr_biology_10_512_2e-5/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
| 150 |
kud-llama3.3-70b_biology_leaf_relearn_klr_gdr_biology_1_512_2e-5/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 151 |
kud-llama3.3-70b_biology_leaf_relearn_klr_gdr_biology_10_512_2e-5/checkpoint-1/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 152 |
kud-llama3.3-70b_biology_leaf_relearn_klr_gdr_biology_10_512_2e-5/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 153 |
+
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/config.json
ADDED
|
@@ -0,0 +1,39 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"architectures": [
|
| 3 |
+
"LlamaForCausalLM"
|
| 4 |
+
],
|
| 5 |
+
"attention_bias": false,
|
| 6 |
+
"attention_dropout": 0.0,
|
| 7 |
+
"bos_token_id": 128000,
|
| 8 |
+
"eos_token_id": [
|
| 9 |
+
128001,
|
| 10 |
+
128008,
|
| 11 |
+
128009
|
| 12 |
+
],
|
| 13 |
+
"head_dim": 128,
|
| 14 |
+
"hidden_act": "silu",
|
| 15 |
+
"hidden_size": 8192,
|
| 16 |
+
"initializer_range": 0.02,
|
| 17 |
+
"intermediate_size": 28672,
|
| 18 |
+
"max_position_embeddings": 131072,
|
| 19 |
+
"mlp_bias": false,
|
| 20 |
+
"model_type": "llama",
|
| 21 |
+
"num_attention_heads": 64,
|
| 22 |
+
"num_hidden_layers": 80,
|
| 23 |
+
"num_key_value_heads": 8,
|
| 24 |
+
"pretraining_tp": 1,
|
| 25 |
+
"rms_norm_eps": 1e-05,
|
| 26 |
+
"rope_scaling": {
|
| 27 |
+
"factor": 8.0,
|
| 28 |
+
"high_freq_factor": 4.0,
|
| 29 |
+
"low_freq_factor": 1.0,
|
| 30 |
+
"original_max_position_embeddings": 8192,
|
| 31 |
+
"rope_type": "llama3"
|
| 32 |
+
},
|
| 33 |
+
"rope_theta": 500000.0,
|
| 34 |
+
"tie_word_embeddings": false,
|
| 35 |
+
"torch_dtype": "float32",
|
| 36 |
+
"transformers_version": "4.51.0",
|
| 37 |
+
"use_cache": true,
|
| 38 |
+
"vocab_size": 128256
|
| 39 |
+
}
|
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/generation_config.json
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"bos_token_id": 128000,
|
| 3 |
+
"do_sample": true,
|
| 4 |
+
"eos_token_id": [
|
| 5 |
+
128001,
|
| 6 |
+
128008,
|
| 7 |
+
128009
|
| 8 |
+
],
|
| 9 |
+
"temperature": 0.6,
|
| 10 |
+
"top_p": 0.9,
|
| 11 |
+
"transformers_version": "4.51.0"
|
| 12 |
+
}
|
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00001-of-00062.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ab8760b57daa47a88f5e2d8f4beb1f7957d6f22bc251a188fd36773d22022a44
|
| 3 |
+
size 4806672984
|
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00002-of-00062.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:11e6d95eea8daa94a6aeb0bb3794bce82c2f7e02908d32f17e4450c27d4ba178
|
| 3 |
+
size 4362142864
|
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00003-of-00062.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:863f478048f60de0a6c80f898290f8d4c0645679c66ee0d8df270c708ad538d8
|
| 3 |
+
size 4362142864
|
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00004-of-00062.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:846697b30627f924e14de749879665d9ab0a9c288480be3ee2ce8889975cff64
|
| 3 |
+
size 4966188864
|
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00005-of-00062.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d720ec4fa58eb8ea4caa8724bedb1797ae2069bc30b6fa4fb0b87f61b7962fe0
|
| 3 |
+
size 4362142864
|
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00006-of-00062.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a423dcb8bd0a72cc95e5b232cbbfd8dc3e6a8b0208e1e3cd07e792eab7b18884
|
| 3 |
+
size 4362142864
|
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00007-of-00062.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0e1205cc6a0494010b4ee729f1477431a8c2e5a954bdac498cf42767d3f2d077
|
| 3 |
+
size 4966188864
|
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00008-of-00062.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:341aae64f6f692f6376dfa089a41c27099de668487ac6459405d5b08c595828e
|
| 3 |
+
size 4362142864
|
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00009-of-00062.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:54103b1c2e7b751ddd66d7b130b4a866509dd886ed1cf843eee0e88443a2146f
|
| 3 |
+
size 4362142880
|
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00010-of-00062.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bdc56f71aac4f12d91ab4a89d6361effef2e9a1ac9b795680834c77c5eb9a14f
|
| 3 |
+
size 4966188880
|
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00011-of-00062.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:79f7b7a720826bc464f01881f25dad3cbec0159bca6fb51a95ea438031400e82
|
| 3 |
+
size 4362142872
|
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00012-of-00062.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e0a2b680b622b1324cdbc42009e05a3176bc13dcab8e2a23b83aeb30b221babd
|
| 3 |
+
size 4362142872
|
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00013-of-00062.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:418ee77d381c8551cf6d2f56654903a69e79d7f7db9664ff249588c17c484827
|
| 3 |
+
size 4966188880
|
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00014-of-00062.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3cd846be5a0e952ddd0559ce2ec69a11d3f0087f2a5e505886d1f26a0ef43cfc
|
| 3 |
+
size 4362142872
|
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00015-of-00062.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:17c04e25eba3d8adc9d0bb10b2b5e6b07c71eb6fb620561a172fe58b4571d9fe
|
| 3 |
+
size 4362142872
|
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00016-of-00062.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:69a95d6d924e13561a0647afb3afa9108581a0f7e27856ce4bbb96b9aace23a9
|
| 3 |
+
size 4966188880
|
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00017-of-00062.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f18ab0f52874637926d73372179b58a0710f9c780f90d49c2ab3c1265e2618cf
|
| 3 |
+
size 4362142872
|
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00018-of-00062.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b2a11a51abbac1d7f2fa27263ee8c2488cb82368dbadbff0ab2509fa18222684
|
| 3 |
+
size 4362142872
|
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00019-of-00062.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:16b1325b2272f4eeba5caff59c353b7bd76e300a02c2c2d5ab29dc5b9de27ae5
|
| 3 |
+
size 4966188880
|
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00020-of-00062.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bbfb4c73df9f7e63376e2a36836d15a38707147bc2331a2401ea2082936248af
|
| 3 |
+
size 4362142872
|
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00021-of-00062.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e337a2a22db38640ded42255c725fd39d9ced4e2d2815578e4001d5fdd947646
|
| 3 |
+
size 4362142872
|
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00022-of-00062.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b8906e6ab5e8c39c6549a06a37ac37f974d1faa5fb22c3a0239bf352d1b8f017
|
| 3 |
+
size 4966188880
|
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00023-of-00062.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fb57b2f1f57fd6a9072383d5e0118adfecdff1a9a568c108120c5fa46faf2b70
|
| 3 |
+
size 4362142872
|
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00024-of-00062.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a97d8d8812560d4aa90d5470c841bbcbb3f82ffc24920960fb03f1f110374fff
|
| 3 |
+
size 4362142872
|
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00025-of-00062.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cb98edee2bb755f367a4c55221376551afc70aa4aab02be2104b61f603d4e6b6
|
| 3 |
+
size 4966188880
|
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00026-of-00062.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7d64edc6bfdcbf2eb87b1ae7a5ab97e7b3c9c5661d3aff7fbb948e30f6f63d4b
|
| 3 |
+
size 4362142872
|
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00027-of-00062.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:599afebc5a4582a0f42d93dbf9a2b42083c1714762cc14f6f4becdcbada90d57
|
| 3 |
+
size 4362142872
|
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00028-of-00062.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:58f653671a01ce3b3f6d4941a152b229402aca491c989dd10c8ccca4307cc0a2
|
| 3 |
+
size 4966188880
|
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00029-of-00062.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a57bcab2c26c59be85a49ec9e0505ff3948b52453e82c1e9bd35cd9d0de4c0a5
|
| 3 |
+
size 4362142872
|
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00030-of-00062.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:068e6407c53f010f334e7012f17c2671e131b080dd9252b9e7a11590edf98340
|
| 3 |
+
size 4362142872
|
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00031-of-00062.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f2a7fbd100427bdcc996fd4ec5c202004ca39410b5d53c2fc4c67202ec9b7f15
|
| 3 |
+
size 4966188880
|
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00032-of-00062.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:624f42db0fc067e6c7e6fd505c5e16ef88b6c5325767a3bb6e6752f72c204c70
|
| 3 |
+
size 4362142872
|
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00033-of-00062.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5541b70eb08131392b128720ad687875bf0e3bc6ade9d2cc7b24f2eb6a28de29
|
| 3 |
+
size 4362142872
|
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00034-of-00062.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:79895877421507febb66cf43bc3fb8662b3775a652ae84d88aa5f1bd2ba55326
|
| 3 |
+
size 4966188880
|
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00035-of-00062.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9018f3055282147860a087627e7bdf57187f9a41e97f4e804833bc8b649af46d
|
| 3 |
+
size 4362142872
|
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00036-of-00062.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2840f6aee3cf841f6dd1379b36485d3ed3161f7c0e630b1c27bec4adb47665d9
|
| 3 |
+
size 4362142872
|
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00037-of-00062.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:020a17c50b60dcb3b01491c651285c3b9ebd76af126fd17c23ba249bd1b27f11
|
| 3 |
+
size 4966188880
|
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00038-of-00062.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:87330900bfa02c6a4d54d5e693dbfb0044d9a9cae41f2c4c82d790e4bd5a2b41
|
| 3 |
+
size 4362142872
|
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00039-of-00062.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e05289f90da632c426dce5c6ec9faed6e2d139fee0cfaca8693e798c84cfe236
|
| 3 |
+
size 4362142872
|
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00040-of-00062.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2324cb9bc2ce4cbf955c4360032cdda2fe2003856721d834783359ca9bab18e5
|
| 3 |
+
size 4966188880
|
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00041-of-00062.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7f70749d4091e550548364f275e620dc3d7742477ae75e7e7239e1494aa880ad
|
| 3 |
+
size 4362142872
|
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00042-of-00062.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:93eeb5af13001151698ca6700c507061f123d45e81ed840d325084c0d82ecc2a
|
| 3 |
+
size 4362142872
|
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00043-of-00062.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7ad00977bc50bcb91b9aa64bdf584fcf0df19f32b93868a31896e6e6c2e30073
|
| 3 |
+
size 4966188880
|
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00044-of-00062.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:59c63984af21ce45427ef3d25d92d6e0326b27b1fea133b7b6231fd0c1d11b5a
|
| 3 |
+
size 4362142872
|
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00045-of-00062.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f65352030885661ece8223e5b9e1d79a7f4b147ef6b59ab787d0063ea5cac152
|
| 3 |
+
size 4362142872
|
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00046-of-00062.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bd50676af6d253ed68495785424fcdc2517ea050baff2184d99cf30c2b42016e
|
| 3 |
+
size 4966188880
|
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00047-of-00062.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:11f867eb6b955a77ed6cc79fcd3f7a9607f56529497eeb9336f961a287a844b4
|
| 3 |
+
size 4362142872
|