lyy666666 committed on
Commit
1eff3cf
·
verified ·
1 Parent(s): 2baa25e

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .gitattributes +1 -0
  2. tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/config.json +39 -0
  3. tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/generation_config.json +12 -0
  4. tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00001-of-00062.safetensors +3 -0
  5. tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00002-of-00062.safetensors +3 -0
  6. tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00003-of-00062.safetensors +3 -0
  7. tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00004-of-00062.safetensors +3 -0
  8. tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00005-of-00062.safetensors +3 -0
  9. tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00006-of-00062.safetensors +3 -0
  10. tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00007-of-00062.safetensors +3 -0
  11. tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00008-of-00062.safetensors +3 -0
  12. tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00009-of-00062.safetensors +3 -0
  13. tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00010-of-00062.safetensors +3 -0
  14. tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00011-of-00062.safetensors +3 -0
  15. tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00012-of-00062.safetensors +3 -0
  16. tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00013-of-00062.safetensors +3 -0
  17. tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00014-of-00062.safetensors +3 -0
  18. tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00015-of-00062.safetensors +3 -0
  19. tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00016-of-00062.safetensors +3 -0
  20. tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00017-of-00062.safetensors +3 -0
  21. tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00018-of-00062.safetensors +3 -0
  22. tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00019-of-00062.safetensors +3 -0
  23. tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00020-of-00062.safetensors +3 -0
  24. tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00021-of-00062.safetensors +3 -0
  25. tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00022-of-00062.safetensors +3 -0
  26. tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00023-of-00062.safetensors +3 -0
  27. tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00024-of-00062.safetensors +3 -0
  28. tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00025-of-00062.safetensors +3 -0
  29. tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00026-of-00062.safetensors +3 -0
  30. tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00027-of-00062.safetensors +3 -0
  31. tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00028-of-00062.safetensors +3 -0
  32. tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00029-of-00062.safetensors +3 -0
  33. tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00030-of-00062.safetensors +3 -0
  34. tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00031-of-00062.safetensors +3 -0
  35. tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00032-of-00062.safetensors +3 -0
  36. tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00033-of-00062.safetensors +3 -0
  37. tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00034-of-00062.safetensors +3 -0
  38. tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00035-of-00062.safetensors +3 -0
  39. tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00036-of-00062.safetensors +3 -0
  40. tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00037-of-00062.safetensors +3 -0
  41. tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00038-of-00062.safetensors +3 -0
  42. tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00039-of-00062.safetensors +3 -0
  43. tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00040-of-00062.safetensors +3 -0
  44. tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00041-of-00062.safetensors +3 -0
  45. tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00042-of-00062.safetensors +3 -0
  46. tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00043-of-00062.safetensors +3 -0
  47. tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00044-of-00062.safetensors +3 -0
  48. tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00045-of-00062.safetensors +3 -0
  49. tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00046-of-00062.safetensors +3 -0
  50. tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00047-of-00062.safetensors +3 -0
.gitattributes CHANGED
@@ -150,3 +150,4 @@ kud-llama3.3-70b_biology_leaf_relearn_klr_gdr_biology_1_512_2e-5/checkpoint-1/to
150
  kud-llama3.3-70b_biology_leaf_relearn_klr_gdr_biology_1_512_2e-5/tokenizer.json filter=lfs diff=lfs merge=lfs -text
151
  kud-llama3.3-70b_biology_leaf_relearn_klr_gdr_biology_10_512_2e-5/checkpoint-1/tokenizer.json filter=lfs diff=lfs merge=lfs -text
152
  kud-llama3.3-70b_biology_leaf_relearn_klr_gdr_biology_10_512_2e-5/tokenizer.json filter=lfs diff=lfs merge=lfs -text
 
 
150
  kud-llama3.3-70b_biology_leaf_relearn_klr_gdr_biology_1_512_2e-5/tokenizer.json filter=lfs diff=lfs merge=lfs -text
151
  kud-llama3.3-70b_biology_leaf_relearn_klr_gdr_biology_10_512_2e-5/checkpoint-1/tokenizer.json filter=lfs diff=lfs merge=lfs -text
152
  kud-llama3.3-70b_biology_leaf_relearn_klr_gdr_biology_10_512_2e-5/tokenizer.json filter=lfs diff=lfs merge=lfs -text
153
+ tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/tokenizer.json filter=lfs diff=lfs merge=lfs -text
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/config.json ADDED
@@ -0,0 +1,39 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "LlamaForCausalLM"
4
+ ],
5
+ "attention_bias": false,
6
+ "attention_dropout": 0.0,
7
+ "bos_token_id": 128000,
8
+ "eos_token_id": [
9
+ 128001,
10
+ 128008,
11
+ 128009
12
+ ],
13
+ "head_dim": 128,
14
+ "hidden_act": "silu",
15
+ "hidden_size": 8192,
16
+ "initializer_range": 0.02,
17
+ "intermediate_size": 28672,
18
+ "max_position_embeddings": 131072,
19
+ "mlp_bias": false,
20
+ "model_type": "llama",
21
+ "num_attention_heads": 64,
22
+ "num_hidden_layers": 80,
23
+ "num_key_value_heads": 8,
24
+ "pretraining_tp": 1,
25
+ "rms_norm_eps": 1e-05,
26
+ "rope_scaling": {
27
+ "factor": 8.0,
28
+ "high_freq_factor": 4.0,
29
+ "low_freq_factor": 1.0,
30
+ "original_max_position_embeddings": 8192,
31
+ "rope_type": "llama3"
32
+ },
33
+ "rope_theta": 500000.0,
34
+ "tie_word_embeddings": false,
35
+ "torch_dtype": "float32",
36
+ "transformers_version": "4.51.0",
37
+ "use_cache": true,
38
+ "vocab_size": 128256
39
+ }
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/generation_config.json ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token_id": 128000,
3
+ "do_sample": true,
4
+ "eos_token_id": [
5
+ 128001,
6
+ 128008,
7
+ 128009
8
+ ],
9
+ "temperature": 0.6,
10
+ "top_p": 0.9,
11
+ "transformers_version": "4.51.0"
12
+ }
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00001-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab8760b57daa47a88f5e2d8f4beb1f7957d6f22bc251a188fd36773d22022a44
3
+ size 4806672984
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00002-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:11e6d95eea8daa94a6aeb0bb3794bce82c2f7e02908d32f17e4450c27d4ba178
3
+ size 4362142864
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00003-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:863f478048f60de0a6c80f898290f8d4c0645679c66ee0d8df270c708ad538d8
3
+ size 4362142864
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00004-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:846697b30627f924e14de749879665d9ab0a9c288480be3ee2ce8889975cff64
3
+ size 4966188864
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00005-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d720ec4fa58eb8ea4caa8724bedb1797ae2069bc30b6fa4fb0b87f61b7962fe0
3
+ size 4362142864
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00006-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a423dcb8bd0a72cc95e5b232cbbfd8dc3e6a8b0208e1e3cd07e792eab7b18884
3
+ size 4362142864
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00007-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0e1205cc6a0494010b4ee729f1477431a8c2e5a954bdac498cf42767d3f2d077
3
+ size 4966188864
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00008-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:341aae64f6f692f6376dfa089a41c27099de668487ac6459405d5b08c595828e
3
+ size 4362142864
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00009-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:54103b1c2e7b751ddd66d7b130b4a866509dd886ed1cf843eee0e88443a2146f
3
+ size 4362142880
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00010-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bdc56f71aac4f12d91ab4a89d6361effef2e9a1ac9b795680834c77c5eb9a14f
3
+ size 4966188880
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00011-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:79f7b7a720826bc464f01881f25dad3cbec0159bca6fb51a95ea438031400e82
3
+ size 4362142872
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00012-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e0a2b680b622b1324cdbc42009e05a3176bc13dcab8e2a23b83aeb30b221babd
3
+ size 4362142872
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00013-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:418ee77d381c8551cf6d2f56654903a69e79d7f7db9664ff249588c17c484827
3
+ size 4966188880
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00014-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3cd846be5a0e952ddd0559ce2ec69a11d3f0087f2a5e505886d1f26a0ef43cfc
3
+ size 4362142872
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00015-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:17c04e25eba3d8adc9d0bb10b2b5e6b07c71eb6fb620561a172fe58b4571d9fe
3
+ size 4362142872
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00016-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:69a95d6d924e13561a0647afb3afa9108581a0f7e27856ce4bbb96b9aace23a9
3
+ size 4966188880
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00017-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f18ab0f52874637926d73372179b58a0710f9c780f90d49c2ab3c1265e2618cf
3
+ size 4362142872
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00018-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b2a11a51abbac1d7f2fa27263ee8c2488cb82368dbadbff0ab2509fa18222684
3
+ size 4362142872
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00019-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:16b1325b2272f4eeba5caff59c353b7bd76e300a02c2c2d5ab29dc5b9de27ae5
3
+ size 4966188880
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00020-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bbfb4c73df9f7e63376e2a36836d15a38707147bc2331a2401ea2082936248af
3
+ size 4362142872
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00021-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e337a2a22db38640ded42255c725fd39d9ced4e2d2815578e4001d5fdd947646
3
+ size 4362142872
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00022-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b8906e6ab5e8c39c6549a06a37ac37f974d1faa5fb22c3a0239bf352d1b8f017
3
+ size 4966188880
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00023-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb57b2f1f57fd6a9072383d5e0118adfecdff1a9a568c108120c5fa46faf2b70
3
+ size 4362142872
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00024-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a97d8d8812560d4aa90d5470c841bbcbb3f82ffc24920960fb03f1f110374fff
3
+ size 4362142872
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00025-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cb98edee2bb755f367a4c55221376551afc70aa4aab02be2104b61f603d4e6b6
3
+ size 4966188880
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00026-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7d64edc6bfdcbf2eb87b1ae7a5ab97e7b3c9c5661d3aff7fbb948e30f6f63d4b
3
+ size 4362142872
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00027-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:599afebc5a4582a0f42d93dbf9a2b42083c1714762cc14f6f4becdcbada90d57
3
+ size 4362142872
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00028-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:58f653671a01ce3b3f6d4941a152b229402aca491c989dd10c8ccca4307cc0a2
3
+ size 4966188880
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00029-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a57bcab2c26c59be85a49ec9e0505ff3948b52453e82c1e9bd35cd9d0de4c0a5
3
+ size 4362142872
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00030-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:068e6407c53f010f334e7012f17c2671e131b080dd9252b9e7a11590edf98340
3
+ size 4362142872
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00031-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f2a7fbd100427bdcc996fd4ec5c202004ca39410b5d53c2fc4c67202ec9b7f15
3
+ size 4966188880
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00032-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:624f42db0fc067e6c7e6fd505c5e16ef88b6c5325767a3bb6e6752f72c204c70
3
+ size 4362142872
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00033-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5541b70eb08131392b128720ad687875bf0e3bc6ade9d2cc7b24f2eb6a28de29
3
+ size 4362142872
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00034-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:79895877421507febb66cf43bc3fb8662b3775a652ae84d88aa5f1bd2ba55326
3
+ size 4966188880
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00035-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9018f3055282147860a087627e7bdf57187f9a41e97f4e804833bc8b649af46d
3
+ size 4362142872
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00036-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2840f6aee3cf841f6dd1379b36485d3ed3161f7c0e630b1c27bec4adb47665d9
3
+ size 4362142872
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00037-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:020a17c50b60dcb3b01491c651285c3b9ebd76af126fd17c23ba249bd1b27f11
3
+ size 4966188880
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00038-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:87330900bfa02c6a4d54d5e693dbfb0044d9a9cae41f2c4c82d790e4bd5a2b41
3
+ size 4362142872
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00039-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e05289f90da632c426dce5c6ec9faed6e2d139fee0cfaca8693e798c84cfe236
3
+ size 4362142872
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00040-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2324cb9bc2ce4cbf955c4360032cdda2fe2003856721d834783359ca9bab18e5
3
+ size 4966188880
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00041-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f70749d4091e550548364f275e620dc3d7742477ae75e7e7239e1494aa880ad
3
+ size 4362142872
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00042-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:93eeb5af13001151698ca6700c507061f123d45e81ed840d325084c0d82ecc2a
3
+ size 4362142872
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00043-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7ad00977bc50bcb91b9aa64bdf584fcf0df19f32b93868a31896e6e6c2e30073
3
+ size 4966188880
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00044-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:59c63984af21ce45427ef3d25d92d6e0326b27b1fea133b7b6231fd0c1d11b5a
3
+ size 4362142872
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00045-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f65352030885661ece8223e5b9e1d79a7f4b147ef6b59ab787d0063ea5cac152
3
+ size 4362142872
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00046-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd50676af6d253ed68495785424fcdc2517ea050baff2184d99cf30c2b42016e
3
+ size 4966188880
tmp/kud-llama3.3-70b_history_leaf_relearn_klr_gdr_history_10000_512_2e-5/checkpoint-1250-full/model-00047-of-00062.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:11f867eb6b955a77ed6cc79fcd3f7a9607f56529497eeb9336f961a287a844b4
3
+ size 4362142872