Model save

Files changed (7) hide show

README.md CHANGED Viewed

@@ -27,7 +27,7 @@ print(output["generated_text"])
 ## Training procedure
-[<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="150" height="24"/>](https://wandb.ai/nlee28/cross1/runs/xy6a6e5k)
 This model was trained with SFT.

 ## Training procedure
+[<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="150" height="24"/>](https://wandb.ai/nlee28/cross1/runs/5v45jg0w)
 This model was trained with SFT.

all_results.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
     "total_flos": 192705258979328.0,
-    "train_loss": 0.3476698352740361,
-    "train_runtime": 3370.7423,
     "train_samples": 817,
-    "train_samples_per_second": 3.151,
     "train_steps_per_second": 0.1
 }

 {
     "total_flos": 192705258979328.0,
+    "train_loss": 0.34760819860464015,
+    "train_runtime": 3369.3955,
     "train_samples": 817,
+    "train_samples_per_second": 3.152,
     "train_steps_per_second": 0.1
 }

config.json CHANGED Viewed

@@ -22,7 +22,7 @@
   "tie_word_embeddings": false,
   "torch_dtype": "bfloat16",
   "transformers_version": "4.52.4",
-  "use_cache": true,
   "use_mrope": false,
   "use_sliding_window": false,
   "vocab_size": 151936

   "tie_word_embeddings": false,
   "torch_dtype": "bfloat16",
   "transformers_version": "4.52.4",
+  "use_cache": false,
   "use_mrope": false,
   "use_sliding_window": false,
   "vocab_size": 151936

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:76c46c0d42e828d2bf23891ab3486bfd0820576f71bf5c160c2ab689162ab81b
 size 3554214752

 version https://git-lfs.github.com/spec/v1
+oid sha256:841494b3e356a5e876134b6247ecc8b599f9393e453d3ca70404fdf1966e813d
 size 3554214752

runs/Aug13_21-47-25_al-clops-debugging-pipeline-4nn6w-ac6d-0/events.out.tfevents.1755121657.al-clops-debugging-pipeline-4nn6w-ac6d-0 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:c37b38bc5f04a5d98159c70e30b8a0646eb0177ab8d3cdb853ac7fa6a6f04a3b
+size 50487

train_results.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
     "total_flos": 192705258979328.0,
-    "train_loss": 0.3476698352740361,
-    "train_runtime": 3370.7423,
     "train_samples": 817,
-    "train_samples_per_second": 3.151,
     "train_steps_per_second": 0.1
 }

 {
     "total_flos": 192705258979328.0,
+    "train_loss": 0.34760819860464015,
+    "train_runtime": 3369.3955,
     "train_samples": 817,
+    "train_samples_per_second": 3.152,
     "train_steps_per_second": 0.1
 }

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ff519721bc58711ad03dbc5fa2d3de65f7fe106983d11e8ef6463fe7f0b0e7f6
 size 7505

 version https://git-lfs.github.com/spec/v1
+oid sha256:0bc43e6aa1b1f0a1888b53e2b762df17def16388aa2a369d322f676368ab1a4a
 size 7505