Model save

Files changed (6) hide show

README.md CHANGED Viewed

@@ -27,7 +27,7 @@ print(output["generated_text"])
 ## Training procedure
-[<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="150" height="24"/>](https://wandb.ai/yknxxh-seoul-national-university/huggingface/runs/871radgp)
 This model was trained with SFT.

 ## Training procedure
+[<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="150" height="24"/>](https://wandb.ai/yknxxh-seoul-national-university/huggingface/runs/wjpxhixe)
 This model was trained with SFT.

all_results.json CHANGED Viewed

@@ -2,8 +2,8 @@
     "epoch": 0.96,
     "total_flos": 96668442181632.0,
     "train_loss": 3.916761557261149,
-    "train_runtime": 4.5312,
     "train_samples": 100,
-    "train_samples_per_second": 22.069,
-    "train_steps_per_second": 1.324
 }

     "epoch": 0.96,
     "total_flos": 96668442181632.0,
     "train_loss": 3.916761557261149,
+    "train_runtime": 4.2749,
     "train_samples": 100,
+    "train_samples_per_second": 23.392,
+    "train_steps_per_second": 1.404
 }

runs/Feb09_15-41-09_yekyung-nah-0/events.out.tfevents.1739083280.yekyung-nah-0.118709.0 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:d17a1a41137b51918828528f871e4b8ec726ca585e6afb22679b135472456cd9
+size 6951

train_results.json CHANGED Viewed

@@ -2,8 +2,8 @@
     "epoch": 0.96,
     "total_flos": 96668442181632.0,
     "train_loss": 3.916761557261149,
-    "train_runtime": 4.5312,
     "train_samples": 100,
-    "train_samples_per_second": 22.069,
-    "train_steps_per_second": 1.324
 }

     "epoch": 0.96,
     "total_flos": 96668442181632.0,
     "train_loss": 3.916761557261149,
+    "train_runtime": 4.2749,
     "train_samples": 100,
+    "train_samples_per_second": 23.392,
+    "train_steps_per_second": 1.404
 }

trainer_state.json CHANGED Viewed

@@ -25,9 +25,9 @@
     {
       "epoch": 0.96,
       "eval_loss": 2.263831377029419,
-      "eval_runtime": 0.0996,
-      "eval_samples_per_second": 100.398,
-      "eval_steps_per_second": 30.119,
       "step": 6
     },
     {
@@ -35,9 +35,9 @@
       "step": 6,
       "total_flos": 96668442181632.0,
       "train_loss": 3.916761557261149,
-      "train_runtime": 4.5312,
-      "train_samples_per_second": 22.069,
-      "train_steps_per_second": 1.324
     }
   ],
   "logging_steps": 5,

     {
       "epoch": 0.96,
       "eval_loss": 2.263831377029419,
+      "eval_runtime": 0.1012,
+      "eval_samples_per_second": 98.826,
+      "eval_steps_per_second": 29.648,
       "step": 6
     },
     {
       "step": 6,
       "total_flos": 96668442181632.0,
       "train_loss": 3.916761557261149,
+      "train_runtime": 4.2749,
+      "train_samples_per_second": 23.392,
+      "train_steps_per_second": 1.404
     }
   ],
   "logging_steps": 5,

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7aaa8b03d6293c40c8947039a1a14e32fb140a4dce8f833ee211be46d7bf4b95
 size 5816

 version https://git-lfs.github.com/spec/v1
+oid sha256:f16737eef625c46b4954dd8bebeedbb75c359563af0b55303c3e086d9bf229d0
 size 5816