Model save

Files changed (5) hide show

adapter_config.json CHANGED Viewed

@@ -21,12 +21,12 @@
   "revision": null,
   "target_modules": [
     "v_proj",
-    "o_proj",
     "k_proj",
     "down_proj",
-    "up_proj",
-    "q_proj",
-    "gate_proj"
   ],
   "task_type": "CAUSAL_LM",
   "use_dora": false,

   "revision": null,
   "target_modules": [
     "v_proj",
+    "q_proj",
+    "gate_proj",
     "k_proj",
+    "o_proj",
     "down_proj",
+    "up_proj"
   ],
   "task_type": "CAUSAL_LM",
   "use_dora": false,

all_results.json CHANGED Viewed

@@ -2,8 +2,8 @@
     "epoch": 1.0,
     "total_flos": 0.0,
     "train_loss": 0.0,
-    "train_runtime": 0.0069,
     "train_samples": 20000,
-    "train_samples_per_second": 2900725.475,
-    "train_steps_per_second": 181295.342
 }

     "epoch": 1.0,
     "total_flos": 0.0,
     "train_loss": 0.0,
+    "train_runtime": 0.0105,
     "train_samples": 20000,
+    "train_samples_per_second": 1898476.441,
+    "train_steps_per_second": 118654.778
 }

train_results.json CHANGED Viewed

@@ -2,8 +2,8 @@
     "epoch": 1.0,
     "total_flos": 0.0,
     "train_loss": 0.0,
-    "train_runtime": 0.0069,
     "train_samples": 20000,
-    "train_samples_per_second": 2900725.475,
-    "train_steps_per_second": 181295.342
 }

     "epoch": 1.0,
     "total_flos": 0.0,
     "train_loss": 0.0,
+    "train_runtime": 0.0105,
     "train_samples": 20000,
+    "train_samples_per_second": 1898476.441,
+    "train_steps_per_second": 118654.778
 }

trainer_state.json CHANGED Viewed

@@ -3970,9 +3970,9 @@
       "step": 1250,
       "total_flos": 0.0,
       "train_loss": 0.0,
-      "train_runtime": 0.0069,
-      "train_samples_per_second": 2900725.475,
-      "train_steps_per_second": 181295.342
     }
   ],
   "logging_steps": 5,

       "step": 1250,
       "total_flos": 0.0,
       "train_loss": 0.0,
+      "train_runtime": 0.0105,
+      "train_samples_per_second": 1898476.441,
+      "train_steps_per_second": 118654.778
     }
   ],
   "logging_steps": 5,

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:eb2a38aa27b8c8dede634e556cdce1523f6cce7ce69726d505dc21c0ad9a1925
 size 6200

 version https://git-lfs.github.com/spec/v1
+oid sha256:dc5b53ff73df66c7260b82ecb294a63bdca90dc2d9429f032457138df19f2d95
 size 6200