vinallama_fine_tune_test

Files changed (7) hide show

README.md CHANGED Viewed

@@ -35,13 +35,13 @@ More information needed
 The following hyperparameters were used during training:
 - learning_rate: 2.5e-05
 - train_batch_size: 8
-- eval_batch_size: 2
 - seed: 42
 - gradient_accumulation_steps: 4
 - total_train_batch_size: 32
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: linear
-- training_steps: 200
 - mixed_precision_training: Native AMP
 ### Training results

 The following hyperparameters were used during training:
 - learning_rate: 2.5e-05
 - train_batch_size: 8
+- eval_batch_size: 32
 - seed: 42
 - gradient_accumulation_steps: 4
 - total_train_batch_size: 32
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: linear
+- training_steps: 100
 - mixed_precision_training: Native AMP
 ### Training results

adapter_config.json CHANGED Viewed

@@ -23,8 +23,8 @@
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
-    "q_proj",
-    "v_proj"
   ],
   "task_type": null,
   "use_dora": false,

   "rank_pattern": {},
   "revision": null,
   "target_modules": [
+    "v_proj",
+    "q_proj"
   ],
   "task_type": null,
   "use_dora": false,

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9ee1afae0891d5b930a7321ccadccc5d48fb681757bb5b4768aba25267527725
 size 10502640

 version https://git-lfs.github.com/spec/v1
+oid sha256:043d23bf70c3022a9880c507d9f89b134d581ebee7d158fce04f804a6ef106fb
 size 10502640

special_tokens_map.json CHANGED Viewed

@@ -13,13 +13,7 @@
     "rstrip": false,
     "single_word": false
   },
-  "pad_token": {
-    "content": "<pad>",
-    "lstrip": false,
-    "normalized": false,
-    "rstrip": false,
-    "single_word": false
-  },
   "unk_token": {
     "content": "<unk>",
     "lstrip": false,

     "rstrip": false,
     "single_word": false
   },
+  "pad_token": "<|im_end|>",
   "unk_token": {
     "content": "<unk>",
     "lstrip": false,

tokenizer.json CHANGED Viewed

@@ -12,9 +12,9 @@
     },
     "direction": "Right",
     "pad_to_multiple_of": null,
-    "pad_id": 46303,
     "pad_type_id": 0,
-    "pad_token": "<pad>"
   },
   "added_tokens": [
     {

     },
     "direction": "Right",
     "pad_to_multiple_of": null,
+    "pad_id": 46304,
     "pad_type_id": 0,
+    "pad_token": "<|im_end|>"
   },
   "added_tokens": [
     {

tokenizer_config.json CHANGED Viewed

@@ -56,7 +56,7 @@
   "eos_token": "<|im_end|>",
   "legacy": false,
   "model_max_length": 1000000000000000019884624838656,
-  "pad_token": "<pad>",
   "padding_side": "right",
   "sp_model_kwargs": {},
   "tokenizer_class": "LlamaTokenizer",

   "eos_token": "<|im_end|>",
   "legacy": false,
   "model_max_length": 1000000000000000019884624838656,
+  "pad_token": "<|im_end|>",
   "padding_side": "right",
   "sp_model_kwargs": {},
   "tokenizer_class": "LlamaTokenizer",

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3afac9650910a8011568713c10c52c43da4f662953a2fb5f88d961addab4b55f
 size 4856

 version https://git-lfs.github.com/spec/v1
+oid sha256:06efba0e0cd05edac47a4783d151793b8eab3181f8808b37ba0db275e97e19a7
 size 4856