Upload model

Files changed (4) hide show

README.md CHANGED Viewed

@@ -1,5 +1,5 @@
 ---
-base_model: bigcode/starcoder2-7b
 library_name: transformers
 model_name: finetune_starcoder2
 tags:
@@ -11,7 +11,7 @@ licence: license
 # Model Card for finetune_starcoder2
-This model is a fine-tuned version of [bigcode/starcoder2-7b](https://huggingface.co/bigcode/starcoder2-7b).
 It has been trained using [TRL](https://github.com/huggingface/trl).
 ## Quick start
@@ -27,7 +27,7 @@ print(output["generated_text"])
 ## Training procedure
-[<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="150" height="24"/>](https://wandb.ai/roham-koohestani/huggingface/runs/lskxusrv)
 This model was trained with SFT.

 ---
+base_model: bigcode/starcoder2-15b
 library_name: transformers
 model_name: finetune_starcoder2
 tags:
 # Model Card for finetune_starcoder2
+This model is a fine-tuned version of [bigcode/starcoder2-15b](https://huggingface.co/bigcode/starcoder2-15b).
 It has been trained using [TRL](https://github.com/huggingface/trl).
 ## Quick start
 ## Training procedure
+[<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="150" height="24"/>](https://wandb.ai/roham-koohestani/huggingface/runs/3ryf9ebs)
 This model was trained with SFT.

adapter_config.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
   "alpha_pattern": {},
   "auto_mapping": null,
-  "base_model_name_or_path": "bigcode/starcoder2-7b",
   "bias": "none",
   "fan_in_fan_out": false,
   "inference_mode": true,
@@ -19,13 +19,13 @@
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
-    "gate_proj",
-    "down_proj",
-    "q_proj",
     "k_proj",
-    "v_proj",
     "up_proj",
-    "o_proj"
   ],
   "task_type": "CAUSAL_LM",
   "use_rslora": false

 {
   "alpha_pattern": {},
   "auto_mapping": null,
+  "base_model_name_or_path": "bigcode/starcoder2-15b",
   "bias": "none",
   "fan_in_fan_out": false,
   "inference_mode": true,
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
     "k_proj",
+    "o_proj",
+    "q_proj",
     "up_proj",
+    "v_proj",
+    "gate_proj",
+    "down_proj"
   ],
   "task_type": "CAUSAL_LM",
   "use_rslora": false

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f308bb7940b210b74980f43cf63b220d87cdea17008ecd11c61b3724bdc43fd0
-size 29394136

 version https://git-lfs.github.com/spec/v1
+oid sha256:3396e5b09204b736c2df744616e762d4fadbfe22056cec3f2bfb4cffb32ebab8
+size 48539256

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:35b727aaf1805ad9e94a6f7eab28696d1c71fab4d4a112c6acf811c7f7bfc5c2
 size 5496

 version https://git-lfs.github.com/spec/v1
+oid sha256:0e5c1cc5abf22171287110ec5c0234d89ed2d8c24eb5f1ac9e449c91f84efbb7
 size 5496