OumaymaeELBIACH/Llama-3.2-1B

Files changed (13) hide show

README.md CHANGED Viewed

@@ -27,17 +27,18 @@ print(output["generated_text"])
 ## Training procedure
 This model was trained with SFT.
 ### Framework versions
-- TRL: 0.12.1
-- Transformers: 4.47.0.dev0
 - Pytorch: 2.5.1+cu121
-- Datasets: 3.1.0
-- Tokenizers: 0.20.3
 ## Citations

 ## Training procedure
 This model was trained with SFT.
 ### Framework versions
+- TRL: 0.13.0
+- Transformers: 4.48.0.dev0
 - Pytorch: 2.5.1+cu121
+- Datasets: 3.2.0
+- Tokenizers: 0.21.0
 ## Citations

adapter_config.json CHANGED Viewed

@@ -1,8 +1,10 @@
 {
   "alpha_pattern": {},
   "auto_mapping": null,
-  "base_model_name_or_path": "meta-llama/Llama-3.2-1B",
   "bias": "none",
   "fan_in_fan_out": false,
   "inference_mode": true,
   "init_lora_weights": true,
@@ -11,16 +13,22 @@
   "layers_to_transform": null,
   "loftq_config": {},
   "lora_alpha": 16,
-  "lora_dropout": 0.01,
   "megatron_config": null,
   "megatron_core": "megatron.core",
   "modules_to_save": null,
   "peft_type": "LORA",
-  "r": 64,
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
     "v_proj",
     "q_proj"
   ],
   "task_type": "CAUSAL_LM",

 {
   "alpha_pattern": {},
   "auto_mapping": null,
+  "base_model_name_or_path": null,
   "bias": "none",
+  "eva_config": null,
+  "exclude_modules": null,
   "fan_in_fan_out": false,
   "inference_mode": true,
   "init_lora_weights": true,
   "layers_to_transform": null,
   "loftq_config": {},
   "lora_alpha": 16,
+  "lora_bias": false,
+  "lora_dropout": 0.05,
   "megatron_config": null,
   "megatron_core": "megatron.core",
   "modules_to_save": null,
   "peft_type": "LORA",
+  "r": 32,
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
+    "k_proj",
+    "down_proj",
     "v_proj",
+    "gate_proj",
+    "o_proj",
+    "up_proj",
     "q_proj"
   ],
   "task_type": "CAUSAL_LM",

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:85f7a406b86ad48dfe0dcc2e29bb7998542ad32de42e43384d715c625d202510
-size 27271552

 version https://git-lfs.github.com/spec/v1
+oid sha256:2f1899b3a34b3ffdf37183d38ab11eeefc73aa1f2ae8d73109040919444d8822
+size 90211056

runs/Dec28_11-57-34_98a9f987451e/events.out.tfevents.1735387732.98a9f987451e.2637.0 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:8e466a087bffc2ad40dc4fd84cb55a32bc001d9cc164a01db4d9b91fee4cd72e
+size 12293

runs/Dec28_12-28-31_98a9f987451e/events.out.tfevents.1735388922.98a9f987451e.2637.1 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:b83c2ce77315e2d776e16dbe8f7f32fcc83aeacb18f2a203324763f0dc7e13d8
+size 7150

runs/Dec28_12-29-45_98a9f987451e/events.out.tfevents.1735388992.98a9f987451e.2637.2 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:17252feaf7c9b17abab8422f2c5eeb676a4acae7c766f3228799c53a6fcdb390
+size 8612

runs/Dec28_12-29-45_98a9f987451e/events.out.tfevents.1735389115.98a9f987451e.2637.3 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:dfbde96b7e45728f75cab444baf508a45a70924565b5e3ef42f6a12f917c0b23
+size 359

runs/Dec28_12-32-30_98a9f987451e/events.out.tfevents.1735389169.98a9f987451e.2637.4 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:a73a075a3e5678126ba5bf5e26e3bfffe05470451b8038a63c4e4c4c5c83a579
+size 8065

runs/Dec28_12-39-31_98a9f987451e/events.out.tfevents.1735389580.98a9f987451e.2637.5 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:559d9230cfeae739d7a86a67544741c27ad795cba81c41205fed7c4c78570be7
+size 9338

runs/Dec28_12-41-49_98a9f987451e/events.out.tfevents.1735389720.98a9f987451e.2637.6 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:a3758a15f9334ec76ab869a8a181c2aa0fd05e70fb51da3fa61d2edccdb5b977
+size 12293

runs/Dec28_12-41-49_98a9f987451e/events.out.tfevents.1735389915.98a9f987451e.2637.7 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:3875ac9ee87bd9d91c53556ec4098e52289b70f604048e781a0874507272e11f
+size 359

tokenizer_config.json CHANGED Viewed

@@ -2057,7 +2057,7 @@
     "input_ids",
     "attention_mask"
   ],
-  "model_max_length": 131072,
   "pad_token": "<|end_of_text|>",
   "tokenizer_class": "PreTrainedTokenizerFast"
 }

     "input_ids",
     "attention_mask"
   ],
+  "model_max_length": 512,
   "pad_token": "<|end_of_text|>",
   "tokenizer_class": "PreTrainedTokenizerFast"
 }

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ff3c5fb17ab9fed6d5dbff5a72aa2f2a65a67faaecf79dd12a2e26047356773c
 size 5560

 version https://git-lfs.github.com/spec/v1
+oid sha256:e25a9f108a56883d0624e13cab53d79daed3fb00f5e4e0d0bc3415a753fa4ac0
 size 5560