End of training

Browse files

Files changed (12) hide show

README.md +82 -0
adapter_config.json +34 -0
adapter_model.safetensors +3 -0
generation_config.json +7 -0
runs/Apr03_11-58-29_driver-77548c5448-n2rds/events.out.tfevents.1712145518.driver-77548c5448-n2rds.2740.0 +3 -0
runs/Apr03_12-25-46_driver-548f4dfd-hr96f/events.out.tfevents.1712147150.driver-548f4dfd-hr96f.3252.0 +3 -0
runs/Apr03_12-26-58_driver-548f4dfd-hr96f/events.out.tfevents.1712147222.driver-548f4dfd-hr96f.3252.1 +3 -0
runs/Apr03_12-48-23_driver-6fc58c79cc-xl4ll/events.out.tfevents.1712148511.driver-6fc58c79cc-xl4ll.3492.0 +3 -0
runs/Apr03_12-49-16_driver-6fc58c79cc-xl4ll/events.out.tfevents.1712148563.driver-6fc58c79cc-xl4ll.3492.1 +3 -0
runs/Apr03_12-49-40_driver-6fc58c79cc-xl4ll/events.out.tfevents.1712148584.driver-6fc58c79cc-xl4ll.3492.2 +3 -0
runs/Apr03_12-49-53_driver-6fc58c79cc-xl4ll/events.out.tfevents.1712148596.driver-6fc58c79cc-xl4ll.3492.3 +3 -0
training_args.bin +3 -0

README.md ADDED Viewed

	@@ -0,0 +1,82 @@

+---
+license: gemma
+base_model: google/gemma-2b-it
+tags:
+- generated_from_trainer
+model-index:
+- name: logs
+  results: []
+---
+<!-- This model card has been generated automatically according to the information the Trainer had access to. You
+should probably proofread and complete it, then remove this comment. -->
+# logs
+This model is a fine-tuned version of [google/gemma-2b-it](https://huggingface.co/google/gemma-2b-it) on an unspecified dataset (the dataset name was not recorded by the Trainer).
+It achieves the following results on the evaluation set:
+- Loss: 2.6513
+## Model description
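+This repository contains a LoRA adapter (PEFT) for causal language modeling on top of `google/gemma-2b-it`, with rank `r=64`, `lora_alpha=16`, and no LoRA dropout, applied to the `q_proj`, `k_proj`, `v_proj`, `o_proj`, `gate_proj`, `up_proj`, and `down_proj` modules. More information needed.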
+## Intended uses & limitations
+More information needed
+## Training and evaluation data
+More information needed
+## Training procedure
+### Training hyperparameters
+The following hyperparameters were used during training:
+- learning_rate: 0.0002
+- train_batch_size: 4
+- eval_batch_size: 8
+- seed: 42
+- distributed_type: multi-GPU
+- optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
+- lr_scheduler_type: cosine
+- lr_scheduler_warmup_ratio: 0.03
+- num_epochs: 2
+- mixed_precision_training: Native AMP
+### Training results
+| Training Loss | Epoch | Step | Validation Loss |
+|:-------------:|:-----:|:----:|:---------------:|
+| 3.1035        | 0.08  | 112  | 3.1213          |
+| 3.0698        | 0.17  | 224  | 3.0171          |
+| 3.0451        | 0.25  | 336  | 2.9717          |
+| 2.8939        | 0.33  | 448  | 2.9336          |
+| 2.8892        | 0.42  | 560  | 2.9099          |
+| 2.8566        | 0.5   | 672  | 2.8757          |
+| 2.8654        | 0.58  | 784  | 2.8486          |
+| 2.8261        | 0.67  | 896  | 2.8291          |
+| 2.8868        | 0.75  | 1008 | 2.7998          |
+| 2.819         | 0.84  | 1120 | 2.7781          |
+| 2.8064        | 0.92  | 1232 | 2.7543          |
+| 2.761         | 1.0   | 1344 | 2.7338          |
+| 2.3883        | 1.09  | 1456 | 2.7416          |
+| 2.3511        | 1.17  | 1568 | 2.7239          |
+| 2.3174        | 1.25  | 1680 | 2.7140          |
+| 2.3234        | 1.34  | 1792 | 2.7004          |
+| 2.3364        | 1.42  | 1904 | 2.6826          |
+| 2.3079        | 1.5   | 2016 | 2.6718          |
+| 2.2965        | 1.59  | 2128 | 2.6649          |
+| 2.2233        | 1.67  | 2240 | 2.6626          |
+| 2.2199        | 1.75  | 2352 | 2.6590          |
+| 2.3126        | 1.84  | 2464 | 2.6526          |
+| 2.2602        | 1.92  | 2576 | 2.6513          |
+### Framework versions
+- Transformers 4.39.3
+- Pytorch 2.0.0+cu117
+- Datasets 2.16.0
+- Tokenizers 0.15.0

adapter_config.json ADDED Viewed

	@@ -0,0 +1,34 @@

+{
+  "alpha_pattern": {},
+  "auto_mapping": null,
+  "base_model_name_or_path": "google/gemma-2b-it",
+  "bias": "none",
+  "fan_in_fan_out": false,
+  "inference_mode": false,
+  "init_lora_weights": true,
+  "layer_replication": null,
+  "layers_pattern": null,
+  "layers_to_transform": null,
+  "loftq_config": {},
+  "lora_alpha": 16,
+  "lora_dropout": 0,
+  "megatron_config": null,
+  "megatron_core": "megatron.core",
+  "modules_to_save": null,
+  "peft_type": "LORA",
+  "r": 64,
+  "rank_pattern": {},
+  "revision": null,
+  "target_modules": [
+    "q_proj",
+    "o_proj",
+    "gate_proj",
+    "up_proj",
+    "down_proj",
+    "k_proj",
+    "v_proj"
+  ],
+  "task_type": "CAUSAL_LM",
+  "use_dora": false,
+  "use_rslora": false
+}

adapter_model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ebbcd8f654f927a34934eeff1e3790bd92a88fb72dd137865e276a51b69cc47f
+size 313820248

generation_config.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "_from_model_config": true,
+  "bos_token_id": 2,
+  "eos_token_id": 1,
+  "pad_token_id": 0,
+  "transformers_version": "4.39.3"
+}

runs/Apr03_11-58-29_driver-77548c5448-n2rds/events.out.tfevents.1712145518.driver-77548c5448-n2rds.2740.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1769e9da4dcd2b6afd3b2a81da0146af8029c5274872dde0b95013082b322e10
+size 4184

runs/Apr03_12-25-46_driver-548f4dfd-hr96f/events.out.tfevents.1712147150.driver-548f4dfd-hr96f.3252.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:bb8ad484568e443b89f4832f4a72c4634305db529b09213ac78187f34bd4fbf8
+size 5120

runs/Apr03_12-26-58_driver-548f4dfd-hr96f/events.out.tfevents.1712147222.driver-548f4dfd-hr96f.3252.1 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b8f686df8aea92f417160da9c1a4cccdc37b74d63162784888459eb80c0c0881
+size 5120

runs/Apr03_12-48-23_driver-6fc58c79cc-xl4ll/events.out.tfevents.1712148511.driver-6fc58c79cc-xl4ll.3492.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d3a27cf99d2bcfdf744e24452d5a46a16b8c2fd749785dc057229b9fc58c1ace
+size 5536

runs/Apr03_12-49-16_driver-6fc58c79cc-xl4ll/events.out.tfevents.1712148563.driver-6fc58c79cc-xl4ll.3492.1 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a610fa6d74cfaec0ff0b01ab3d7c79bb95888ac9913d5322263ad800a02d7b9e
+size 5123

runs/Apr03_12-49-40_driver-6fc58c79cc-xl4ll/events.out.tfevents.1712148584.driver-6fc58c79cc-xl4ll.3492.2 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d9f4b80d4b764117a414ba46ecd29befb7de6428cc34a8bf9f72ea5d3bbe561d
+size 5122

runs/Apr03_12-49-53_driver-6fc58c79cc-xl4ll/events.out.tfevents.1712148596.driver-6fc58c79cc-xl4ll.3492.3 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b9310b3ff65cbb7418c600d26fd6bf9ee84c81590c0ff07c022a30d389024348
+size 34261

training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:68d94773e611d4d24e7daadeb2d9303f9264db5cdb756290b354112e92f8687a
+size 4411