jkazdan committed on
Commit
526335a
·
verified ·
1 Parent(s): 85afdfd

jkazdan/gemma-2-9b-it-refusal-trial-2

Browse files
README.md CHANGED
@@ -1,4 +1,5 @@
1
  ---
 
2
  license: gemma
3
  base_model: google/gemma-2-9b-it
4
  tags:
@@ -34,15 +35,15 @@ More information needed
34
  ### Training hyperparameters
35
 
36
  The following hyperparameters were used during training:
37
- - learning_rate: 2e-05
38
- - train_batch_size: 16
39
  - eval_batch_size: 4
40
  - seed: 42
41
  - gradient_accumulation_steps: 4
42
- - total_train_batch_size: 64
43
- - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
44
  - lr_scheduler_type: linear
45
- - num_epochs: 3
46
 
47
  ### Training results
48
 
@@ -50,7 +51,7 @@ The following hyperparameters were used during training:
50
 
51
  ### Framework versions
52
 
53
- - Transformers 4.44.0
54
  - Pytorch 2.4.0+cu121
55
  - Datasets 2.20.0
56
- - Tokenizers 0.19.1
 
1
  ---
2
+ library_name: transformers
3
  license: gemma
4
  base_model: google/gemma-2-9b-it
5
  tags:
 
35
  ### Training hyperparameters
36
 
37
  The following hyperparameters were used during training:
38
+ - learning_rate: 1e-06
39
+ - train_batch_size: 4
40
  - eval_batch_size: 4
41
  - seed: 42
42
  - gradient_accumulation_steps: 4
43
+ - total_train_batch_size: 16
44
+ - optimizer: Use OptimizerNames.ADAMW_TORCH_FUSED with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments
45
  - lr_scheduler_type: linear
46
+ - num_epochs: 1
47
 
48
  ### Training results
49
 
 
51
 
52
  ### Framework versions
53
 
54
+ - Transformers 4.46.3
55
  - Pytorch 2.4.0+cu121
56
  - Datasets 2.20.0
57
+ - Tokenizers 0.20.3
config.json CHANGED
@@ -28,7 +28,7 @@
28
  "sliding_window": 4096,
29
  "sliding_window_size": 4096,
30
  "torch_dtype": "bfloat16",
31
- "transformers_version": "4.44.0",
32
  "use_cache": true,
33
  "vocab_size": 256000
34
  }
 
28
  "sliding_window": 4096,
29
  "sliding_window_size": 4096,
30
  "torch_dtype": "bfloat16",
31
+ "transformers_version": "4.46.3",
32
  "use_cache": true,
33
  "vocab_size": 256000
34
  }
generation_config.json CHANGED
@@ -4,5 +4,5 @@
4
  "cache_implementation": "hybrid",
5
  "eos_token_id": 1,
6
  "pad_token_id": 0,
7
- "transformers_version": "4.44.0"
8
  }
 
4
  "cache_implementation": "hybrid",
5
  "eos_token_id": 1,
6
  "pad_token_id": 0,
7
+ "transformers_version": "4.46.3"
8
  }
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:530bd8a94e89eda879bf4c9753fec7a306eef19167030ebe92490edba1f91a21
3
  size 4903351912
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d21c815a79a443a942da9f64d2af8fab0b7c840264b5645a80fc4fad27c66454
3
  size 4903351912
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5e24e3ddd538ea498d38b99eadca29a791f5b4d451298091b09d3f6515674f35
3
  size 4947570872
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8493969dfc6a06965a0c1562552e64e0c7a236e889d0ca84a70ff4488422a710
3
  size 4947570872
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:179cdb24fdc34c4b94a68d19dff3e32a64adf61c00577c3a6e9a9e6815bbf446
3
  size 4962221464
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:865fa2b31a6e02702e2c4f77ea65e2fe24398a6fe0acb7655608194b94f4664b
3
  size 4962221464
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:12c5dcacf684cf8cbe8b0b9e19c16758bcc93e6a4b41cc70b39f2e9e61de6953
3
  size 3670322200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:98016cd419abad87673ac54a3a58bdf3dfbdcfed32d6027e80b775f2ffc94270
3
  size 3670322200
tokenizer.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bfe58439dfe238895cfe3b3dfb36820b68d032fd1dc6681c6dad658d595534a3
3
- size 17525622
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f7eee611703c5ce5d1eee32d9cdcfe465647b8aff0c1dfb3bed7ad7dbb05060
3
+ size 34362873
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e8d9633f0dd03e72b0ee5ea88713a42319dae771333dd39d8619022725b1e5be
3
- size 5432
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a43a1e537062b9cc1b2b3180ed2e32ac4b6ee294390b2e8fb4c2016e0341910a
3
+ size 5560