Training in progress, step 16

Files changed (7) hide show

config.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "_name_or_path": "meta-llama/Meta-Llama-3.1-8B-Instruct",
   "architectures": [
     "LlamaForCausalLM"
   ],

 {
+  "_name_or_path": "/home/ubuntu/llama_r1math_grpo_deepspeed/",
   "architectures": [
     "LlamaForCausalLM"
   ],

model-00001-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e482bc8112bba891e44b882eb20bb40d37800f98d799ca378eb94ffd9399067c
 size 4976698672

 version https://git-lfs.github.com/spec/v1
+oid sha256:4d64929c0e62be2b795c7ba10c247bfb5705b358f472ccd2cf29301efb3dea14
 size 4976698672

model-00002-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:fb5246694556c8410b1e5f1d203fa09593d802258f69e0b1e7e45235509c7a2e
 size 4999802720

 version https://git-lfs.github.com/spec/v1
+oid sha256:1372bec1259c1fc9e500f0b902dcdd09941879f1c52edd2381da695786dd3f9c
 size 4999802720

model-00003-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1918dfe9bfc85325cf8ffc5b2d4b0fe83ba881d62782c0be0e9a94751b3b8f38
 size 4915916176

 version https://git-lfs.github.com/spec/v1
+oid sha256:fefe3969ec00b21fb8637d489962a6d62496c2f4bae7353e3f56a48a2e89da9c
 size 4915916176

model-00004-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5b8718584ff8f6b9edecb63f204845f0570e395258314208e74a466b7c9eb113
 size 1168138808

 version https://git-lfs.github.com/spec/v1
+oid sha256:31225bf9b42ea76c70a02e26ab1bfcd210e0d77609849ebdee5fd089a809c820
 size 1168138808

tokenizer_config.json CHANGED Viewed

@@ -2054,11 +2054,15 @@
   "clean_up_tokenization_spaces": true,
   "eos_token": "<|eot_id|>",
   "extra_special_tokens": {},
   "model_input_names": [
     "input_ids",
     "attention_mask"
   ],
   "model_max_length": 131072,
   "pad_token": "<|reserved_special_token_0|>",
   "tokenizer_class": "PreTrainedTokenizerFast"
 }

   "clean_up_tokenization_spaces": true,
   "eos_token": "<|eot_id|>",
   "extra_special_tokens": {},
+  "max_length": null,
   "model_input_names": [
     "input_ids",
     "attention_mask"
   ],
   "model_max_length": 131072,
+  "pad_to_multiple_of": null,
   "pad_token": "<|reserved_special_token_0|>",
+  "pad_token_type_id": 0,
+  "padding_side": "left",
   "tokenizer_class": "PreTrainedTokenizerFast"
 }

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a454ab36f976f70255ab7afa5520734206a990c323f43d55fe5e2e02f4821ed2
 size 7672

 version https://git-lfs.github.com/spec/v1
+oid sha256:1af291767493af3eab35139a2601f95a2759a8336fbd5310a0ed5843bad536c7
 size 7672