SebastianBodza committed on
Commit aed8093 · verified · 1 Parent(s): 63c0709

Add files using upload-large-folder tool

Files changed (46)
  1. .gitattributes +8 -0
  2. checkpoint-10989/config.json +40 -0
  3. checkpoint-10989/generation_config.json +12 -0
  4. checkpoint-10989/model.safetensors +3 -0
  5. checkpoint-10989/optimizer.pt +3 -0
  6. checkpoint-10989/rng_state_0.pth +3 -0
  7. checkpoint-10989/rng_state_1.pth +3 -0
  8. checkpoint-10989/rng_state_2.pth +3 -0
  9. checkpoint-10989/rng_state_3.pth +3 -0
  10. checkpoint-10989/scheduler.pt +3 -0
  11. checkpoint-10989/special_tokens_map.json +17 -0
  12. checkpoint-10989/tokenizer.json +3 -0
  13. checkpoint-10989/tokenizer_config.json +3 -0
  14. checkpoint-10989/trainer_state.json +0 -0
  15. checkpoint-10989/training_args.bin +3 -0
  16. checkpoint-11988/config.json +40 -0
  17. checkpoint-11988/generation_config.json +12 -0
  18. checkpoint-11988/model.safetensors +3 -0
  19. checkpoint-11988/optimizer.pt +3 -0
  20. checkpoint-11988/rng_state_0.pth +3 -0
  21. checkpoint-11988/rng_state_1.pth +3 -0
  22. checkpoint-11988/rng_state_2.pth +3 -0
  23. checkpoint-11988/rng_state_3.pth +3 -0
  24. checkpoint-11988/scheduler.pt +3 -0
  25. checkpoint-11988/special_tokens_map.json +17 -0
  26. checkpoint-11988/tokenizer.json +3 -0
  27. checkpoint-11988/tokenizer_config.json +3 -0
  28. checkpoint-11988/trainer_state.json +0 -0
  29. checkpoint-11988/training_args.bin +3 -0
  30. checkpoint-9990/config.json +40 -0
  31. checkpoint-9990/generation_config.json +12 -0
  32. checkpoint-9990/model.safetensors +3 -0
  33. checkpoint-9990/optimizer.pt +3 -0
  34. checkpoint-9990/rng_state_0.pth +3 -0
  35. checkpoint-9990/rng_state_1.pth +3 -0
  36. checkpoint-9990/rng_state_2.pth +3 -0
  37. checkpoint-9990/rng_state_3.pth +3 -0
  38. checkpoint-9990/scheduler.pt +3 -0
  39. checkpoint-9990/special_tokens_map.json +17 -0
  40. checkpoint-9990/tokenizer.json +3 -0
  41. checkpoint-9990/tokenizer_config.json +3 -0
  42. checkpoint-9990/trainer_state.json +0 -0
  43. checkpoint-9990/training_args.bin +3 -0
  44. special_tokens_map.json +17 -0
  45. tokenizer.json +3 -0
  46. tokenizer_config.json +3 -0
.gitattributes CHANGED
@@ -33,3 +33,11 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
  *.zip filter=lfs diff=lfs merge=lfs -text
  *.zst filter=lfs diff=lfs merge=lfs -text
  *tfevents* filter=lfs diff=lfs merge=lfs -text
+ checkpoint-9990/tokenizer_config.json filter=lfs diff=lfs merge=lfs -text
+ checkpoint-10989/tokenizer_config.json filter=lfs diff=lfs merge=lfs -text
+ checkpoint-11988/tokenizer_config.json filter=lfs diff=lfs merge=lfs -text
+ tokenizer_config.json filter=lfs diff=lfs merge=lfs -text
+ checkpoint-10989/tokenizer.json filter=lfs diff=lfs merge=lfs -text
+ checkpoint-11988/tokenizer.json filter=lfs diff=lfs merge=lfs -text
+ checkpoint-9990/tokenizer.json filter=lfs diff=lfs merge=lfs -text
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
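
All of the tokenizer files added above are routed through Git LFS, so a plain `git clone` without LFS support yields only pointer stubs instead of the real files. A minimal sketch of fetching the fully resolved snapshot with `huggingface_hub` (the repo id below is an assumption, not taken from this page):

```python
# Minimal sketch: download this commit with all LFS files resolved.
# The repo id is hypothetical -- substitute the actual repository.
from huggingface_hub import snapshot_download

local_dir = snapshot_download(
    repo_id="SebastianBodza/llasa-checkpoints",  # hypothetical repo id
    revision="aed8093",                          # the commit shown above
)
print(local_dir)  # contains real weights/tokenizers, not LFS pointer stubs
```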
checkpoint-10989/config.json ADDED
@@ -0,0 +1,40 @@
+ {
+   "_name_or_path": "/home/user/LLaSA_training/output/checkpoint-6993",
+   "architectures": [
+     "LlamaForCausalLM"
+   ],
+   "attention_bias": false,
+   "attention_dropout": 0.0,
+   "bos_token_id": 128000,
+   "eos_token_id": [
+     128001,
+     128008,
+     128009
+   ],
+   "head_dim": 64,
+   "hidden_act": "silu",
+   "hidden_size": 2048,
+   "initializer_range": 0.02,
+   "intermediate_size": 8192,
+   "max_position_embeddings": 131072,
+   "mlp_bias": false,
+   "model_type": "llama",
+   "num_attention_heads": 32,
+   "num_hidden_layers": 16,
+   "num_key_value_heads": 8,
+   "pretraining_tp": 1,
+   "rms_norm_eps": 1e-05,
+   "rope_scaling": {
+     "factor": 32.0,
+     "high_freq_factor": 4.0,
+     "low_freq_factor": 1.0,
+     "original_max_position_embeddings": 8192,
+     "rope_type": "llama3"
+   },
+   "rope_theta": 500000.0,
+   "tie_word_embeddings": true,
+   "torch_dtype": "bfloat16",
+   "transformers_version": "4.48.3",
+   "use_cache": true,
+   "vocab_size": 193800
+ }
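
The config describes a 16-layer Llama-architecture model (hidden size 2048, 32 attention heads with 8 KV heads, llama3-style RoPE scaling) with a vocabulary extended to 193800 entries, resumed from checkpoint-6993. A quick way to inspect it, assuming `checkpoint-10989` is a local copy of the folder above:

```python
# Sketch: read the architecture hyperparameters from config.json.
from transformers import AutoConfig

config = AutoConfig.from_pretrained("checkpoint-10989")  # assumed local path
print(config.model_type)         # "llama"
print(config.num_hidden_layers)  # 16
print(config.vocab_size)         # 193800 (extended vocabulary)
```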
checkpoint-10989/generation_config.json ADDED
@@ -0,0 +1,12 @@
+ {
+   "bos_token_id": 128000,
+   "do_sample": true,
+   "eos_token_id": [
+     128001,
+     128008,
+     128009
+   ],
+   "temperature": 0.6,
+   "top_p": 0.9,
+   "transformers_version": "4.48.3"
+ }
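
These sampling defaults (do_sample with temperature 0.6 and top-p 0.9) are what `generate()` picks up automatically unless overridden per call. A small sketch to inspect them, again assuming a local copy of the folder:

```python
# Sketch: load the sampling defaults declared in generation_config.json.
from transformers import GenerationConfig

gen_cfg = GenerationConfig.from_pretrained("checkpoint-10989")  # assumed path
print(gen_cfg.do_sample, gen_cfg.temperature, gen_cfg.top_p)    # True 0.6 0.9
```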
checkpoint-10989/model.safetensors ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:edbc5d6a59d1f579bf4cb4001bdae6e50546c5b1b6b1ebff471278398d8e26c7
+ size 2740113872
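
Note that the diff stores only the Git LFS pointer (spec version, sha256 oid, byte size); the ~2.74 GB weight file itself lives in LFS storage. Once the real file is present locally, it can be inspected lazily with `safetensors`, for example:

```python
# Sketch: list tensor names and shapes from a resolved safetensors file
# without loading all ~2.74 GB of weights into memory.
from safetensors import safe_open

with safe_open("checkpoint-10989/model.safetensors", framework="pt") as f:
    for name in list(f.keys())[:5]:
        print(name, f.get_slice(name).get_shape())
```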
checkpoint-10989/optimizer.pt ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:f65230d51460bb20815c47c619870667570176a2a2418b17fc8eb42c129b7b57
+ size 5480320942
checkpoint-10989/rng_state_0.pth ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:6c6d1d381278fb22b22bfd8330681970ee2403fa0d0b445b2ee7a21b7f082f9f
+ size 15024
checkpoint-10989/rng_state_1.pth ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:0178e3284ccbfd37ac137f698b5f99a9e7d27de640fdfe23cf8fa488b77d5395
+ size 15024
checkpoint-10989/rng_state_2.pth ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:d7bec3b6fff9b26029e4109665d06520223e4667ca532d843849539f6c81b589
+ size 15024
checkpoint-10989/rng_state_3.pth ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:e252f8fd1f83562b36f69fd209feb4eb1542571be5a4e8ac315090db3730fd59
+ size 15024
checkpoint-10989/scheduler.pt ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:8e31c0a73dd93ca495bc0a74af5563f04de0697e5158a6917a5467b8fb542aa5
+ size 1064
checkpoint-10989/special_tokens_map.json ADDED
@@ -0,0 +1,17 @@
+ {
+   "bos_token": {
+     "content": "<|begin_of_text|>",
+     "lstrip": false,
+     "normalized": false,
+     "rstrip": false,
+     "single_word": false
+   },
+   "eos_token": {
+     "content": "<|eot_id|>",
+     "lstrip": false,
+     "normalized": false,
+     "rstrip": false,
+     "single_word": false
+   },
+   "pad_token": "<|eot_id|>"
+ }
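
The map reuses `<|eot_id|>` as the pad token, a common choice when a Llama-3-style tokenizer ships without a dedicated padding token. A quick sanity check, assuming a local copy of the checkpoint folder:

```python
# Sketch: confirm the special-token wiring declared above.
from transformers import AutoTokenizer

tok = AutoTokenizer.from_pretrained("checkpoint-10989")  # assumed local path
print(tok.bos_token)  # <|begin_of_text|>
print(tok.eos_token)  # <|eot_id|>
print(tok.pad_token)  # <|eot_id|> -- padding shares the eos token
```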
checkpoint-10989/tokenizer.json ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:71d92f3dbf3c23d734e6356241cef149b42fe79848176a54145b6f9a886fd73b
+ size 29521206
checkpoint-10989/tokenizer_config.json ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:62c494500e8d6ec069de7d95f2948aec356a9618c746f8b8e23905d3a3685607
+ size 11710504
checkpoint-10989/trainer_state.json ADDED
The diff for this file is too large to render. See raw diff
 
checkpoint-10989/training_args.bin ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:089b58f069d2fc49b7875c2d04f364dad8873f35aaa15889bbb70e8f374c8bf4
+ size 5432
checkpoint-11988/config.json ADDED
@@ -0,0 +1,40 @@
+ {
+   "_name_or_path": "/home/user/LLaSA_training/output/checkpoint-6993",
+   "architectures": [
+     "LlamaForCausalLM"
+   ],
+   "attention_bias": false,
+   "attention_dropout": 0.0,
+   "bos_token_id": 128000,
+   "eos_token_id": [
+     128001,
+     128008,
+     128009
+   ],
+   "head_dim": 64,
+   "hidden_act": "silu",
+   "hidden_size": 2048,
+   "initializer_range": 0.02,
+   "intermediate_size": 8192,
+   "max_position_embeddings": 131072,
+   "mlp_bias": false,
+   "model_type": "llama",
+   "num_attention_heads": 32,
+   "num_hidden_layers": 16,
+   "num_key_value_heads": 8,
+   "pretraining_tp": 1,
+   "rms_norm_eps": 1e-05,
+   "rope_scaling": {
+     "factor": 32.0,
+     "high_freq_factor": 4.0,
+     "low_freq_factor": 1.0,
+     "original_max_position_embeddings": 8192,
+     "rope_type": "llama3"
+   },
+   "rope_theta": 500000.0,
+   "tie_word_embeddings": true,
+   "torch_dtype": "bfloat16",
+   "transformers_version": "4.48.3",
+   "use_cache": true,
+   "vocab_size": 193800
+ }
checkpoint-11988/generation_config.json ADDED
@@ -0,0 +1,12 @@
+ {
+   "bos_token_id": 128000,
+   "do_sample": true,
+   "eos_token_id": [
+     128001,
+     128008,
+     128009
+   ],
+   "temperature": 0.6,
+   "top_p": 0.9,
+   "transformers_version": "4.48.3"
+ }
checkpoint-11988/model.safetensors ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:bf45ffa0820a407501f6361cc7e49657e339ca9862502d3901a1d6e478b7c1b4
+ size 2740113872
checkpoint-11988/optimizer.pt ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:232ad0212692ad67a2130315c7dccdb7e7f1881d21c76073af58484d0a1e8969
+ size 5480320942
checkpoint-11988/rng_state_0.pth ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:eca6265e8e2262bb5c15a70d21454a6b211b9b2d32d9dc8148906e78ea170eaf
+ size 15024
checkpoint-11988/rng_state_1.pth ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:68d7aae23c0ad281a5723c42d3d0c2b4dad0be21eba7d073650ee2fc41e43602
+ size 15024
checkpoint-11988/rng_state_2.pth ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:465be5b0a5af7606f9f257a8f2d7c4169c76acb06f8360d1e9ee648b1a569c0e
+ size 15024
checkpoint-11988/rng_state_3.pth ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:5d0ec1844e355f804002cdc7088f40050d1244340689686f1b8dadac9301738f
+ size 15024
checkpoint-11988/scheduler.pt ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:2f1ae34a2c530c2bace1a13db2d90698a935428b3aa25b8be38d362162e1f72f
+ size 1064
checkpoint-11988/special_tokens_map.json ADDED
@@ -0,0 +1,17 @@
+ {
+   "bos_token": {
+     "content": "<|begin_of_text|>",
+     "lstrip": false,
+     "normalized": false,
+     "rstrip": false,
+     "single_word": false
+   },
+   "eos_token": {
+     "content": "<|eot_id|>",
+     "lstrip": false,
+     "normalized": false,
+     "rstrip": false,
+     "single_word": false
+   },
+   "pad_token": "<|eot_id|>"
+ }
checkpoint-11988/tokenizer.json ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:71d92f3dbf3c23d734e6356241cef149b42fe79848176a54145b6f9a886fd73b
+ size 29521206
checkpoint-11988/tokenizer_config.json ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:62c494500e8d6ec069de7d95f2948aec356a9618c746f8b8e23905d3a3685607
+ size 11710504
checkpoint-11988/trainer_state.json ADDED
The diff for this file is too large to render. See raw diff
 
checkpoint-11988/training_args.bin ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:089b58f069d2fc49b7875c2d04f364dad8873f35aaa15889bbb70e8f374c8bf4
+ size 5432
checkpoint-9990/config.json ADDED
@@ -0,0 +1,40 @@
+ {
+   "_name_or_path": "/home/user/LLaSA_training/output/checkpoint-6993",
+   "architectures": [
+     "LlamaForCausalLM"
+   ],
+   "attention_bias": false,
+   "attention_dropout": 0.0,
+   "bos_token_id": 128000,
+   "eos_token_id": [
+     128001,
+     128008,
+     128009
+   ],
+   "head_dim": 64,
+   "hidden_act": "silu",
+   "hidden_size": 2048,
+   "initializer_range": 0.02,
+   "intermediate_size": 8192,
+   "max_position_embeddings": 131072,
+   "mlp_bias": false,
+   "model_type": "llama",
+   "num_attention_heads": 32,
+   "num_hidden_layers": 16,
+   "num_key_value_heads": 8,
+   "pretraining_tp": 1,
+   "rms_norm_eps": 1e-05,
+   "rope_scaling": {
+     "factor": 32.0,
+     "high_freq_factor": 4.0,
+     "low_freq_factor": 1.0,
+     "original_max_position_embeddings": 8192,
+     "rope_type": "llama3"
+   },
+   "rope_theta": 500000.0,
+   "tie_word_embeddings": true,
+   "torch_dtype": "bfloat16",
+   "transformers_version": "4.48.3",
+   "use_cache": true,
+   "vocab_size": 193800
+ }
checkpoint-9990/generation_config.json ADDED
@@ -0,0 +1,12 @@
+ {
+   "bos_token_id": 128000,
+   "do_sample": true,
+   "eos_token_id": [
+     128001,
+     128008,
+     128009
+   ],
+   "temperature": 0.6,
+   "top_p": 0.9,
+   "transformers_version": "4.48.3"
+ }
checkpoint-9990/model.safetensors ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:812dfd372979218787af53e6bd78c70fa24d4931b4cba1d2c1659d84a3fe6a7e
+ size 2740113872
checkpoint-9990/optimizer.pt ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:1edc0ce469772a4fc39f5c5390efef7c658521c448c28499234f1cd9a2ea7195
+ size 5480320942
checkpoint-9990/rng_state_0.pth ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:727a29225b3a57083df6716f89d12c226f440fba33b2cf3a11cc14fc56415bee
+ size 15024
checkpoint-9990/rng_state_1.pth ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:b19196062cac6851e7878550f3ec18df650454294f22a73327cd60bb311d5ca3
+ size 15024
checkpoint-9990/rng_state_2.pth ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:c7af4b14a44a7c67224cb1f18ec389134691f8634f287e688088f6a77ce1c429
+ size 15024
checkpoint-9990/rng_state_3.pth ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:f8425db93d8404ce5c39c969d20421626b818c961f184172ec3765868123dae2
+ size 15024
checkpoint-9990/scheduler.pt ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:32d71093b013ac39e5d757049d80833036773c1d2ab19f549a6897512d29eee3
+ size 1064
checkpoint-9990/special_tokens_map.json ADDED
@@ -0,0 +1,17 @@
+ {
+   "bos_token": {
+     "content": "<|begin_of_text|>",
+     "lstrip": false,
+     "normalized": false,
+     "rstrip": false,
+     "single_word": false
+   },
+   "eos_token": {
+     "content": "<|eot_id|>",
+     "lstrip": false,
+     "normalized": false,
+     "rstrip": false,
+     "single_word": false
+   },
+   "pad_token": "<|eot_id|>"
+ }
checkpoint-9990/tokenizer.json ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:71d92f3dbf3c23d734e6356241cef149b42fe79848176a54145b6f9a886fd73b
+ size 29521206
checkpoint-9990/tokenizer_config.json ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:62c494500e8d6ec069de7d95f2948aec356a9618c746f8b8e23905d3a3685607
+ size 11710504
checkpoint-9990/trainer_state.json ADDED
The diff for this file is too large to render. See raw diff
 
checkpoint-9990/training_args.bin ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:089b58f069d2fc49b7875c2d04f364dad8873f35aaa15889bbb70e8f374c8bf4
+ size 5432
special_tokens_map.json ADDED
@@ -0,0 +1,17 @@
+ {
+   "bos_token": {
+     "content": "<|begin_of_text|>",
+     "lstrip": false,
+     "normalized": false,
+     "rstrip": false,
+     "single_word": false
+   },
+   "eos_token": {
+     "content": "<|eot_id|>",
+     "lstrip": false,
+     "normalized": false,
+     "rstrip": false,
+     "single_word": false
+   },
+   "pad_token": "<|end_of_text|>"
+ }
tokenizer.json ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:71d92f3dbf3c23d734e6356241cef149b42fe79848176a54145b6f9a886fd73b
+ size 29521206
tokenizer_config.json ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:4d1ba0909d80bd18ffa22e8c05ebf509ae17b5b85d6e31e7a00bb11a1700cdd5
+ size 11710509
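
Since this commit also places the tokenizer files at the repo root (note that the root special_tokens_map.json declares `<|end_of_text|>` as pad token, unlike the checkpoints' `<|eot_id|>`), the tokenizer can be loaded once from the root while weights come from whichever checkpoint folder is being evaluated. A hedged end-to-end sketch, with a hypothetical repo id:

```python
# Sketch: tokenizer from the repo root, weights from one checkpoint folder.
# The repo id is hypothetical; the subfolder name matches this commit.
import torch
from transformers import AutoModelForCausalLM, AutoTokenizer

repo = "SebastianBodza/llasa-checkpoints"  # hypothetical repo id
tokenizer = AutoTokenizer.from_pretrained(repo)
model = AutoModelForCausalLM.from_pretrained(
    repo, subfolder="checkpoint-11988", torch_dtype=torch.bfloat16
)

inputs = tokenizer("Hello", return_tensors="pt")
out = model.generate(**inputs, max_new_tokens=32)
print(tokenizer.decode(out[0], skip_special_tokens=True))
```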