aria-dev committed on
Commit
650061f
1 Parent(s): 914642d

first version

Browse files
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ model-00001-of-00011.safetensors filter=lfs diff=lfs merge=lfs -text
config.json ADDED
@@ -0,0 +1,48 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "rhymes-ai/Aria",
3
+ "architectures": [
4
+ "AriaForConditionalGeneration"
5
+ ],
6
+ "auto_map": {
7
+ "AutoConfig": "rhymes-ai/Aria--modeling_aria.AriaConfig",
8
+ "AutoModelForCausalLM": "rhymes-ai/Aria--modeling_aria.AriaForConditionalGeneration"
9
+ },
10
+ "ignore_index": -100,
11
+ "image_token_index": 9,
12
+ "model_type": "aria",
13
+ "projector_patch_to_query_dict": {
14
+ "1225": 128,
15
+ "4900": 256
16
+ },
17
+ "text_config": {
18
+ "hidden_size": 2560,
19
+ "intermediate_size": 13568,
20
+ "max_position_embeddings": 65536,
21
+ "model_type": "aria_moe_lm",
22
+ "moe_intermediate_size": 1664,
23
+ "moe_num_experts": 64,
24
+ "moe_topk": 6,
25
+ "num_attention_heads": 20,
26
+ "num_experts_per_tok": 6,
27
+ "num_hidden_layers": 28,
28
+ "num_key_value_heads": 20,
29
+ "rope_theta": 5000000,
30
+ "vocab_size": 100352
31
+ },
32
+ "torch_dtype": "bfloat16",
33
+ "transformers_version": "4.45.0",
34
+ "vision_config": {
35
+ "_flash_attn_2_enabled": true,
36
+ "architectures": [
37
+ "AriaVisionModel"
38
+ ],
39
+ "hidden_size": 1152,
40
+ "image_size": 980,
41
+ "intermediate_size": 4304,
42
+ "model_type": "aria_vision_model",
43
+ "num_attention_heads": 16,
44
+ "num_hidden_layers": 27,
45
+ "patch_size": 14,
46
+ "torch_dtype": "bfloat16"
47
+ }
48
+ }
generation_config.json ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "bos_token_id": 1,
4
+ "eos_token_id": 2,
5
+ "transformers_version": "4.45.0"
6
+ }
model-00001-of-00011.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e02efad07993baffd434362bd5f87eba463739e51916a935d7c3d9f3861537e5
3
+ size 4999120264
model-00002-of-00011.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2537db9b51185a4cb28c6ad0b39651d35bfcd78737ffc92a2b1c8867bdb8f685
3
+ size 4995914928
model-00003-of-00011.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f117da78dc201876fa162153c70c51d541d8aab17cba6bd04f8063529d70ef77
3
+ size 4997563136
model-00004-of-00011.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d38972fd1520a0d32b53e152f1a386694c9715d728b41c6d0a469e7ee888151
3
+ size 4997563288
model-00005-of-00011.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b5d9d4a6a63d1d161904663b23c02fbb68985f4e3ec75f48aaa091934cf78b21
3
+ size 4997563720
model-00006-of-00011.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:28a22449ed81d3f02f017097ee77537b7dadfb7566ce677edaed9deb888798cf
3
+ size 4997563720
model-00007-of-00011.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:94c35cb022eefc1ecdd2ae34749482254304dec208586079f4f9097614de13a3
3
+ size 4997563720
model-00008-of-00011.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9d9061071af57e9dd6409da8ea3fe52141e4732ebfc5404e1ec88e3d0bfbb804
3
+ size 4997563720
model-00009-of-00011.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b823bad6859046328186b45f36a8d2262b3d54e8382cc268e80f6071e68ae267
3
+ size 4997563744
model-00010-of-00011.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:96876b34e229d230a0774f23eb2ec0c1aa46e9a30a9675a0f0c57e7918408bf7
3
+ size 4995915512
model-00011-of-00011.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0678f358f1bd2212855cb1103298df43ac7f6db7f2455a18ca430cd786fa57a9
3
+ size 641615048
model.safetensors.index.json ADDED
The diff for this file is too large to render. See raw diff