Vikhrmodels/Vikhr-7b-0.1

0x7o committed on Mar 11

Commit

386d754

•

1 Parent(s): 2f88a56

Correcting from Llama to Mistral (#3)

- Correcting from Llama to Mistral (3c99efacc03dab7a640e44c779c9f4bd78aa0f79)

Co-authored-by: Danil Kononyuk <[email protected]>

Files changed (1) hide show

config.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
   "_name_or_path": "Vikhrmodels/Vikhr-7b-0.1",
   "architectures": [
-    "LlamaForCausalLM"
   ],
   "attention_bias": false,
   "attention_dropout": 0.0,
@@ -12,7 +12,7 @@
   "initializer_range": 0.02,
   "intermediate_size": 14336,
   "max_position_embeddings": 32768,
-  "model_type": "llama",
   "num_attention_heads": 32,
   "num_hidden_layers": 32,
   "num_key_value_heads": 8,

@@ -1,7 +1,7 @@
 {
   "_name_or_path": "Vikhrmodels/Vikhr-7b-0.1",
   "architectures": [
+    "MistralForCausalLM"
   ],
   "attention_bias": false,
   "attention_dropout": 0.0,
@@ -12,7 +12,7 @@
   "initializer_range": 0.02,
   "intermediate_size": 14336,
   "max_position_embeddings": 32768,
+  "model_type": "mistral",
   "num_attention_heads": 32,
   "num_hidden_layers": 32,
   "num_key_value_heads": 8,