# Page metadata captured alongside this file (not Python code):
# Blackroot's picture
# Upload 18 files
# 6aced58 verified
# raw
# history blame
# 419 Bytes
from dataclasses import dataclass
@dataclass
class LlamaConfig:
    """Default hyperparameters for a Llama-style model.

    Every field carries a default, so ``LlamaConfig()`` yields the complete
    default set and individual values can be overridden by keyword (or
    positionally, in declaration order).

    NOTE(review): the field names appear to mirror the Hugging Face Llama
    configuration keys; how each value is consumed is decided by code outside
    this block -- confirm against the model implementation.
    """

    # Model width and attention layout.
    hidden_size: int = 576
    num_attention_heads: int = 16
    # Fewer key/value heads than attention heads by default (4 vs 16);
    # presumably grouped-query attention -- TODO confirm in the consumer.
    num_key_value_heads: int = 4

    # Depth and feed-forward sizing.
    num_hidden_layers: int = 30
    intermediate_size: int = 1536
    hidden_act: str = "silu"

    # Normalization epsilon.
    rms_norm_eps: float = 1e-5

    # Vocabulary and context sizing.
    vocab_size: int = 49152
    max_position_embeddings: int = 8192
    # NOTE(review): annotated as int here; verify whether the consumer
    # expects a float before changing the annotation.
    rope_theta: int = 100000

    tie_word_embeddings: bool = False