# SLM3 / configuration_gpt.py
# Hub page header (not code): Ronakparmar's picture / "Upload 4 files" / 500f774 verified
from dataclasses import dataclass
from transformers import PretrainedConfig
class CustomGPTConfig(PretrainedConfig):
    """Configuration class for the custom GPT model.

    Stores the hyperparameters of the model and forwards every other
    keyword argument to ``PretrainedConfig``.

    Args:
        block_size: Presumably the maximum sequence length (context
            window) -- confirm against the model code.
        vocab_size: Presumably the tokenizer vocabulary size -- confirm
            against the model code.
        n_layer: Presumably the number of transformer blocks -- confirm.
        n_head: Presumably the number of attention heads per block --
            confirm.
        n_embd: Presumably the embedding / hidden width -- confirm.
        dropout: Presumably the dropout probability -- confirm.
        **kwargs: Any additional configuration entries; passed unchanged
            to ``PretrainedConfig.__init__``.
    """

    model_type = "custom_gpt"

    def __init__(
        self,
        block_size: int = 768,
        vocab_size: int = 50257,
        n_layer: int = 8,
        n_head: int = 8,
        n_embd: int = 768,
        dropout: float = 0.1,
        **kwargs,
    ):
        self.block_size = block_size
        self.vocab_size = vocab_size
        self.n_layer = n_layer
        self.n_head = n_head
        self.n_embd = n_embd
        self.dropout = dropout
        # An explicit __init__ replaces the former @dataclass-generated one:
        # that version accepted only the six fields above and never invoked
        # the base initializer. The base class must be initialized, and the
        # constructor must tolerate the extra keys the library supplies when
        # rebuilding a config from a saved config.json.
        super().__init__(**kwargs)