# Run configuration. Each table groups the settings for one stage of the
# pipeline; all values are plain TOML scalars/arrays read by the consumer.

# NOTE(review): presumably a branch/revision identifier for the run — confirm
# against the code that reads it.
revision = "main"

[data]
# Path is relative; presumably resolved against the working directory — TODO confirm.
path = "data/french_rap_lyrics"

[corpus]
# Tokenizer encoding name as expected by the consumer.
encoding = "r50k_base"
# NOTE(review): presumably the fraction of the corpus used for training, with
# the remainder held out for validation — confirm against the loader.
split_train_val = 0.85

[model]
context_length = 256
num_heads = 8
num_layers = 18
# NOTE(review): hidden_dim (424) is evenly divisible by num_heads (8); keep it
# that way if the model splits the hidden dimension across heads — confirm.
hidden_dim = 424

[training]
num_training_steps = 20000
seed = 42
lr = 1e-3
batch_size = 64

[scheduler]
# NOTE(review): presumably the multiplicative learning-rate decay factor —
# confirm which scheduler consumes it and how often it is applied.
gamma = 0.925

[evaluation]
# Prompt used when sampling; the trailing space is intentional and preserved.
sample_text = "Les vrais savent que "
new_tokens = 50
# NOTE(review): meaning of this id is not visible here — confirm with the
# evaluation code.
artist_token = 1

[wandb]
# One of: "offline", "online", "disabled".
mode = "online"
group = "fullrun"
tags = []