Create README.md
Browse files
README.md
ADDED
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
# This repo contains EleutherAI/gpt-j-6B fine-tuned on the OWCA dataset (https://github.com/Emplocity/owca) using LoRA (Low-Rank Adaptation)
|
2 |
+
|
3 |
+
Training parameters:
|
4 |
+
MICRO_BATCH_SIZE = 64
|
5 |
+
BATCH_SIZE = 128
|
6 |
+
GRADIENT_ACCUMULATION_STEPS = BATCH_SIZE // MICRO_BATCH_SIZE
|
7 |
+
EPOCHS = 3
|
8 |
+
LEARNING_RATE = 2e-5
|
9 |
+
CUTOFF_LEN = 256
|
10 |
+
LORA_R = 4
|
11 |
+
LORA_ALPHA = 16
|
12 |
+
LORA_DROPOUT = 0.05
|
13 |
+
warmup_steps=100
|
14 |
+
fp16=True
|