Update logs
merges.txt
ADDED
The diff for this file is too large to render. See the raw diff.
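Presumably this merges.txt is the byte-level BPE merge table produced when the Dutch tokenizer was trained; for a GPT-2/GPT-Neo-style tokenizer with VOCAB_SIZE="50257" (set in the script below) it normally sits next to vocab.json. A quick, hypothetical sanity check after cloning the repo — file locations and counts are assumptions, not something this commit states:

ls -lh merges.txt vocab.json tokenizer.json   # tokenizer artifacts, if all of them were pushed
wc -l merges.txt                              # roughly 50,000 merge rules plus a "#version" header
head -n 4 merges.txt                          # header line followed by the most frequent merges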
run_gpt_neo.sh
CHANGED
@@ -5,32 +5,36 @@ export HF_PROJECT="gpt-neo-1.3B-dutch"
 # Variables for training the tokenizer and creating the config
 export VOCAB_SIZE="50257"
 export DATASET="yhavinga/mc4_nl_cleaned" # Name of the dataset in the Huggingface Hub
-export DATASET_CONFIG="
+export DATASET_CONFIG="large" # Config of the dataset in the Huggingface Hub
 export DATASET_SPLIT="train" # Split to use for training tokenizer and model
 export TEXT_FIELD="text" # Field containing the text to be used for training
 export CONFIG_TYPE="EleutherAI/gpt-neo-1.3B" # Config that our model will use
 export MODEL_PATH="${HOME}/data/${HF_PROJECT}" # Path to the model, e.g. here inside the mount
 
+
 python run_clm_flax.py \
     --output_dir="${MODEL_PATH}" \
     --model_type="gpt_neo" \
     --config_name="${MODEL_PATH}" \
+    --model_name_or_path="${MODEL_PATH}" \
     --tokenizer_name="${MODEL_PATH}" \
     --preprocessing_num_workers="96" \
     --do_train --do_eval \
     --dataset_name="${DATASET}" \
     --dataset_config_name="${DATASET_CONFIG}" \
     --block_size="512" \
-    --per_device_train_batch_size="
-    --per_device_eval_batch_size="
-    --learning_rate="0.0005"
+    --per_device_train_batch_size="2" \
+    --per_device_eval_batch_size="2" \
+    --learning_rate="0.0005" \
+    --warmup_steps="5000" \
     --adafactor \
     --overwrite_output_dir \
     --num_train_epochs="1" \
     --logging_steps="500" \
-    --save_steps="
-    --eval_steps="
+    --save_steps="20000" \
+    --eval_steps="5000"
 
     # \
     # --push_to_hub
     # --adam_beta1="0.9" --adam_beta2="0.98" --weight_decay="0.01" \
+    # --learning_rate="0.0005" --warmup_steps="5000" \
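Net effect of the script change: training now restarts from the checkpoint already sitting in ${MODEL_PATH} (the new --model_name_or_path flag), and the run is pinned to per-device train/eval batch size 2, learning rate 0.0005 with 5000 warmup steps, a checkpoint every 20000 steps and an eval every 5000 steps. A minimal launch-and-sanity-check sketch; the 8-device count is an assumption based on the t1v-* TPU-VM hostnames in the runs/ files below, not something the commit states:

bash run_gpt_neo.sh 2>&1 | tee train.log   # run with the updated settings, keep a local log
echo $(( 2 * 8 ))                          # 16 sequences per optimizer step across 8 devices
echo $(( 2 * 8 * 512 ))                    # 8192 tokens per step at --block_size="512"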
runs/events.out.tfevents.1641116702.t1v-n-2f64d7c8-w-0.151740.0.v2
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cb5f45ffc186250657cd42a837e4697912bd59a51de9216c7012dbb08dcd7c85
+size 956608
runs/events.out.tfevents.1641125986.t1v-n-2f64d7c8-w-0.164072.0.v2
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:47fc30d1dfda8812fd6ea2b7e10f02db18885492aaa1eb87211edef70e496f8b
+size 1839862
runs/events.out.tfevents.1641156371.t1v-n-2f64d7c8-w-0.13342.0.v2
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1f4ea05e3c57e06d5f3dd56cb928fa56afd6f58867454ec0d9aeecf8a0ee83f8
+size 28682045
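The three runs/*.v2 entries above are Git LFS pointer files (version, oid, size), not the TensorBoard event data itself. A sketch of fetching and viewing the actual payloads after cloning; it assumes git-lfs and TensorBoard are installed, which the commit itself does not state:

git lfs install
git lfs pull --include="runs/*"   # replace the pointer files with the real .tfevents payloads
tensorboard --logdir runs         # browse the logged training curves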