Training in progress, step 1000

Browse files

Files changed (8) hide show

config.json +4 -4
evalonlyhindi_indicwav2vec_MUCS_warmup500_s300shuff100_2142429.out +40 -0
indicwav2vec_MUCS_warmup500_s300shuff100_2143522.out +0 -0
language_segregated_prediction_texts/evalpredictions_hindi_indicw2v_ad0_3_hd_02_featd_0_2_lr6e-4_warmup2000_s300_shuf500.txt +0 -0
language_segregated_prediction_texts/evalpredictions_hindi_indicw2v_ad0_3_hd_02_featd_0_2_lr6e-4_warmup2000_s400_shuf42.txt +0 -0
model.safetensors +1 -1
predictions_indicw2v_ad0_3_hd_02_featd_0_2_lr6e-4_warmup500_s300_shuff100.txt +0 -0
training_args.bin +1 -1

config.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "_name_or_path": "/scratch/elec/puhe/p/palp3/MUCS/indicwav2vec_outputs/pd_warmup_500/s300_shuff100",
   "activation_dropout": 0.0,
   "adapter_attn_dim": null,
   "adapter_kernel_size": 3,
@@ -9,7 +9,7 @@
   "architectures": [
     "Wav2Vec2ForCTC"
   ],
-  "attention_dropout": 0.0,
   "bos_token_id": 1,
   "classifier_proj_size": 256,
   "codevector_dim": 256,
@@ -50,11 +50,11 @@
   "feat_extract_activation": "gelu",
   "feat_extract_dropout": 0.0,
   "feat_extract_norm": "layer",
-  "feat_proj_dropout": 0.0,
   "feat_quantizer_dropout": 0.0,
   "final_dropout": 0.0,
   "hidden_act": "gelu",
-  "hidden_dropout": 0.0,
   "hidden_dropout_prob": 0.1,
   "hidden_size": 1024,
   "initializer_range": 0.02,

 {
+  "_name_or_path": "/m/triton/scratch/elec/puhe/p/palp3/MUCS/indicwav2vec-hindi",
   "activation_dropout": 0.0,
   "adapter_attn_dim": null,
   "adapter_kernel_size": 3,
   "architectures": [
     "Wav2Vec2ForCTC"
   ],
+  "attention_dropout": 0.3,
   "bos_token_id": 1,
   "classifier_proj_size": 256,
   "codevector_dim": 256,
   "feat_extract_activation": "gelu",
   "feat_extract_dropout": 0.0,
   "feat_extract_norm": "layer",
+  "feat_proj_dropout": 0.3,
   "feat_quantizer_dropout": 0.0,
   "final_dropout": 0.0,
   "hidden_act": "gelu",
+  "hidden_dropout": 0.2,
   "hidden_dropout_prob": 0.1,
   "hidden_size": 1024,
   "initializer_range": 0.02,

evalonlyhindi_indicwav2vec_MUCS_warmup500_s300shuff100_2142429.out CHANGED Viewed

@@ -153,3 +153,43 @@ last prediction string
   eval_steps_per_second       =      1.164
   eval_wer                    =        1.0

   eval_steps_per_second       =      1.164
   eval_wer                    =        1.0
+wandb: - 0.005 MB of 0.005 MB uploaded
+wandb: Run history:
+wandb:                    eval/cer ▁
+wandb: eval/model_preparation_time ▁
+wandb:                eval/runtime ▁
+wandb:     eval/samples_per_second ▁
+wandb:       eval/steps_per_second ▁
+wandb:                    eval/wer ▁
+wandb:                    eval_cer ▁
+wandb: eval_model_preparation_time ▁
+wandb:                eval_runtime ▁
+wandb:                eval_samples ▁
+wandb:     eval_samples_per_second ▁
+wandb:       eval_steps_per_second ▁
+wandb:                    eval_wer ▁
+wandb:           train/global_step ▁▁
+wandb:
+wandb: Run summary:
+wandb:                    eval/cer 1.0
+wandb:                   eval/loss nan
+wandb: eval/model_preparation_time 0.0045
+wandb:                eval/runtime 30.9217
+wandb:     eval/samples_per_second 18.498
+wandb:       eval/steps_per_second 1.164
+wandb:                    eval/wer 1.0
+wandb:                    eval_cer 1.0
+wandb:                   eval_loss nan
+wandb: eval_model_preparation_time 0.0045
+wandb:                eval_runtime 30.9217
+wandb:                eval_samples 572
+wandb:     eval_samples_per_second 18.498
+wandb:       eval_steps_per_second 1.164
+wandb:                    eval_wer 1.0
+wandb:           train/global_step 0
+wandb:
+wandb: 🚀 View run eval_pd2000_s300_shuff100_hindi at: https://wandb.ai/priyanshipal/huggingface/runs/64250v6u
+wandb: ⭐️ View project at: https://wandb.ai/priyanshipal/huggingface
+wandb: Synced 6 W&B file(s), 0 media file(s), 0 artifact file(s) and 0 other file(s)
+wandb: Find logs at: ./wandb/run-20240822_152047-64250v6u/logs
+wandb: WARNING The new W&B backend becomes opt-out in version 0.18.0; try it out with `wandb.require("core")`! See https://wandb.me/wandb-core for more information.

indicwav2vec_MUCS_warmup500_s300shuff100_2143522.out ADDED Viewed

The diff for this file is too large to render. See raw diff

language_segregated_prediction_texts/evalpredictions_hindi_indicw2v_ad0_3_hd_02_featd_0_2_lr6e-4_warmup2000_s300_shuf500.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

language_segregated_prediction_texts/evalpredictions_hindi_indicw2v_ad0_3_hd_02_featd_0_2_lr6e-4_warmup2000_s400_shuf42.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6d6e542b15e77cd1bb8a7693945d939d7b6324a0178a2a54a151c7870a9a3a70
 size 1262426580

 version https://git-lfs.github.com/spec/v1
+oid sha256:08de7da709cb1c87182ea525062fcd525beeade5ce32613467ec0bcc59e40f04
 size 1262426580

predictions_indicw2v_ad0_3_hd_02_featd_0_2_lr6e-4_warmup500_s300_shuff100.txt CHANGED Viewed

The diff for this file is too large to render. See raw diff

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:17f546c82c9065a6469d28f2bf552ce06c87b07db0f04de15435295aa0a8a04d
 size 5432

 version https://git-lfs.github.com/spec/v1
+oid sha256:6414775e5e3dbcfd7bebd7f7c9e2b10fb4f3cb3532a487bef20431df5d198f8a
 size 5432