Marcos12886 commited on Sep 8

Commit

b73f096

•

1 Parent(s): c9c4a3f

Upload folder using huggingface_hub

Browse files

This view is limited to 50 files because it contains too many changes. See raw diff

Files changed (50) hide show

README.md +28 -32
checkpoint-121/model.safetensors +1 -1
checkpoint-121/optimizer.pt +1 -1
checkpoint-121/scheduler.pt +1 -1
checkpoint-121/trainer_state.json +43 -43
checkpoint-121/training_args.bin +1 -1
checkpoint-145/config.json +85 -0
checkpoint-145/model.safetensors +3 -0
checkpoint-145/optimizer.pt +3 -0
checkpoint-145/rng_state.pth +3 -0
checkpoint-145/scheduler.pt +3 -0
checkpoint-145/trainer_state.json +114 -0
checkpoint-145/training_args.bin +3 -0
checkpoint-169/config.json +85 -0
checkpoint-169/model.safetensors +3 -0
checkpoint-169/optimizer.pt +3 -0
checkpoint-169/rng_state.pth +3 -0
checkpoint-169/scheduler.pt +3 -0
checkpoint-169/trainer_state.json +126 -0
checkpoint-169/training_args.bin +3 -0
checkpoint-194/config.json +85 -0
checkpoint-194/model.safetensors +3 -0
checkpoint-194/optimizer.pt +3 -0
checkpoint-194/rng_state.pth +3 -0
checkpoint-194/scheduler.pt +3 -0
checkpoint-194/trainer_state.json +138 -0
checkpoint-194/training_args.bin +3 -0
checkpoint-218/config.json +85 -0
checkpoint-218/model.safetensors +3 -0
checkpoint-218/optimizer.pt +3 -0
checkpoint-218/rng_state.pth +3 -0
checkpoint-218/scheduler.pt +3 -0
checkpoint-218/trainer_state.json +150 -0
checkpoint-218/training_args.bin +3 -0
checkpoint-24/model.safetensors +1 -1
checkpoint-24/optimizer.pt +1 -1
checkpoint-24/rng_state.pth +1 -1
checkpoint-24/scheduler.pt +1 -1
checkpoint-24/trainer_state.json +13 -13
checkpoint-24/training_args.bin +1 -1
checkpoint-242/config.json +85 -0
checkpoint-242/model.safetensors +3 -0
checkpoint-242/optimizer.pt +3 -0
checkpoint-242/rng_state.pth +3 -0
checkpoint-242/scheduler.pt +3 -0
checkpoint-242/trainer_state.json +162 -0
checkpoint-242/training_args.bin +3 -0
checkpoint-266/config.json +85 -0
checkpoint-266/model.safetensors +3 -0
checkpoint-266/optimizer.pt +3 -0

README.md CHANGED Viewed

@@ -4,26 +4,14 @@ license: apache-2.0
 base_model: ntu-spml/distilhubert
 tags:
 - generated_from_trainer
-datasets:
-- audiofolder
 metrics:
 - accuracy
 model-index:
 - name: distilhubert-finetuned-mixed-data
-  results:
-  - task:
-      name: Audio Classification
-      type: audio-classification
-    dataset:
-      name: audiofolder
-      type: audiofolder
-      config: default
-      split: train
-      args: default
-    metrics:
-    - name: Accuracy
-      type: accuracy
-      value: 0.8691275167785235
 ---
 <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -31,10 +19,13 @@ should probably proofread and complete it, then remove this comment. -->
 # distilhubert-finetuned-mixed-data
-This model is a fine-tuned version of [ntu-spml/distilhubert](https://huggingface.co/ntu-spml/distilhubert) on the audiofolder dataset.
 It achieves the following results on the evaluation set:
-- Loss: 0.3360
-- Accuracy: 0.8691
 ## Model description
@@ -61,25 +52,30 @@ The following hyperparameters were used during training:
 - total_train_batch_size: 64
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: cosine
-- lr_scheduler_warmup_ratio: 0.001
-- num_epochs: 7
 ### Training results
-| Training Loss | Epoch  | Step | Validation Loss | Accuracy |
-|:-------------:|:------:|:----:|:---------------:|:--------:|
-| No log        | 0.9664 | 18   | 0.6860          | 0.7584   |
-| No log        | 1.9866 | 37   | 0.4623          | 0.8020   |
-| No log        | 2.9530 | 55   | 0.4069          | 0.8188   |
-| No log        | 3.9732 | 74   | 0.3811          | 0.8356   |
-| No log        | 4.9933 | 93   | 0.3542          | 0.8356   |
-| No log        | 5.9597 | 111  | 0.3380          | 0.8658   |
-| No log        | 6.7651 | 126  | 0.3360          | 0.8691   |
 ### Framework versions
 - Transformers 4.44.2
-- Pytorch 2.4.0+cu121
-- Datasets 2.21.0
 - Tokenizers 0.19.1

 base_model: ntu-spml/distilhubert
 tags:
 - generated_from_trainer
 metrics:
 - accuracy
+- precision
+- recall
+- f1
 model-index:
 - name: distilhubert-finetuned-mixed-data
+  results: []
 ---
 <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 # distilhubert-finetuned-mixed-data
+This model is a fine-tuned version of [ntu-spml/distilhubert](https://huggingface.co/ntu-spml/distilhubert) on an unknown dataset.
 It achieves the following results on the evaluation set:
+- Loss: 0.4765
+- Accuracy: 0.8475
+- Precision: 0.8497
+- Recall: 0.8475
+- F1: 0.8484
 ## Model description
 - total_train_batch_size: 64
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: cosine
+- lr_scheduler_warmup_ratio: 0.01
+- num_epochs: 15
 ### Training results
+| Training Loss | Epoch   | Step | Validation Loss | Accuracy | Precision | Recall | F1     |
+|:-------------:|:-------:|:----:|:---------------:|:--------:|:---------:|:------:|:------:|
+| No log        | 0.9897  | 24   | 0.9809          | 0.6357   | 0.5920    | 0.6357 | 0.5921 |
+| No log        | 1.9794  | 48   | 0.7444          | 0.7158   | 0.6992    | 0.7158 | 0.6905 |
+| No log        | 2.9691  | 72   | 0.6172          | 0.7494   | 0.7438    | 0.7494 | 0.7449 |
+| No log        | 4.0     | 97   | 0.5431          | 0.7984   | 0.7918    | 0.7984 | 0.7874 |
+| No log        | 4.9897  | 121  | 0.5269          | 0.8010   | 0.8006    | 0.8010 | 0.7975 |
+| No log        | 5.9794  | 145  | 0.5811          | 0.7494   | 0.7802    | 0.7494 | 0.7551 |
+| No log        | 6.9691  | 169  | 0.4408          | 0.8398   | 0.8366    | 0.8398 | 0.8355 |
+| No log        | 8.0     | 194  | 0.4687          | 0.8191   | 0.8188    | 0.8191 | 0.8168 |
+| No log        | 8.9897  | 218  | 0.4364          | 0.8475   | 0.8483    | 0.8475 | 0.8474 |
+| No log        | 9.9794  | 242  | 0.4291          | 0.8579   | 0.8561    | 0.8579 | 0.8568 |
+| No log        | 10.9691 | 266  | 0.4699          | 0.8501   | 0.8582    | 0.8501 | 0.8528 |
+| No log        | 12.0    | 291  | 0.4862          | 0.8450   | 0.8536    | 0.8450 | 0.8480 |
+| No log        | 12.9897 | 315  | 0.4765          | 0.8475   | 0.8497    | 0.8475 | 0.8484 |
 ### Framework versions
 - Transformers 4.44.2
+- Pytorch 2.4.1+cu121
 - Tokenizers 0.19.1

checkpoint-121/model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9f17cc1a80f9cdf7f1c5c94c70062ca59ee73223709355f94eae716447e99d02
 size 94765560

 version https://git-lfs.github.com/spec/v1
+oid sha256:61738703583616f26bc5974045f101b4badf661cb1bd5759b55ffedbf42f8309
 size 94765560

checkpoint-121/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:af430e7b5cbd26cc609cc5c918049ec696a387c13101b4292d1bd68dd2695f0e
 size 189556666

 version https://git-lfs.github.com/spec/v1
+oid sha256:a04d7aa37706181567dea5d9c17d0a79ae70a3f43b546fd604def5a5c896f325
 size 189556666

checkpoint-121/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:192b51d0f1e5456c85d7a6eeae550a33132f97495282fa7f439444f5f22297cf
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:5c4a0a93ff2c02ad8dfec37403a0eff289573d406127ab0a60fb4386bc8bcb2b
 size 1064

checkpoint-121/trainer_state.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "best_metric": 0.7648578811369509,
   "best_model_checkpoint": "distilhubert-finetuned-mixed-data/checkpoint-121",
   "epoch": 4.989690721649485,
   "eval_steps": 500,
@@ -10,69 +10,69 @@
   "log_history": [
     {
       "epoch": 0.9896907216494846,
-      "eval_accuracy": 0.6098191214470284,
-      "eval_f1": 0.5527821682108387,
-      "eval_loss": 1.0193405151367188,
-      "eval_precision": 0.7003292379638224,
-      "eval_recall": 0.6098191214470284,
-      "eval_runtime": 1.7319,
-      "eval_samples_per_second": 223.453,
-      "eval_steps_per_second": 28.293,
       "step": 24
     },
     {
       "epoch": 1.9793814432989691,
-      "eval_accuracy": 0.6795865633074936,
-      "eval_f1": 0.6650515718181741,
-      "eval_loss": 0.7780925631523132,
-      "eval_precision": 0.6877908327609833,
-      "eval_recall": 0.6795865633074936,
-      "eval_runtime": 1.7105,
-      "eval_samples_per_second": 226.247,
-      "eval_steps_per_second": 28.646,
       "step": 48
     },
     {
       "epoch": 2.9690721649484537,
-      "eval_accuracy": 0.7260981912144703,
-      "eval_f1": 0.7125387559196679,
-      "eval_loss": 0.663092315196991,
-      "eval_precision": 0.7236217153897081,
-      "eval_recall": 0.7260981912144703,
-      "eval_runtime": 1.7131,
-      "eval_samples_per_second": 225.911,
-      "eval_steps_per_second": 28.604,
       "step": 72
     },
     {
       "epoch": 4.0,
-      "eval_accuracy": 0.7493540051679587,
-      "eval_f1": 0.7323843170610034,
-      "eval_loss": 0.5870956778526306,
-      "eval_precision": 0.7505520883603423,
-      "eval_recall": 0.7493540051679587,
-      "eval_runtime": 1.7332,
-      "eval_samples_per_second": 223.293,
-      "eval_steps_per_second": 28.272,
       "step": 97
     },
     {
       "epoch": 4.989690721649485,
-      "eval_accuracy": 0.7648578811369509,
-      "eval_f1": 0.7570271532827265,
-      "eval_loss": 0.5548774003982544,
-      "eval_precision": 0.7717080207133444,
-      "eval_recall": 0.7648578811369509,
-      "eval_runtime": 1.744,
-      "eval_samples_per_second": 221.907,
-      "eval_steps_per_second": 28.097,
       "step": 121
     }
   ],
   "logging_steps": 500,
-  "max_steps": 144,
   "num_input_tokens_seen": 0,
-  "num_train_epochs": 6,
   "save_steps": 500,
   "stateful_callbacks": {
     "EarlyStoppingCallback": {

 {
+  "best_metric": 0.8010335917312662,
   "best_model_checkpoint": "distilhubert-finetuned-mixed-data/checkpoint-121",
   "epoch": 4.989690721649485,
   "eval_steps": 500,
   "log_history": [
     {
       "epoch": 0.9896907216494846,
+      "eval_accuracy": 0.6356589147286822,
+      "eval_f1": 0.5920563016978556,
+      "eval_loss": 0.980873703956604,
+      "eval_precision": 0.5920482291587493,
+      "eval_recall": 0.6356589147286822,
+      "eval_runtime": 1.6668,
+      "eval_samples_per_second": 232.175,
+      "eval_steps_per_second": 29.397,
       "step": 24
     },
     {
       "epoch": 1.9793814432989691,
+      "eval_accuracy": 0.7157622739018088,
+      "eval_f1": 0.6905410405322238,
+      "eval_loss": 0.7444477081298828,
+      "eval_precision": 0.6992377248989063,
+      "eval_recall": 0.7157622739018088,
+      "eval_runtime": 1.6941,
+      "eval_samples_per_second": 228.443,
+      "eval_steps_per_second": 28.924,
       "step": 48
     },
     {
       "epoch": 2.9690721649484537,
+      "eval_accuracy": 0.7493540051679587,
+      "eval_f1": 0.744898505571463,
+      "eval_loss": 0.6171658039093018,
+      "eval_precision": 0.7437592422989429,
+      "eval_recall": 0.7493540051679587,
+      "eval_runtime": 1.6943,
+      "eval_samples_per_second": 228.408,
+      "eval_steps_per_second": 28.92,
       "step": 72
     },
     {
       "epoch": 4.0,
+      "eval_accuracy": 0.7984496124031008,
+      "eval_f1": 0.7873621619744228,
+      "eval_loss": 0.5430988073348999,
+      "eval_precision": 0.79180344284319,
+      "eval_recall": 0.7984496124031008,
+      "eval_runtime": 1.7027,
+      "eval_samples_per_second": 227.289,
+      "eval_steps_per_second": 28.778,
       "step": 97
     },
     {
       "epoch": 4.989690721649485,
+      "eval_accuracy": 0.8010335917312662,
+      "eval_f1": 0.7974946178390901,
+      "eval_loss": 0.5268548130989075,
+      "eval_precision": 0.8005965453214461,
+      "eval_recall": 0.8010335917312662,
+      "eval_runtime": 1.6829,
+      "eval_samples_per_second": 229.957,
+      "eval_steps_per_second": 29.116,
       "step": 121
     }
   ],
   "logging_steps": 500,
+  "max_steps": 360,
   "num_input_tokens_seen": 0,
+  "num_train_epochs": 15,
   "save_steps": 500,
   "stateful_callbacks": {
     "EarlyStoppingCallback": {

checkpoint-121/training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f758b94689e09a814f1948cbbce56e483b2b53509b111e749d1961a9e2d3ad45
 size 5240

 version https://git-lfs.github.com/spec/v1
+oid sha256:347144964cf2be899f8dce858b11b47f463178200e095ec0ecada560c69f675a
 size 5240

checkpoint-145/config.json ADDED Viewed

	@@ -0,0 +1,85 @@

+{
+  "_name_or_path": "ntu-spml/distilhubert",
+  "activation_dropout": 0.1,
+  "apply_spec_augment": false,
+  "architectures": [
+    "HubertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "bos_token_id": 1,
+  "classifier_proj_size": 256,
+  "conv_bias": false,
+  "conv_dim": [
+    512,
+    512,
+    512,
+    512,
+    512,
+    512,
+    512
+  ],
+  "conv_kernel": [
+    10,
+    3,
+    3,
+    3,
+    3,
+    2,
+    2
+  ],
+  "conv_stride": [
+    5,
+    2,
+    2,
+    2,
+    2,
+    2,
+    2
+  ],
+  "ctc_loss_reduction": "sum",
+  "ctc_zero_infinity": false,
+  "do_stable_layer_norm": false,
+  "eos_token_id": 2,
+  "feat_extract_activation": "gelu",
+  "feat_extract_norm": "group",
+  "feat_proj_dropout": 0.0,
+  "feat_proj_layer_norm": false,
+  "final_dropout": 0.0,
+  "finetuning_task": "audio-classification",
+  "hidden_act": "gelu",
+  "hidden_dropout": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "1s_normal",
+    "1": "1s_pain",
+    "2": "1s_hunger",
+    "3": "1s_asphyxia"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "1s_asphyxia": 3,
+    "1s_hunger": 2,
+    "1s_normal": 0,
+    "1s_pain": 1
+  },
+  "layer_norm_eps": 1e-05,
+  "layerdrop": 0.0,
+  "mask_feature_length": 10,
+  "mask_feature_min_masks": 0,
+  "mask_feature_prob": 0.0,
+  "mask_time_length": 10,
+  "mask_time_min_masks": 2,
+  "mask_time_prob": 0.05,
+  "model_type": "hubert",
+  "num_attention_heads": 12,
+  "num_conv_pos_embedding_groups": 16,
+  "num_conv_pos_embeddings": 128,
+  "num_feat_extract_layers": 7,
+  "num_hidden_layers": 2,
+  "pad_token_id": 0,
+  "torch_dtype": "float32",
+  "transformers_version": "4.44.2",
+  "use_weighted_layer_sum": false,
+  "vocab_size": 32
+}

checkpoint-145/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:62b1cac8d8be6152086485540750316f43a58660bddd11c298bb50d0f3f5f531
+size 94765560

checkpoint-145/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f74fa4c7ca2e76ec752e5b913444b39e61cef0b5760afb453b5c55805b47cacc
+size 189556666

checkpoint-145/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c0867bb3588983088e1ae19ae31c54b18cd181442273a375c356a0362c53a9a5
+size 14308

checkpoint-145/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:62e2160d5bd28532b533e3efabec8ccad052eb12401ff324f1c912ac3e74c929
+size 1064

checkpoint-145/trainer_state.json ADDED Viewed

	@@ -0,0 +1,114 @@

+{
+  "best_metric": 0.8010335917312662,
+  "best_model_checkpoint": "distilhubert-finetuned-mixed-data/checkpoint-121",
+  "epoch": 5.979381443298969,
+  "eval_steps": 500,
+  "global_step": 145,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.9896907216494846,
+      "eval_accuracy": 0.6356589147286822,
+      "eval_f1": 0.5920563016978556,
+      "eval_loss": 0.980873703956604,
+      "eval_precision": 0.5920482291587493,
+      "eval_recall": 0.6356589147286822,
+      "eval_runtime": 1.6668,
+      "eval_samples_per_second": 232.175,
+      "eval_steps_per_second": 29.397,
+      "step": 24
+    },
+    {
+      "epoch": 1.9793814432989691,
+      "eval_accuracy": 0.7157622739018088,
+      "eval_f1": 0.6905410405322238,
+      "eval_loss": 0.7444477081298828,
+      "eval_precision": 0.6992377248989063,
+      "eval_recall": 0.7157622739018088,
+      "eval_runtime": 1.6941,
+      "eval_samples_per_second": 228.443,
+      "eval_steps_per_second": 28.924,
+      "step": 48
+    },
+    {
+      "epoch": 2.9690721649484537,
+      "eval_accuracy": 0.7493540051679587,
+      "eval_f1": 0.744898505571463,
+      "eval_loss": 0.6171658039093018,
+      "eval_precision": 0.7437592422989429,
+      "eval_recall": 0.7493540051679587,
+      "eval_runtime": 1.6943,
+      "eval_samples_per_second": 228.408,
+      "eval_steps_per_second": 28.92,
+      "step": 72
+    },
+    {
+      "epoch": 4.0,
+      "eval_accuracy": 0.7984496124031008,
+      "eval_f1": 0.7873621619744228,
+      "eval_loss": 0.5430988073348999,
+      "eval_precision": 0.79180344284319,
+      "eval_recall": 0.7984496124031008,
+      "eval_runtime": 1.7027,
+      "eval_samples_per_second": 227.289,
+      "eval_steps_per_second": 28.778,
+      "step": 97
+    },
+    {
+      "epoch": 4.989690721649485,
+      "eval_accuracy": 0.8010335917312662,
+      "eval_f1": 0.7974946178390901,
+      "eval_loss": 0.5268548130989075,
+      "eval_precision": 0.8005965453214461,
+      "eval_recall": 0.8010335917312662,
+      "eval_runtime": 1.6829,
+      "eval_samples_per_second": 229.957,
+      "eval_steps_per_second": 29.116,
+      "step": 121
+    },
+    {
+      "epoch": 5.979381443298969,
+      "eval_accuracy": 0.7493540051679587,
+      "eval_f1": 0.7551329793037762,
+      "eval_loss": 0.5810549259185791,
+      "eval_precision": 0.7802262423287315,
+      "eval_recall": 0.7493540051679587,
+      "eval_runtime": 1.6999,
+      "eval_samples_per_second": 227.658,
+      "eval_steps_per_second": 28.825,
+      "step": 145
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 360,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 15,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "EarlyStoppingCallback": {
+      "args": {
+        "early_stopping_patience": 3,
+        "early_stopping_threshold": 0.0
+      },
+      "attributes": {
+        "early_stopping_patience_counter": 0
+      }
+    },
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 2.10820802112e+16,
+  "train_batch_size": 8,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-145/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:347144964cf2be899f8dce858b11b47f463178200e095ec0ecada560c69f675a
+size 5240

checkpoint-169/config.json ADDED Viewed

	@@ -0,0 +1,85 @@

+{
+  "_name_or_path": "ntu-spml/distilhubert",
+  "activation_dropout": 0.1,
+  "apply_spec_augment": false,
+  "architectures": [
+    "HubertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "bos_token_id": 1,
+  "classifier_proj_size": 256,
+  "conv_bias": false,
+  "conv_dim": [
+    512,
+    512,
+    512,
+    512,
+    512,
+    512,
+    512
+  ],
+  "conv_kernel": [
+    10,
+    3,
+    3,
+    3,
+    3,
+    2,
+    2
+  ],
+  "conv_stride": [
+    5,
+    2,
+    2,
+    2,
+    2,
+    2,
+    2
+  ],
+  "ctc_loss_reduction": "sum",
+  "ctc_zero_infinity": false,
+  "do_stable_layer_norm": false,
+  "eos_token_id": 2,
+  "feat_extract_activation": "gelu",
+  "feat_extract_norm": "group",
+  "feat_proj_dropout": 0.0,
+  "feat_proj_layer_norm": false,
+  "final_dropout": 0.0,
+  "finetuning_task": "audio-classification",
+  "hidden_act": "gelu",
+  "hidden_dropout": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "1s_normal",
+    "1": "1s_pain",
+    "2": "1s_hunger",
+    "3": "1s_asphyxia"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "1s_asphyxia": 3,
+    "1s_hunger": 2,
+    "1s_normal": 0,
+    "1s_pain": 1
+  },
+  "layer_norm_eps": 1e-05,
+  "layerdrop": 0.0,
+  "mask_feature_length": 10,
+  "mask_feature_min_masks": 0,
+  "mask_feature_prob": 0.0,
+  "mask_time_length": 10,
+  "mask_time_min_masks": 2,
+  "mask_time_prob": 0.05,
+  "model_type": "hubert",
+  "num_attention_heads": 12,
+  "num_conv_pos_embedding_groups": 16,
+  "num_conv_pos_embeddings": 128,
+  "num_feat_extract_layers": 7,
+  "num_hidden_layers": 2,
+  "pad_token_id": 0,
+  "torch_dtype": "float32",
+  "transformers_version": "4.44.2",
+  "use_weighted_layer_sum": false,
+  "vocab_size": 32
+}

checkpoint-169/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:052c2fac14563eb5b0b53eb4a3f6509d46dcf61f99ea7c0e5e76df5345230eff
+size 94765560

checkpoint-169/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:672db33956055547a36f8f888cdb0f8124de62210906cbe58b87898baf646fe9
+size 189556666

checkpoint-169/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b3d85d4b435d4ac4552bb46f32d5f63a55dbc65baaa5af6a14b6b39e968f4b8e
+size 14308

checkpoint-169/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a897dacc1b915150336aff74c1f17b3b8504d76168703307724c32fe3bca6896
+size 1064

checkpoint-169/trainer_state.json ADDED Viewed

	@@ -0,0 +1,126 @@

+{
+  "best_metric": 0.8397932816537468,
+  "best_model_checkpoint": "distilhubert-finetuned-mixed-data/checkpoint-169",
+  "epoch": 6.969072164948454,
+  "eval_steps": 500,
+  "global_step": 169,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.9896907216494846,
+      "eval_accuracy": 0.6356589147286822,
+      "eval_f1": 0.5920563016978556,
+      "eval_loss": 0.980873703956604,
+      "eval_precision": 0.5920482291587493,
+      "eval_recall": 0.6356589147286822,
+      "eval_runtime": 1.6668,
+      "eval_samples_per_second": 232.175,
+      "eval_steps_per_second": 29.397,
+      "step": 24
+    },
+    {
+      "epoch": 1.9793814432989691,
+      "eval_accuracy": 0.7157622739018088,
+      "eval_f1": 0.6905410405322238,
+      "eval_loss": 0.7444477081298828,
+      "eval_precision": 0.6992377248989063,
+      "eval_recall": 0.7157622739018088,
+      "eval_runtime": 1.6941,
+      "eval_samples_per_second": 228.443,
+      "eval_steps_per_second": 28.924,
+      "step": 48
+    },
+    {
+      "epoch": 2.9690721649484537,
+      "eval_accuracy": 0.7493540051679587,
+      "eval_f1": 0.744898505571463,
+      "eval_loss": 0.6171658039093018,
+      "eval_precision": 0.7437592422989429,
+      "eval_recall": 0.7493540051679587,
+      "eval_runtime": 1.6943,
+      "eval_samples_per_second": 228.408,
+      "eval_steps_per_second": 28.92,
+      "step": 72
+    },
+    {
+      "epoch": 4.0,
+      "eval_accuracy": 0.7984496124031008,
+      "eval_f1": 0.7873621619744228,
+      "eval_loss": 0.5430988073348999,
+      "eval_precision": 0.79180344284319,
+      "eval_recall": 0.7984496124031008,
+      "eval_runtime": 1.7027,
+      "eval_samples_per_second": 227.289,
+      "eval_steps_per_second": 28.778,
+      "step": 97
+    },
+    {
+      "epoch": 4.989690721649485,
+      "eval_accuracy": 0.8010335917312662,
+      "eval_f1": 0.7974946178390901,
+      "eval_loss": 0.5268548130989075,
+      "eval_precision": 0.8005965453214461,
+      "eval_recall": 0.8010335917312662,
+      "eval_runtime": 1.6829,
+      "eval_samples_per_second": 229.957,
+      "eval_steps_per_second": 29.116,
+      "step": 121
+    },
+    {
+      "epoch": 5.979381443298969,
+      "eval_accuracy": 0.7493540051679587,
+      "eval_f1": 0.7551329793037762,
+      "eval_loss": 0.5810549259185791,
+      "eval_precision": 0.7802262423287315,
+      "eval_recall": 0.7493540051679587,
+      "eval_runtime": 1.6999,
+      "eval_samples_per_second": 227.658,
+      "eval_steps_per_second": 28.825,
+      "step": 145
+    },
+    {
+      "epoch": 6.969072164948454,
+      "eval_accuracy": 0.8397932816537468,
+      "eval_f1": 0.8354840008265724,
+      "eval_loss": 0.44080850481987,
+      "eval_precision": 0.8365717854569443,
+      "eval_recall": 0.8397932816537468,
+      "eval_runtime": 1.6785,
+      "eval_samples_per_second": 230.56,
+      "eval_steps_per_second": 29.192,
+      "step": 169
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 360,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 15,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "EarlyStoppingCallback": {
+      "args": {
+        "early_stopping_patience": 3,
+        "early_stopping_threshold": 0.0
+      },
+      "attributes": {
+        "early_stopping_patience_counter": 0
+      }
+    },
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 2.45957602464e+16,
+  "train_batch_size": 8,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-169/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:347144964cf2be899f8dce858b11b47f463178200e095ec0ecada560c69f675a
+size 5240

checkpoint-194/config.json ADDED Viewed

	@@ -0,0 +1,85 @@

+{
+  "_name_or_path": "ntu-spml/distilhubert",
+  "activation_dropout": 0.1,
+  "apply_spec_augment": false,
+  "architectures": [
+    "HubertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "bos_token_id": 1,
+  "classifier_proj_size": 256,
+  "conv_bias": false,
+  "conv_dim": [
+    512,
+    512,
+    512,
+    512,
+    512,
+    512,
+    512
+  ],
+  "conv_kernel": [
+    10,
+    3,
+    3,
+    3,
+    3,
+    2,
+    2
+  ],
+  "conv_stride": [
+    5,
+    2,
+    2,
+    2,
+    2,
+    2,
+    2
+  ],
+  "ctc_loss_reduction": "sum",
+  "ctc_zero_infinity": false,
+  "do_stable_layer_norm": false,
+  "eos_token_id": 2,
+  "feat_extract_activation": "gelu",
+  "feat_extract_norm": "group",
+  "feat_proj_dropout": 0.0,
+  "feat_proj_layer_norm": false,
+  "final_dropout": 0.0,
+  "finetuning_task": "audio-classification",
+  "hidden_act": "gelu",
+  "hidden_dropout": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "1s_normal",
+    "1": "1s_pain",
+    "2": "1s_hunger",
+    "3": "1s_asphyxia"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "1s_asphyxia": 3,
+    "1s_hunger": 2,
+    "1s_normal": 0,
+    "1s_pain": 1
+  },
+  "layer_norm_eps": 1e-05,
+  "layerdrop": 0.0,
+  "mask_feature_length": 10,
+  "mask_feature_min_masks": 0,
+  "mask_feature_prob": 0.0,
+  "mask_time_length": 10,
+  "mask_time_min_masks": 2,
+  "mask_time_prob": 0.05,
+  "model_type": "hubert",
+  "num_attention_heads": 12,
+  "num_conv_pos_embedding_groups": 16,
+  "num_conv_pos_embeddings": 128,
+  "num_feat_extract_layers": 7,
+  "num_hidden_layers": 2,
+  "pad_token_id": 0,
+  "torch_dtype": "float32",
+  "transformers_version": "4.44.2",
+  "use_weighted_layer_sum": false,
+  "vocab_size": 32
+}

checkpoint-194/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d03ee65315496952ebb447ef8a2d41c18b1e5e1649887b43e9d670daab42cd79
+size 94765560

checkpoint-194/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:21b9a71b29339ce815e0272ac73c5e9382e8e4b94e000d00c2c15c46fcaf1bb1
+size 189556666

checkpoint-194/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3a98371a8e546887d8a0cf63952365049758fe889acd42fc72eb734ef3af0332
+size 14308

checkpoint-194/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6cf3f9f9e1b079187c143133062b7476177d05ae3b26e39797b7b8deffda481f
+size 1064

checkpoint-194/trainer_state.json ADDED Viewed

	@@ -0,0 +1,138 @@

+{
+  "best_metric": 0.8397932816537468,
+  "best_model_checkpoint": "distilhubert-finetuned-mixed-data/checkpoint-169",
+  "epoch": 8.0,
+  "eval_steps": 500,
+  "global_step": 194,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.9896907216494846,
+      "eval_accuracy": 0.6356589147286822,
+      "eval_f1": 0.5920563016978556,
+      "eval_loss": 0.980873703956604,
+      "eval_precision": 0.5920482291587493,
+      "eval_recall": 0.6356589147286822,
+      "eval_runtime": 1.6668,
+      "eval_samples_per_second": 232.175,
+      "eval_steps_per_second": 29.397,
+      "step": 24
+    },
+    {
+      "epoch": 1.9793814432989691,
+      "eval_accuracy": 0.7157622739018088,
+      "eval_f1": 0.6905410405322238,
+      "eval_loss": 0.7444477081298828,
+      "eval_precision": 0.6992377248989063,
+      "eval_recall": 0.7157622739018088,
+      "eval_runtime": 1.6941,
+      "eval_samples_per_second": 228.443,
+      "eval_steps_per_second": 28.924,
+      "step": 48
+    },
+    {
+      "epoch": 2.9690721649484537,
+      "eval_accuracy": 0.7493540051679587,
+      "eval_f1": 0.744898505571463,
+      "eval_loss": 0.6171658039093018,
+      "eval_precision": 0.7437592422989429,
+      "eval_recall": 0.7493540051679587,
+      "eval_runtime": 1.6943,
+      "eval_samples_per_second": 228.408,
+      "eval_steps_per_second": 28.92,
+      "step": 72
+    },
+    {
+      "epoch": 4.0,
+      "eval_accuracy": 0.7984496124031008,
+      "eval_f1": 0.7873621619744228,
+      "eval_loss": 0.5430988073348999,
+      "eval_precision": 0.79180344284319,
+      "eval_recall": 0.7984496124031008,
+      "eval_runtime": 1.7027,
+      "eval_samples_per_second": 227.289,
+      "eval_steps_per_second": 28.778,
+      "step": 97
+    },
+    {
+      "epoch": 4.989690721649485,
+      "eval_accuracy": 0.8010335917312662,
+      "eval_f1": 0.7974946178390901,
+      "eval_loss": 0.5268548130989075,
+      "eval_precision": 0.8005965453214461,
+      "eval_recall": 0.8010335917312662,
+      "eval_runtime": 1.6829,
+      "eval_samples_per_second": 229.957,
+      "eval_steps_per_second": 29.116,
+      "step": 121
+    },
+    {
+      "epoch": 5.979381443298969,
+      "eval_accuracy": 0.7493540051679587,
+      "eval_f1": 0.7551329793037762,
+      "eval_loss": 0.5810549259185791,
+      "eval_precision": 0.7802262423287315,
+      "eval_recall": 0.7493540051679587,
+      "eval_runtime": 1.6999,
+      "eval_samples_per_second": 227.658,
+      "eval_steps_per_second": 28.825,
+      "step": 145
+    },
+    {
+      "epoch": 6.969072164948454,
+      "eval_accuracy": 0.8397932816537468,
+      "eval_f1": 0.8354840008265724,
+      "eval_loss": 0.44080850481987,
+      "eval_precision": 0.8365717854569443,
+      "eval_recall": 0.8397932816537468,
+      "eval_runtime": 1.6785,
+      "eval_samples_per_second": 230.56,
+      "eval_steps_per_second": 29.192,
+      "step": 169
+    },
+    {
+      "epoch": 8.0,
+      "eval_accuracy": 0.8191214470284238,
+      "eval_f1": 0.8167837576120855,
+      "eval_loss": 0.46871018409729004,
+      "eval_precision": 0.8187643627479353,
+      "eval_recall": 0.8191214470284238,
+      "eval_runtime": 1.6719,
+      "eval_samples_per_second": 231.477,
+      "eval_steps_per_second": 29.308,
+      "step": 194
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 360,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 15,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "EarlyStoppingCallback": {
+      "args": {
+        "early_stopping_patience": 3,
+        "early_stopping_threshold": 0.0
+      },
+      "attributes": {
+        "early_stopping_patience_counter": 0
+      }
+    },
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 2.81094402816e+16,
+  "train_batch_size": 8,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-194/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:347144964cf2be899f8dce858b11b47f463178200e095ec0ecada560c69f675a
+size 5240

checkpoint-218/config.json ADDED Viewed

	@@ -0,0 +1,85 @@

+{
+  "_name_or_path": "ntu-spml/distilhubert",
+  "activation_dropout": 0.1,
+  "apply_spec_augment": false,
+  "architectures": [
+    "HubertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "bos_token_id": 1,
+  "classifier_proj_size": 256,
+  "conv_bias": false,
+  "conv_dim": [
+    512,
+    512,
+    512,
+    512,
+    512,
+    512,
+    512
+  ],
+  "conv_kernel": [
+    10,
+    3,
+    3,
+    3,
+    3,
+    2,
+    2
+  ],
+  "conv_stride": [
+    5,
+    2,
+    2,
+    2,
+    2,
+    2,
+    2
+  ],
+  "ctc_loss_reduction": "sum",
+  "ctc_zero_infinity": false,
+  "do_stable_layer_norm": false,
+  "eos_token_id": 2,
+  "feat_extract_activation": "gelu",
+  "feat_extract_norm": "group",
+  "feat_proj_dropout": 0.0,
+  "feat_proj_layer_norm": false,
+  "final_dropout": 0.0,
+  "finetuning_task": "audio-classification",
+  "hidden_act": "gelu",
+  "hidden_dropout": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "1s_normal",
+    "1": "1s_pain",
+    "2": "1s_hunger",
+    "3": "1s_asphyxia"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "1s_asphyxia": 3,
+    "1s_hunger": 2,
+    "1s_normal": 0,
+    "1s_pain": 1
+  },
+  "layer_norm_eps": 1e-05,
+  "layerdrop": 0.0,
+  "mask_feature_length": 10,
+  "mask_feature_min_masks": 0,
+  "mask_feature_prob": 0.0,
+  "mask_time_length": 10,
+  "mask_time_min_masks": 2,
+  "mask_time_prob": 0.05,
+  "model_type": "hubert",
+  "num_attention_heads": 12,
+  "num_conv_pos_embedding_groups": 16,
+  "num_conv_pos_embeddings": 128,
+  "num_feat_extract_layers": 7,
+  "num_hidden_layers": 2,
+  "pad_token_id": 0,
+  "torch_dtype": "float32",
+  "transformers_version": "4.44.2",
+  "use_weighted_layer_sum": false,
+  "vocab_size": 32
+}

checkpoint-218/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f22baf06235c468452afb48784bcfe17b8d6b16547f92c897a6b83b9d4be1927
+size 94765560

checkpoint-218/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3b107c786ae699e053540620707226aced653806a534f7bf2c3d041d5a799d0d
+size 189556666

checkpoint-218/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:87f5981b8629d20da8d7bb452f1f8e311534ac9a1fbf9cf6ca9f99f281c14bfa
+size 14308

checkpoint-218/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e51016c1626b13f8e0c2274df9c63eb74ef480d103cd1eaea425e0978c8cf392
+size 1064

checkpoint-218/trainer_state.json ADDED Viewed

	@@ -0,0 +1,150 @@

+{
+  "best_metric": 0.8475452196382429,
+  "best_model_checkpoint": "distilhubert-finetuned-mixed-data/checkpoint-218",
+  "epoch": 8.989690721649485,
+  "eval_steps": 500,
+  "global_step": 218,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.9896907216494846,
+      "eval_accuracy": 0.6356589147286822,
+      "eval_f1": 0.5920563016978556,
+      "eval_loss": 0.980873703956604,
+      "eval_precision": 0.5920482291587493,
+      "eval_recall": 0.6356589147286822,
+      "eval_runtime": 1.6668,
+      "eval_samples_per_second": 232.175,
+      "eval_steps_per_second": 29.397,
+      "step": 24
+    },
+    {
+      "epoch": 1.9793814432989691,
+      "eval_accuracy": 0.7157622739018088,
+      "eval_f1": 0.6905410405322238,
+      "eval_loss": 0.7444477081298828,
+      "eval_precision": 0.6992377248989063,
+      "eval_recall": 0.7157622739018088,
+      "eval_runtime": 1.6941,
+      "eval_samples_per_second": 228.443,
+      "eval_steps_per_second": 28.924,
+      "step": 48
+    },
+    {
+      "epoch": 2.9690721649484537,
+      "eval_accuracy": 0.7493540051679587,
+      "eval_f1": 0.744898505571463,
+      "eval_loss": 0.6171658039093018,
+      "eval_precision": 0.7437592422989429,
+      "eval_recall": 0.7493540051679587,
+      "eval_runtime": 1.6943,
+      "eval_samples_per_second": 228.408,
+      "eval_steps_per_second": 28.92,
+      "step": 72
+    },
+    {
+      "epoch": 4.0,
+      "eval_accuracy": 0.7984496124031008,
+      "eval_f1": 0.7873621619744228,
+      "eval_loss": 0.5430988073348999,
+      "eval_precision": 0.79180344284319,
+      "eval_recall": 0.7984496124031008,
+      "eval_runtime": 1.7027,
+      "eval_samples_per_second": 227.289,
+      "eval_steps_per_second": 28.778,
+      "step": 97
+    },
+    {
+      "epoch": 4.989690721649485,
+      "eval_accuracy": 0.8010335917312662,
+      "eval_f1": 0.7974946178390901,
+      "eval_loss": 0.5268548130989075,
+      "eval_precision": 0.8005965453214461,
+      "eval_recall": 0.8010335917312662,
+      "eval_runtime": 1.6829,
+      "eval_samples_per_second": 229.957,
+      "eval_steps_per_second": 29.116,
+      "step": 121
+    },
+    {
+      "epoch": 5.979381443298969,
+      "eval_accuracy": 0.7493540051679587,
+      "eval_f1": 0.7551329793037762,
+      "eval_loss": 0.5810549259185791,
+      "eval_precision": 0.7802262423287315,
+      "eval_recall": 0.7493540051679587,
+      "eval_runtime": 1.6999,
+      "eval_samples_per_second": 227.658,
+      "eval_steps_per_second": 28.825,
+      "step": 145
+    },
+    {
+      "epoch": 6.969072164948454,
+      "eval_accuracy": 0.8397932816537468,
+      "eval_f1": 0.8354840008265724,
+      "eval_loss": 0.44080850481987,
+      "eval_precision": 0.8365717854569443,
+      "eval_recall": 0.8397932816537468,
+      "eval_runtime": 1.6785,
+      "eval_samples_per_second": 230.56,
+      "eval_steps_per_second": 29.192,
+      "step": 169
+    },
+    {
+      "epoch": 8.0,
+      "eval_accuracy": 0.8191214470284238,
+      "eval_f1": 0.8167837576120855,
+      "eval_loss": 0.46871018409729004,
+      "eval_precision": 0.8187643627479353,
+      "eval_recall": 0.8191214470284238,
+      "eval_runtime": 1.6719,
+      "eval_samples_per_second": 231.477,
+      "eval_steps_per_second": 29.308,
+      "step": 194
+    },
+    {
+      "epoch": 8.989690721649485,
+      "eval_accuracy": 0.8475452196382429,
+      "eval_f1": 0.8473710740005564,
+      "eval_loss": 0.4363822937011719,
+      "eval_precision": 0.8483238707679635,
+      "eval_recall": 0.8475452196382429,
+      "eval_runtime": 1.6838,
+      "eval_samples_per_second": 229.835,
+      "eval_steps_per_second": 29.101,
+      "step": 218
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 360,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 15,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "EarlyStoppingCallback": {
+      "args": {
+        "early_stopping_patience": 3,
+        "early_stopping_threshold": 0.0
+      },
+      "attributes": {
+        "early_stopping_patience_counter": 0
+      }
+    },
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 3.16231203168e+16,
+  "train_batch_size": 8,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-218/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:347144964cf2be899f8dce858b11b47f463178200e095ec0ecada560c69f675a
+size 5240

checkpoint-24/model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:68a1c8e7483216c3afd74e7c8f3bf326f08720513511c39fcdf37be7ae3a0552
 size 94765560

 version https://git-lfs.github.com/spec/v1
+oid sha256:2a3bee6833ba8b12da8d51850147bb3c3b153eec346dfd3b0fda4ff730aa9026
 size 94765560

checkpoint-24/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ea879235e07d8970f1c22eb53e2c7884154e7269b0995315fa875740c3c99644
 size 189556666

 version https://git-lfs.github.com/spec/v1
+oid sha256:856d9a47a6db002c6e55d97a99db231cee10d1fef5c0909f7d527b86c30af746
 size 189556666

checkpoint-24/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1dfbead32b1c4ff8d1271c1899bd626bf08d46cbc21d2769431f03d7912b1368
 size 14308

 version https://git-lfs.github.com/spec/v1
+oid sha256:202bb63ca18cd0b022bafcf6cf19faa822d2e1dbc2cdaf6b5a9bdcbe21ca7562
 size 14308

checkpoint-24/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a3b5edb3a337b55456e10de8e5d582a8acbe41a6ddc5e0ffb6c3463e1e8bd89e
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:7a45410ab60db58a246b1af794984e39ea7655e4cee627c4cdfe5bd40727f72a
 size 1064

checkpoint-24/trainer_state.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "best_metric": 0.5193798449612403,
   "best_model_checkpoint": "distilhubert-finetuned-mixed-data/checkpoint-24",
   "epoch": 0.9896907216494846,
   "eval_steps": 500,
@@ -10,21 +10,21 @@
   "log_history": [
     {
       "epoch": 0.9896907216494846,
-      "eval_accuracy": 0.5193798449612403,
-      "eval_f1": 0.40212917110679286,
-      "eval_loss": 1.1225358247756958,
-      "eval_precision": 0.33630594789914475,
-      "eval_recall": 0.5193798449612403,
-      "eval_runtime": 1.6647,
-      "eval_samples_per_second": 232.47,
-      "eval_steps_per_second": 29.434,
       "step": 24
     }
   ],
   "logging_steps": 500,
-  "max_steps": 24,
   "num_input_tokens_seen": 0,
-  "num_train_epochs": 1,
   "save_steps": 500,
   "stateful_callbacks": {
     "EarlyStoppingCallback": {
@@ -42,12 +42,12 @@
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
-        "should_training_stop": true
       },
       "attributes": {}
     }
   },
-  "total_flos": 3493211996160000.0,
   "train_batch_size": 8,
   "trial_name": null,
   "trial_params": null

 {
+  "best_metric": 0.6356589147286822,
   "best_model_checkpoint": "distilhubert-finetuned-mixed-data/checkpoint-24",
   "epoch": 0.9896907216494846,
   "eval_steps": 500,
   "log_history": [
     {
       "epoch": 0.9896907216494846,
+      "eval_accuracy": 0.6356589147286822,
+      "eval_f1": 0.5920563016978556,
+      "eval_loss": 0.980873703956604,
+      "eval_precision": 0.5920482291587493,
+      "eval_recall": 0.6356589147286822,
+      "eval_runtime": 1.6668,
+      "eval_samples_per_second": 232.175,
+      "eval_steps_per_second": 29.397,
       "step": 24
     }
   ],
   "logging_steps": 500,
+  "max_steps": 360,
   "num_input_tokens_seen": 0,
+  "num_train_epochs": 15,
   "save_steps": 500,
   "stateful_callbacks": {
     "EarlyStoppingCallback": {
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
+        "should_training_stop": false
       },
       "attributes": {}
     }
   },
+  "total_flos": 3513680035200000.0,
   "train_batch_size": 8,
   "trial_name": null,
   "trial_params": null

checkpoint-24/training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c712b343688a0deff84bdfb1bfec65a5350ebb13af4be1817584730c46e10303
 size 5240

 version https://git-lfs.github.com/spec/v1
+oid sha256:347144964cf2be899f8dce858b11b47f463178200e095ec0ecada560c69f675a
 size 5240

checkpoint-242/config.json ADDED Viewed

	@@ -0,0 +1,85 @@

+{
+  "_name_or_path": "ntu-spml/distilhubert",
+  "activation_dropout": 0.1,
+  "apply_spec_augment": false,
+  "architectures": [
+    "HubertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "bos_token_id": 1,
+  "classifier_proj_size": 256,
+  "conv_bias": false,
+  "conv_dim": [
+    512,
+    512,
+    512,
+    512,
+    512,
+    512,
+    512
+  ],
+  "conv_kernel": [
+    10,
+    3,
+    3,
+    3,
+    3,
+    2,
+    2
+  ],
+  "conv_stride": [
+    5,
+    2,
+    2,
+    2,
+    2,
+    2,
+    2
+  ],
+  "ctc_loss_reduction": "sum",
+  "ctc_zero_infinity": false,
+  "do_stable_layer_norm": false,
+  "eos_token_id": 2,
+  "feat_extract_activation": "gelu",
+  "feat_extract_norm": "group",
+  "feat_proj_dropout": 0.0,
+  "feat_proj_layer_norm": false,
+  "final_dropout": 0.0,
+  "finetuning_task": "audio-classification",
+  "hidden_act": "gelu",
+  "hidden_dropout": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "1s_normal",
+    "1": "1s_pain",
+    "2": "1s_hunger",
+    "3": "1s_asphyxia"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "1s_asphyxia": 3,
+    "1s_hunger": 2,
+    "1s_normal": 0,
+    "1s_pain": 1
+  },
+  "layer_norm_eps": 1e-05,
+  "layerdrop": 0.0,
+  "mask_feature_length": 10,
+  "mask_feature_min_masks": 0,
+  "mask_feature_prob": 0.0,
+  "mask_time_length": 10,
+  "mask_time_min_masks": 2,
+  "mask_time_prob": 0.05,
+  "model_type": "hubert",
+  "num_attention_heads": 12,
+  "num_conv_pos_embedding_groups": 16,
+  "num_conv_pos_embeddings": 128,
+  "num_feat_extract_layers": 7,
+  "num_hidden_layers": 2,
+  "pad_token_id": 0,
+  "torch_dtype": "float32",
+  "transformers_version": "4.44.2",
+  "use_weighted_layer_sum": false,
+  "vocab_size": 32
+}

checkpoint-242/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2c3c3acfb39a1584bdad8c4452c6a99cc55d03b67d4754ef55bdc31be94eb5b7
+size 94765560

checkpoint-242/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:529f05dfd1fdfa07d440221559587dda8eded6dd4e7f89fd777f0ac7f24f5fee
+size 189556666

checkpoint-242/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e731e4993f8e25825c268c79f8c5e714e7bddf10c95d3c48fd5bec091ada0032
+size 14308

checkpoint-242/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:781bb61f6baa40042311c990cc82713d83cdc179ccb43dbb9cdd148961a2e8ad
+size 1064

checkpoint-242/trainer_state.json ADDED Viewed

	@@ -0,0 +1,162 @@

+{
+  "best_metric": 0.8578811369509044,
+  "best_model_checkpoint": "distilhubert-finetuned-mixed-data/checkpoint-242",
+  "epoch": 9.97938144329897,
+  "eval_steps": 500,
+  "global_step": 242,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.9896907216494846,
+      "eval_accuracy": 0.6356589147286822,
+      "eval_f1": 0.5920563016978556,
+      "eval_loss": 0.980873703956604,
+      "eval_precision": 0.5920482291587493,
+      "eval_recall": 0.6356589147286822,
+      "eval_runtime": 1.6668,
+      "eval_samples_per_second": 232.175,
+      "eval_steps_per_second": 29.397,
+      "step": 24
+    },
+    {
+      "epoch": 1.9793814432989691,
+      "eval_accuracy": 0.7157622739018088,
+      "eval_f1": 0.6905410405322238,
+      "eval_loss": 0.7444477081298828,
+      "eval_precision": 0.6992377248989063,
+      "eval_recall": 0.7157622739018088,
+      "eval_runtime": 1.6941,
+      "eval_samples_per_second": 228.443,
+      "eval_steps_per_second": 28.924,
+      "step": 48
+    },
+    {
+      "epoch": 2.9690721649484537,
+      "eval_accuracy": 0.7493540051679587,
+      "eval_f1": 0.744898505571463,
+      "eval_loss": 0.6171658039093018,
+      "eval_precision": 0.7437592422989429,
+      "eval_recall": 0.7493540051679587,
+      "eval_runtime": 1.6943,
+      "eval_samples_per_second": 228.408,
+      "eval_steps_per_second": 28.92,
+      "step": 72
+    },
+    {
+      "epoch": 4.0,
+      "eval_accuracy": 0.7984496124031008,
+      "eval_f1": 0.7873621619744228,
+      "eval_loss": 0.5430988073348999,
+      "eval_precision": 0.79180344284319,
+      "eval_recall": 0.7984496124031008,
+      "eval_runtime": 1.7027,
+      "eval_samples_per_second": 227.289,
+      "eval_steps_per_second": 28.778,
+      "step": 97
+    },
+    {
+      "epoch": 4.989690721649485,
+      "eval_accuracy": 0.8010335917312662,
+      "eval_f1": 0.7974946178390901,
+      "eval_loss": 0.5268548130989075,
+      "eval_precision": 0.8005965453214461,
+      "eval_recall": 0.8010335917312662,
+      "eval_runtime": 1.6829,
+      "eval_samples_per_second": 229.957,
+      "eval_steps_per_second": 29.116,
+      "step": 121
+    },
+    {
+      "epoch": 5.979381443298969,
+      "eval_accuracy": 0.7493540051679587,
+      "eval_f1": 0.7551329793037762,
+      "eval_loss": 0.5810549259185791,
+      "eval_precision": 0.7802262423287315,
+      "eval_recall": 0.7493540051679587,
+      "eval_runtime": 1.6999,
+      "eval_samples_per_second": 227.658,
+      "eval_steps_per_second": 28.825,
+      "step": 145
+    },
+    {
+      "epoch": 6.969072164948454,
+      "eval_accuracy": 0.8397932816537468,
+      "eval_f1": 0.8354840008265724,
+      "eval_loss": 0.44080850481987,
+      "eval_precision": 0.8365717854569443,
+      "eval_recall": 0.8397932816537468,
+      "eval_runtime": 1.6785,
+      "eval_samples_per_second": 230.56,
+      "eval_steps_per_second": 29.192,
+      "step": 169
+    },
+    {
+      "epoch": 8.0,
+      "eval_accuracy": 0.8191214470284238,
+      "eval_f1": 0.8167837576120855,
+      "eval_loss": 0.46871018409729004,
+      "eval_precision": 0.8187643627479353,
+      "eval_recall": 0.8191214470284238,
+      "eval_runtime": 1.6719,
+      "eval_samples_per_second": 231.477,
+      "eval_steps_per_second": 29.308,
+      "step": 194
+    },
+    {
+      "epoch": 8.989690721649485,
+      "eval_accuracy": 0.8475452196382429,
+      "eval_f1": 0.8473710740005564,
+      "eval_loss": 0.4363822937011719,
+      "eval_precision": 0.8483238707679635,
+      "eval_recall": 0.8475452196382429,
+      "eval_runtime": 1.6838,
+      "eval_samples_per_second": 229.835,
+      "eval_steps_per_second": 29.101,
+      "step": 218
+    },
+    {
+      "epoch": 9.97938144329897,
+      "eval_accuracy": 0.8578811369509044,
+      "eval_f1": 0.8567532661685897,
+      "eval_loss": 0.42906680703163147,
+      "eval_precision": 0.8560504853170988,
+      "eval_recall": 0.8578811369509044,
+      "eval_runtime": 1.6875,
+      "eval_samples_per_second": 229.333,
+      "eval_steps_per_second": 29.037,
+      "step": 242
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 360,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 15,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "EarlyStoppingCallback": {
+      "args": {
+        "early_stopping_patience": 3,
+        "early_stopping_threshold": 0.0
+      },
+      "attributes": {
+        "early_stopping_patience_counter": 0
+      }
+    },
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 3.5136800352e+16,
+  "train_batch_size": 8,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-242/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:347144964cf2be899f8dce858b11b47f463178200e095ec0ecada560c69f675a
+size 5240

checkpoint-266/config.json ADDED Viewed

	@@ -0,0 +1,85 @@

+{
+  "_name_or_path": "ntu-spml/distilhubert",
+  "activation_dropout": 0.1,
+  "apply_spec_augment": false,
+  "architectures": [
+    "HubertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "bos_token_id": 1,
+  "classifier_proj_size": 256,
+  "conv_bias": false,
+  "conv_dim": [
+    512,
+    512,
+    512,
+    512,
+    512,
+    512,
+    512
+  ],
+  "conv_kernel": [
+    10,
+    3,
+    3,
+    3,
+    3,
+    2,
+    2
+  ],
+  "conv_stride": [
+    5,
+    2,
+    2,
+    2,
+    2,
+    2,
+    2
+  ],
+  "ctc_loss_reduction": "sum",
+  "ctc_zero_infinity": false,
+  "do_stable_layer_norm": false,
+  "eos_token_id": 2,
+  "feat_extract_activation": "gelu",
+  "feat_extract_norm": "group",
+  "feat_proj_dropout": 0.0,
+  "feat_proj_layer_norm": false,
+  "final_dropout": 0.0,
+  "finetuning_task": "audio-classification",
+  "hidden_act": "gelu",
+  "hidden_dropout": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "1s_normal",
+    "1": "1s_pain",
+    "2": "1s_hunger",
+    "3": "1s_asphyxia"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "1s_asphyxia": 3,
+    "1s_hunger": 2,
+    "1s_normal": 0,
+    "1s_pain": 1
+  },
+  "layer_norm_eps": 1e-05,
+  "layerdrop": 0.0,
+  "mask_feature_length": 10,
+  "mask_feature_min_masks": 0,
+  "mask_feature_prob": 0.0,
+  "mask_time_length": 10,
+  "mask_time_min_masks": 2,
+  "mask_time_prob": 0.05,
+  "model_type": "hubert",
+  "num_attention_heads": 12,
+  "num_conv_pos_embedding_groups": 16,
+  "num_conv_pos_embeddings": 128,
+  "num_feat_extract_layers": 7,
+  "num_hidden_layers": 2,
+  "pad_token_id": 0,
+  "torch_dtype": "float32",
+  "transformers_version": "4.44.2",
+  "use_weighted_layer_sum": false,
+  "vocab_size": 32
+}

checkpoint-266/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b40af64761e85d5fea70c649217c8cc140a31cb9ca6b3839f952a2bb9f87e0b2
+size 94765560

checkpoint-266/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2157435343c02544baabe61713043b7b3749a01b1cc4aeeb2340f89faf040460
+size 189556666