Marcos12886 committed on Sep 1, 2024

Commit

969bb37

verified ·

1 Parent(s): e0f3ecc

Upload folder using huggingface_hub

Browse files

This view is limited to 50 files because it contains too many changes. See raw diff

Files changed (50) hide show

README.md +105 -3
checkpoint-111/config.json +84 -0
checkpoint-111/model.safetensors +3 -0
checkpoint-111/optimizer.pt +3 -0
checkpoint-111/preprocessor_config.json +9 -0
checkpoint-111/rng_state.pth +3 -0
checkpoint-111/scheduler.pt +3 -0
checkpoint-111/trainer_state.json +114 -0
checkpoint-111/training_args.bin +3 -0
checkpoint-130/config.json +84 -0
checkpoint-130/model.safetensors +3 -0
checkpoint-130/optimizer.pt +3 -0
checkpoint-130/preprocessor_config.json +9 -0
checkpoint-130/rng_state.pth +3 -0
checkpoint-130/scheduler.pt +3 -0
checkpoint-130/trainer_state.json +126 -0
checkpoint-130/training_args.bin +3 -0
checkpoint-135/config.json +84 -0
checkpoint-135/model.safetensors +3 -0
checkpoint-135/optimizer.pt +3 -0
checkpoint-135/preprocessor_config.json +9 -0
checkpoint-135/rng_state.pth +3 -0
checkpoint-135/scheduler.pt +3 -0
checkpoint-135/trainer_state.json +60 -0
checkpoint-135/training_args.bin +3 -0
checkpoint-136/config.json +84 -0
checkpoint-136/model.safetensors +3 -0
checkpoint-136/optimizer.pt +3 -0
checkpoint-136/preprocessor_config.json +9 -0
checkpoint-136/rng_state.pth +3 -0
checkpoint-136/scheduler.pt +3 -0
checkpoint-136/trainer_state.json +60 -0
checkpoint-136/training_args.bin +3 -0
checkpoint-149/config.json +84 -0
checkpoint-149/model.safetensors +3 -0
checkpoint-149/optimizer.pt +3 -0
checkpoint-149/preprocessor_config.json +9 -0
checkpoint-149/rng_state.pth +3 -0
checkpoint-149/scheduler.pt +3 -0
checkpoint-149/trainer_state.json +138 -0
checkpoint-149/training_args.bin +3 -0
checkpoint-167/config.json +84 -0
checkpoint-167/model.safetensors +3 -0
checkpoint-167/optimizer.pt +3 -0
checkpoint-167/preprocessor_config.json +9 -0
checkpoint-167/rng_state.pth +3 -0
checkpoint-167/scheduler.pt +3 -0
checkpoint-167/trainer_state.json +150 -0
checkpoint-167/training_args.bin +3 -0
checkpoint-18/config.json +84 -0

README.md CHANGED Viewed

@@ -1,3 +1,105 @@
----
-license: apache-2.0
----

+---
+library_name: transformers
+license: apache-2.0
+base_model: ntu-spml/distilhubert
+tags:
+- generated_from_trainer
+datasets:
+- audiofolder
+metrics:
+- accuracy
+- f1
+- precision
+- recall
+model-index:
+- name: distilhubert-finetuned-mixed-data
+  results:
+  - task:
+      name: Audio Classification
+      type: audio-classification
+    dataset:
+      name: audiofolder
+      type: audiofolder
+      config: default
+      split: train
+      args: default
+    metrics:
+    - name: Accuracy
+      type: accuracy
+      value: 0.9026845637583892
+    - name: F1
+      type: f1
+      value: 0.9017814679012008
+    - name: Precision
+      type: precision
+      value: 0.901095676384633
+    - name: Recall
+      type: recall
+      value: 0.9026845637583892
+---
+<!-- This model card has been generated automatically according to the information the Trainer had access to. You
+should probably proofread and complete it, then remove this comment. -->
+# distilhubert-finetuned-mixed-data
+This model is a fine-tuned version of [ntu-spml/distilhubert](https://huggingface.co/ntu-spml/distilhubert) on the audiofolder dataset.
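+It achieves the following results on the evaluation set (these are the figures from the final evaluation at step 216; the highest accuracy in the training-results table below, 0.9094, was recorded at step 204):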
+- Loss: 0.2976
+- Accuracy: 0.9027
+- F1: 0.9018
+- Precision: 0.9011
+- Recall: 0.9027
+## Model description
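+The model is a `HubertForSequenceClassification` checkpoint fine-tuned from DistilHuBERT that classifies audio into four labels (`1s_asphyxia`, `1s_hunger`, `1s_normal`, `1s_pain`); the bundled feature extractor is configured for 16 kHz input. More information is needed on the data sources and intended use.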
+## Intended uses & limitations
+More information needed
+## Training and evaluation data
+More information needed
+## Training procedure
+### Training hyperparameters
+The following hyperparameters were used during training:
+- learning_rate: 0.0001
+- train_batch_size: 8
+- eval_batch_size: 8
+- seed: 123
+- gradient_accumulation_steps: 8
+- total_train_batch_size: 64
+- optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
+- lr_scheduler_type: cosine
+- lr_scheduler_warmup_ratio: 0.001
+- num_epochs: 12
+### Training results
+| Training Loss | Epoch   | Step | Validation Loss | Accuracy | F1     | Precision | Recall |
+|:-------------:|:-------:|:----:|:---------------:|:--------:|:------:|:---------:|:------:|
+| No log        | 0.9664  | 18   | 0.6696          | 0.7819   | 0.7264 | 0.6898    | 0.7819 |
+| No log        | 1.9866  | 37   | 0.5068          | 0.7752   | 0.7203 | 0.6849    | 0.7752 |
+| No log        | 2.9530  | 55   | 0.4304          | 0.8087   | 0.7535 | 0.7242    | 0.8087 |
+| No log        | 3.9732  | 74   | 0.4109          | 0.8523   | 0.8434 | 0.8728    | 0.8523 |
+| No log        | 4.9933  | 93   | 0.3263          | 0.8725   | 0.8718 | 0.8719    | 0.8725 |
+| No log        | 5.9597  | 111  | 0.3036          | 0.8826   | 0.8824 | 0.8824    | 0.8826 |
+| No log        | 6.9799  | 130  | 0.3046          | 0.8893   | 0.8876 | 0.8892    | 0.8893 |
+| No log        | 8.0     | 149  | 0.3244          | 0.8758   | 0.8770 | 0.8787    | 0.8758 |
+| No log        | 8.9664  | 167  | 0.2962          | 0.9027   | 0.9018 | 0.9012    | 0.9027 |
+| No log        | 9.9866  | 186  | 0.2971          | 0.9027   | 0.9010 | 0.9014    | 0.9027 |
+| No log        | 10.9530 | 204  | 0.2974          | 0.9094   | 0.9082 | 0.9077    | 0.9094 |
+| No log        | 11.5973 | 216  | 0.2976          | 0.9027   | 0.9018 | 0.9011    | 0.9027 |
+### Framework versions
+- Transformers 4.44.2
+- Pytorch 2.4.0+cu121
+- Datasets 2.21.0
+- Tokenizers 0.19.1

checkpoint-111/config.json ADDED Viewed

	@@ -0,0 +1,84 @@

+{
+  "_name_or_path": "ntu-spml/distilhubert",
+  "activation_dropout": 0.1,
+  "apply_spec_augment": false,
+  "architectures": [
+    "HubertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "bos_token_id": 1,
+  "classifier_proj_size": 256,
+  "conv_bias": false,
+  "conv_dim": [
+    512,
+    512,
+    512,
+    512,
+    512,
+    512,
+    512
+  ],
+  "conv_kernel": [
+    10,
+    3,
+    3,
+    3,
+    3,
+    2,
+    2
+  ],
+  "conv_stride": [
+    5,
+    2,
+    2,
+    2,
+    2,
+    2,
+    2
+  ],
+  "ctc_loss_reduction": "sum",
+  "ctc_zero_infinity": false,
+  "do_stable_layer_norm": false,
+  "eos_token_id": 2,
+  "feat_extract_activation": "gelu",
+  "feat_extract_norm": "group",
+  "feat_proj_dropout": 0.0,
+  "feat_proj_layer_norm": false,
+  "final_dropout": 0.0,
+  "hidden_act": "gelu",
+  "hidden_dropout": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "1s_asphyxia",
+    "1": "1s_hunger",
+    "2": "1s_normal",
+    "3": "1s_pain"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "1s_asphyxia": "0",
+    "1s_hunger": "1",
+    "1s_normal": "2",
+    "1s_pain": "3"
+  },
+  "layer_norm_eps": 1e-05,
+  "layerdrop": 0.0,
+  "mask_feature_length": 10,
+  "mask_feature_min_masks": 0,
+  "mask_feature_prob": 0.0,
+  "mask_time_length": 10,
+  "mask_time_min_masks": 2,
+  "mask_time_prob": 0.05,
+  "model_type": "hubert",
+  "num_attention_heads": 12,
+  "num_conv_pos_embedding_groups": 16,
+  "num_conv_pos_embeddings": 128,
+  "num_feat_extract_layers": 7,
+  "num_hidden_layers": 2,
+  "pad_token_id": 0,
+  "torch_dtype": "float32",
+  "transformers_version": "4.44.2",
+  "use_weighted_layer_sum": false,
+  "vocab_size": 32
+}

checkpoint-111/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8afb68ff2611e3603dee528e572e6fc36c40e47cec34c6ee683636922c8055e1
+size 94765560

checkpoint-111/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:105e2897a04f3a74cea8691093cd964cb3e2476cb37888e94bd97ac020d7bc23
+size 189556666

checkpoint-111/preprocessor_config.json ADDED Viewed

	@@ -0,0 +1,9 @@

+{
+  "do_normalize": false,
+  "feature_extractor_type": "Wav2Vec2FeatureExtractor",
+  "feature_size": 1,
+  "padding_side": "right",
+  "padding_value": 0,
+  "return_attention_mask": false,
+  "sampling_rate": 16000
+}

checkpoint-111/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:60f43e7fdf5def6846b069020fb2803b19ffc2aab112709cf440ff32a8a2bc9b
+size 14308

checkpoint-111/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:fd5bf82e806804b25d214305b99f2c178bc6f19a61f077621eaca5b3cb5523cd
+size 1064

checkpoint-111/trainer_state.json ADDED Viewed

	@@ -0,0 +1,114 @@

+{
+  "best_metric": 0.8825503355704698,
+  "best_model_checkpoint": "distilhubert-finetuned-mixed-data/checkpoint-111",
+  "epoch": 5.959731543624161,
+  "eval_steps": 500,
+  "global_step": 111,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.9664429530201343,
+      "eval_accuracy": 0.7818791946308725,
+      "eval_f1": 0.7264205130236912,
+      "eval_loss": 0.669560968875885,
+      "eval_precision": 0.689807639599501,
+      "eval_recall": 0.7818791946308725,
+      "eval_runtime": 0.9033,
+      "eval_samples_per_second": 329.896,
+      "eval_steps_per_second": 42.067,
+      "step": 18
+    },
+    {
+      "epoch": 1.9865771812080537,
+      "eval_accuracy": 0.7751677852348994,
+      "eval_f1": 0.7202681570933687,
+      "eval_loss": 0.5067932605743408,
+      "eval_precision": 0.684911313518696,
+      "eval_recall": 0.7751677852348994,
+      "eval_runtime": 0.907,
+      "eval_samples_per_second": 328.546,
+      "eval_steps_per_second": 41.895,
+      "step": 37
+    },
+    {
+      "epoch": 2.953020134228188,
+      "eval_accuracy": 0.8087248322147651,
+      "eval_f1": 0.7535236037076262,
+      "eval_loss": 0.43038079142570496,
+      "eval_precision": 0.7241626365959,
+      "eval_recall": 0.8087248322147651,
+      "eval_runtime": 0.8664,
+      "eval_samples_per_second": 343.963,
+      "eval_steps_per_second": 43.861,
+      "step": 55
+    },
+    {
+      "epoch": 3.9731543624161074,
+      "eval_accuracy": 0.8523489932885906,
+      "eval_f1": 0.8433916249277822,
+      "eval_loss": 0.4109182059764862,
+      "eval_precision": 0.8727817866814688,
+      "eval_recall": 0.8523489932885906,
+      "eval_runtime": 0.8712,
+      "eval_samples_per_second": 342.059,
+      "eval_steps_per_second": 43.618,
+      "step": 74
+    },
+    {
+      "epoch": 4.993288590604027,
+      "eval_accuracy": 0.87248322147651,
+      "eval_f1": 0.8717711524765707,
+      "eval_loss": 0.3263051509857178,
+      "eval_precision": 0.8718521382399975,
+      "eval_recall": 0.87248322147651,
+      "eval_runtime": 0.87,
+      "eval_samples_per_second": 342.548,
+      "eval_steps_per_second": 43.681,
+      "step": 93
+    },
+    {
+      "epoch": 5.959731543624161,
+      "eval_accuracy": 0.8825503355704698,
+      "eval_f1": 0.8824400125399595,
+      "eval_loss": 0.3035907447338104,
+      "eval_precision": 0.8824270850226767,
+      "eval_recall": 0.8825503355704698,
+      "eval_runtime": 0.8921,
+      "eval_samples_per_second": 334.055,
+      "eval_steps_per_second": 42.598,
+      "step": 111
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 216,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 12,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "EarlyStoppingCallback": {
+      "args": {
+        "early_stopping_patience": 3,
+        "early_stopping_threshold": 0.0
+      },
+      "attributes": {
+        "early_stopping_patience_counter": 0
+      }
+    },
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 1.62379776384e+16,
+  "train_batch_size": 8,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-111/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:296be9afae72ab3934d873f0cf92f87ef76899c18b11651de670afb49aa1a5d6
+size 5240

checkpoint-130/config.json ADDED Viewed

	@@ -0,0 +1,84 @@

+{
+  "_name_or_path": "ntu-spml/distilhubert",
+  "activation_dropout": 0.1,
+  "apply_spec_augment": false,
+  "architectures": [
+    "HubertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "bos_token_id": 1,
+  "classifier_proj_size": 256,
+  "conv_bias": false,
+  "conv_dim": [
+    512,
+    512,
+    512,
+    512,
+    512,
+    512,
+    512
+  ],
+  "conv_kernel": [
+    10,
+    3,
+    3,
+    3,
+    3,
+    2,
+    2
+  ],
+  "conv_stride": [
+    5,
+    2,
+    2,
+    2,
+    2,
+    2,
+    2
+  ],
+  "ctc_loss_reduction": "sum",
+  "ctc_zero_infinity": false,
+  "do_stable_layer_norm": false,
+  "eos_token_id": 2,
+  "feat_extract_activation": "gelu",
+  "feat_extract_norm": "group",
+  "feat_proj_dropout": 0.0,
+  "feat_proj_layer_norm": false,
+  "final_dropout": 0.0,
+  "hidden_act": "gelu",
+  "hidden_dropout": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "1s_asphyxia",
+    "1": "1s_hunger",
+    "2": "1s_normal",
+    "3": "1s_pain"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "1s_asphyxia": "0",
+    "1s_hunger": "1",
+    "1s_normal": "2",
+    "1s_pain": "3"
+  },
+  "layer_norm_eps": 1e-05,
+  "layerdrop": 0.0,
+  "mask_feature_length": 10,
+  "mask_feature_min_masks": 0,
+  "mask_feature_prob": 0.0,
+  "mask_time_length": 10,
+  "mask_time_min_masks": 2,
+  "mask_time_prob": 0.05,
+  "model_type": "hubert",
+  "num_attention_heads": 12,
+  "num_conv_pos_embedding_groups": 16,
+  "num_conv_pos_embeddings": 128,
+  "num_feat_extract_layers": 7,
+  "num_hidden_layers": 2,
+  "pad_token_id": 0,
+  "torch_dtype": "float32",
+  "transformers_version": "4.44.2",
+  "use_weighted_layer_sum": false,
+  "vocab_size": 32
+}

checkpoint-130/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3274a950ef7996900990e6a908894c38407a87245d2e54fd2d49a70f893d18d7
+size 94765560

checkpoint-130/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:350d7e738f5a2fe60a4aaaa7bf1f954bab46678f8d6d6a8b53d70e92d336058a
+size 189556666

checkpoint-130/preprocessor_config.json ADDED Viewed

	@@ -0,0 +1,9 @@

+{
+  "do_normalize": false,
+  "feature_extractor_type": "Wav2Vec2FeatureExtractor",
+  "feature_size": 1,
+  "padding_side": "right",
+  "padding_value": 0,
+  "return_attention_mask": false,
+  "sampling_rate": 16000
+}

checkpoint-130/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:52ce1903887f6eefecdbafa965766c8b4e5f6264b39c386f85053529854ad6aa
+size 14308

checkpoint-130/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2c8f63f56197268202aa5b134a342d5425bd11184ac819d7eb62d725e5d31de3
+size 1064

checkpoint-130/trainer_state.json ADDED Viewed

	@@ -0,0 +1,126 @@

+{
+  "best_metric": 0.889261744966443,
+  "best_model_checkpoint": "distilhubert-finetuned-mixed-data/checkpoint-130",
+  "epoch": 6.97986577181208,
+  "eval_steps": 500,
+  "global_step": 130,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.9664429530201343,
+      "eval_accuracy": 0.7818791946308725,
+      "eval_f1": 0.7264205130236912,
+      "eval_loss": 0.669560968875885,
+      "eval_precision": 0.689807639599501,
+      "eval_recall": 0.7818791946308725,
+      "eval_runtime": 0.9033,
+      "eval_samples_per_second": 329.896,
+      "eval_steps_per_second": 42.067,
+      "step": 18
+    },
+    {
+      "epoch": 1.9865771812080537,
+      "eval_accuracy": 0.7751677852348994,
+      "eval_f1": 0.7202681570933687,
+      "eval_loss": 0.5067932605743408,
+      "eval_precision": 0.684911313518696,
+      "eval_recall": 0.7751677852348994,
+      "eval_runtime": 0.907,
+      "eval_samples_per_second": 328.546,
+      "eval_steps_per_second": 41.895,
+      "step": 37
+    },
+    {
+      "epoch": 2.953020134228188,
+      "eval_accuracy": 0.8087248322147651,
+      "eval_f1": 0.7535236037076262,
+      "eval_loss": 0.43038079142570496,
+      "eval_precision": 0.7241626365959,
+      "eval_recall": 0.8087248322147651,
+      "eval_runtime": 0.8664,
+      "eval_samples_per_second": 343.963,
+      "eval_steps_per_second": 43.861,
+      "step": 55
+    },
+    {
+      "epoch": 3.9731543624161074,
+      "eval_accuracy": 0.8523489932885906,
+      "eval_f1": 0.8433916249277822,
+      "eval_loss": 0.4109182059764862,
+      "eval_precision": 0.8727817866814688,
+      "eval_recall": 0.8523489932885906,
+      "eval_runtime": 0.8712,
+      "eval_samples_per_second": 342.059,
+      "eval_steps_per_second": 43.618,
+      "step": 74
+    },
+    {
+      "epoch": 4.993288590604027,
+      "eval_accuracy": 0.87248322147651,
+      "eval_f1": 0.8717711524765707,
+      "eval_loss": 0.3263051509857178,
+      "eval_precision": 0.8718521382399975,
+      "eval_recall": 0.87248322147651,
+      "eval_runtime": 0.87,
+      "eval_samples_per_second": 342.548,
+      "eval_steps_per_second": 43.681,
+      "step": 93
+    },
+    {
+      "epoch": 5.959731543624161,
+      "eval_accuracy": 0.8825503355704698,
+      "eval_f1": 0.8824400125399595,
+      "eval_loss": 0.3035907447338104,
+      "eval_precision": 0.8824270850226767,
+      "eval_recall": 0.8825503355704698,
+      "eval_runtime": 0.8921,
+      "eval_samples_per_second": 334.055,
+      "eval_steps_per_second": 42.598,
+      "step": 111
+    },
+    {
+      "epoch": 6.97986577181208,
+      "eval_accuracy": 0.889261744966443,
+      "eval_f1": 0.8876321254746313,
+      "eval_loss": 0.3046204149723053,
+      "eval_precision": 0.8891935449502327,
+      "eval_recall": 0.889261744966443,
+      "eval_runtime": 0.894,
+      "eval_samples_per_second": 333.317,
+      "eval_steps_per_second": 42.504,
+      "step": 130
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 216,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 12,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "EarlyStoppingCallback": {
+      "args": {
+        "early_stopping_patience": 3,
+        "early_stopping_threshold": 0.0
+      },
+      "attributes": {
+        "early_stopping_patience_counter": 0
+      }
+    },
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 1.89443072448e+16,
+  "train_batch_size": 8,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-130/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:296be9afae72ab3934d873f0cf92f87ef76899c18b11651de670afb49aa1a5d6
+size 5240

checkpoint-135/config.json ADDED Viewed

	@@ -0,0 +1,84 @@

+{
+  "_name_or_path": "ntu-spml/distilhubert",
+  "activation_dropout": 0.1,
+  "apply_spec_augment": false,
+  "architectures": [
+    "HubertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "bos_token_id": 1,
+  "classifier_proj_size": 256,
+  "conv_bias": false,
+  "conv_dim": [
+    512,
+    512,
+    512,
+    512,
+    512,
+    512,
+    512
+  ],
+  "conv_kernel": [
+    10,
+    3,
+    3,
+    3,
+    3,
+    2,
+    2
+  ],
+  "conv_stride": [
+    5,
+    2,
+    2,
+    2,
+    2,
+    2,
+    2
+  ],
+  "ctc_loss_reduction": "sum",
+  "ctc_zero_infinity": false,
+  "do_stable_layer_norm": false,
+  "eos_token_id": 2,
+  "feat_extract_activation": "gelu",
+  "feat_extract_norm": "group",
+  "feat_proj_dropout": 0.0,
+  "feat_proj_layer_norm": false,
+  "final_dropout": 0.0,
+  "hidden_act": "gelu",
+  "hidden_dropout": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "1s_pain",
+    "1": "1s_normal",
+    "2": "1s_asphyxia",
+    "3": "1s_hunger"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "1s_asphyxia": "2",
+    "1s_hunger": "3",
+    "1s_normal": "1",
+    "1s_pain": "0"
+  },
+  "layer_norm_eps": 1e-05,
+  "layerdrop": 0.0,
+  "mask_feature_length": 10,
+  "mask_feature_min_masks": 0,
+  "mask_feature_prob": 0.0,
+  "mask_time_length": 10,
+  "mask_time_min_masks": 2,
+  "mask_time_prob": 0.05,
+  "model_type": "hubert",
+  "num_attention_heads": 12,
+  "num_conv_pos_embedding_groups": 16,
+  "num_conv_pos_embeddings": 128,
+  "num_feat_extract_layers": 7,
+  "num_hidden_layers": 2,
+  "pad_token_id": 0,
+  "torch_dtype": "float32",
+  "transformers_version": "4.44.2",
+  "use_weighted_layer_sum": false,
+  "vocab_size": 32
+}

checkpoint-135/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9b04e455cb28d03199ae0547ed3d379f784d8b87502f896e8601b3a6dbbf5ed5
+size 94765560

checkpoint-135/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ff0a3920a3219c17d5246c0b0cc4d972ce476ded5ff479d1851bfa1e197f3c7d
+size 189556666

checkpoint-135/preprocessor_config.json ADDED Viewed

	@@ -0,0 +1,9 @@

+{
+  "do_normalize": false,
+  "feature_extractor_type": "Wav2Vec2FeatureExtractor",
+  "feature_size": 1,
+  "padding_side": "right",
+  "padding_value": 0,
+  "return_attention_mask": false,
+  "sampling_rate": 16000
+}

checkpoint-135/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c76852e73dfcd3d0470d5a6ce48f93321160ffa41866b87f241dcdf4dc19c2da
+size 14244

checkpoint-135/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e1a799a5fee1cd04ce0f342f7f115c3a396839d512d5eace9370b47e189b3242
+size 1064

checkpoint-135/trainer_state.json ADDED Viewed

	@@ -0,0 +1,60 @@

+{
+  "best_metric": 0.8301435406698564,
+  "best_model_checkpoint": "distilhubert-finetuned-mixed-data/checkpoint-135",
+  "epoch": 2.958904109589041,
+  "eval_steps": 500,
+  "global_step": 135,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.9863013698630136,
+      "eval_accuracy": 0.777511961722488,
+      "eval_loss": 0.561026930809021,
+      "eval_runtime": 1.0204,
+      "eval_samples_per_second": 409.634,
+      "eval_steps_per_second": 51.939,
+      "step": 45
+    },
+    {
+      "epoch": 1.9945205479452055,
+      "eval_accuracy": 0.8133971291866029,
+      "eval_loss": 0.43190622329711914,
+      "eval_runtime": 1.0273,
+      "eval_samples_per_second": 406.884,
+      "eval_steps_per_second": 51.591,
+      "step": 91
+    },
+    {
+      "epoch": 2.958904109589041,
+      "eval_accuracy": 0.8301435406698564,
+      "eval_loss": 0.40697425603866577,
+      "eval_runtime": 1.063,
+      "eval_samples_per_second": 393.225,
+      "eval_steps_per_second": 49.859,
+      "step": 135
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 135,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 3,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": true
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 1.964476902528e+16,
+  "train_batch_size": 8,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-135/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:58bee4dcd5fe0b58b30175a3b929b42d49bdcef85fb7a1c05e452879211375f4
+size 5240

checkpoint-136/config.json ADDED Viewed

	@@ -0,0 +1,84 @@

+{
+  "_name_or_path": "ntu-spml/distilhubert",
+  "activation_dropout": 0.1,
+  "apply_spec_augment": false,
+  "architectures": [
+    "HubertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "bos_token_id": 1,
+  "classifier_proj_size": 256,
+  "conv_bias": false,
+  "conv_dim": [
+    512,
+    512,
+    512,
+    512,
+    512,
+    512,
+    512
+  ],
+  "conv_kernel": [
+    10,
+    3,
+    3,
+    3,
+    3,
+    2,
+    2
+  ],
+  "conv_stride": [
+    5,
+    2,
+    2,
+    2,
+    2,
+    2,
+    2
+  ],
+  "ctc_loss_reduction": "sum",
+  "ctc_zero_infinity": false,
+  "do_stable_layer_norm": false,
+  "eos_token_id": 2,
+  "feat_extract_activation": "gelu",
+  "feat_extract_norm": "group",
+  "feat_proj_dropout": 0.0,
+  "feat_proj_layer_norm": false,
+  "final_dropout": 0.0,
+  "hidden_act": "gelu",
+  "hidden_dropout": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "1s_hunger",
+    "1": "1s_pain",
+    "2": "1s_normal",
+    "3": "1s_asphyxia"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "1s_asphyxia": "3",
+    "1s_hunger": "0",
+    "1s_normal": "2",
+    "1s_pain": "1"
+  },
+  "layer_norm_eps": 1e-05,
+  "layerdrop": 0.0,
+  "mask_feature_length": 10,
+  "mask_feature_min_masks": 0,
+  "mask_feature_prob": 0.0,
+  "mask_time_length": 10,
+  "mask_time_min_masks": 2,
+  "mask_time_prob": 0.05,
+  "model_type": "hubert",
+  "num_attention_heads": 12,
+  "num_conv_pos_embedding_groups": 16,
+  "num_conv_pos_embeddings": 128,
+  "num_feat_extract_layers": 7,
+  "num_hidden_layers": 2,
+  "pad_token_id": 0,
+  "torch_dtype": "float32",
+  "transformers_version": "4.44.2",
+  "use_weighted_layer_sum": false,
+  "vocab_size": 32
+}

checkpoint-136/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a2b4450db25ba5f0d510ec4e3306e7f346b1218297cc27efb9eb5549200298f0
+size 94765560

checkpoint-136/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1a4a094ba38c61e01742a1399183042512757ac7cef90decc84fa9ddd3e292d0
+size 189556666

checkpoint-136/preprocessor_config.json ADDED Viewed

	@@ -0,0 +1,9 @@

+{
+  "do_normalize": false,
+  "feature_extractor_type": "Wav2Vec2FeatureExtractor",
+  "feature_size": 1,
+  "padding_side": "right",
+  "padding_value": 0,
+  "return_attention_mask": false,
+  "sampling_rate": 16000
+}

checkpoint-136/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:05c109a88cfed134d7433f6a487d90e7431aae064934a30eee009d35114d91a8
+size 14244

checkpoint-136/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:02db814972e9031670f30187fddad96ad1438ee30746ac0e08e7fe64a2319de1
+size 1064

checkpoint-136/trainer_state.json ADDED Viewed

	@@ -0,0 +1,60 @@

+{
+  "best_metric": 0.8397129186602871,
+  "best_model_checkpoint": "distilhubert-finetuned-mixed-data/checkpoint-136",
+  "epoch": 2.9808219178082194,
+  "eval_steps": 500,
+  "global_step": 136,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.9863013698630136,
+      "eval_accuracy": 0.7942583732057417,
+      "eval_loss": 0.5718334913253784,
+      "eval_runtime": 1.0678,
+      "eval_samples_per_second": 391.448,
+      "eval_steps_per_second": 49.633,
+      "step": 45
+    },
+    {
+      "epoch": 1.9945205479452055,
+      "eval_accuracy": 0.80622009569378,
+      "eval_loss": 0.45444098114967346,
+      "eval_runtime": 1.0491,
+      "eval_samples_per_second": 398.444,
+      "eval_steps_per_second": 50.52,
+      "step": 91
+    },
+    {
+      "epoch": 2.9808219178082194,
+      "eval_accuracy": 0.8397129186602871,
+      "eval_loss": 0.3911355435848236,
+      "eval_runtime": 1.0412,
+      "eval_samples_per_second": 401.464,
+      "eval_steps_per_second": 50.903,
+      "step": 136
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 270,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 6,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 1.991540198592e+16,
+  "train_batch_size": 8,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-136/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3c9d41ebe9cd4a0039236a5c6d5456e94aa46eef860ab4ccc1c1578a2a2cbc20
+size 5240

checkpoint-149/config.json ADDED Viewed

	@@ -0,0 +1,84 @@

+{
+  "_name_or_path": "ntu-spml/distilhubert",
+  "activation_dropout": 0.1,
+  "apply_spec_augment": false,
+  "architectures": [
+    "HubertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "bos_token_id": 1,
+  "classifier_proj_size": 256,
+  "conv_bias": false,
+  "conv_dim": [
+    512,
+    512,
+    512,
+    512,
+    512,
+    512,
+    512
+  ],
+  "conv_kernel": [
+    10,
+    3,
+    3,
+    3,
+    3,
+    2,
+    2
+  ],
+  "conv_stride": [
+    5,
+    2,
+    2,
+    2,
+    2,
+    2,
+    2
+  ],
+  "ctc_loss_reduction": "sum",
+  "ctc_zero_infinity": false,
+  "do_stable_layer_norm": false,
+  "eos_token_id": 2,
+  "feat_extract_activation": "gelu",
+  "feat_extract_norm": "group",
+  "feat_proj_dropout": 0.0,
+  "feat_proj_layer_norm": false,
+  "final_dropout": 0.0,
+  "hidden_act": "gelu",
+  "hidden_dropout": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "1s_asphyxia",
+    "1": "1s_hunger",
+    "2": "1s_normal",
+    "3": "1s_pain"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "1s_asphyxia": "0",
+    "1s_hunger": "1",
+    "1s_normal": "2",
+    "1s_pain": "3"
+  },
+  "layer_norm_eps": 1e-05,
+  "layerdrop": 0.0,
+  "mask_feature_length": 10,
+  "mask_feature_min_masks": 0,
+  "mask_feature_prob": 0.0,
+  "mask_time_length": 10,
+  "mask_time_min_masks": 2,
+  "mask_time_prob": 0.05,
+  "model_type": "hubert",
+  "num_attention_heads": 12,
+  "num_conv_pos_embedding_groups": 16,
+  "num_conv_pos_embeddings": 128,
+  "num_feat_extract_layers": 7,
+  "num_hidden_layers": 2,
+  "pad_token_id": 0,
+  "torch_dtype": "float32",
+  "transformers_version": "4.44.2",
+  "use_weighted_layer_sum": false,
+  "vocab_size": 32
+}

checkpoint-149/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a39cbcf4e451fec6c5adf024114939d0eaeecc9eae9b358985fe76e17a289c71
+size 94765560

checkpoint-149/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:973fe719a94fc7d292682b0cea4b719eda84c95a7325e50f50602418d8e621c8
+size 189556666

checkpoint-149/preprocessor_config.json ADDED Viewed

	@@ -0,0 +1,9 @@

+{
+  "do_normalize": false,
+  "feature_extractor_type": "Wav2Vec2FeatureExtractor",
+  "feature_size": 1,
+  "padding_side": "right",
+  "padding_value": 0,
+  "return_attention_mask": false,
+  "sampling_rate": 16000
+}

checkpoint-149/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7ab240972588ded48883e00b3a1029ab3ff4045470da6447d45f5de8bcf4eb20
+size 14308

checkpoint-149/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1e9ad5796e032f21e10d21d1114e9452b0cd107cc5a4f541c7c91883714189d2
+size 1064

checkpoint-149/trainer_state.json ADDED Viewed

	@@ -0,0 +1,138 @@

+{
+  "best_metric": 0.889261744966443,
+  "best_model_checkpoint": "distilhubert-finetuned-mixed-data/checkpoint-130",
+  "epoch": 8.0,
+  "eval_steps": 500,
+  "global_step": 149,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.9664429530201343,
+      "eval_accuracy": 0.7818791946308725,
+      "eval_f1": 0.7264205130236912,
+      "eval_loss": 0.669560968875885,
+      "eval_precision": 0.689807639599501,
+      "eval_recall": 0.7818791946308725,
+      "eval_runtime": 0.9033,
+      "eval_samples_per_second": 329.896,
+      "eval_steps_per_second": 42.067,
+      "step": 18
+    },
+    {
+      "epoch": 1.9865771812080537,
+      "eval_accuracy": 0.7751677852348994,
+      "eval_f1": 0.7202681570933687,
+      "eval_loss": 0.5067932605743408,
+      "eval_precision": 0.684911313518696,
+      "eval_recall": 0.7751677852348994,
+      "eval_runtime": 0.907,
+      "eval_samples_per_second": 328.546,
+      "eval_steps_per_second": 41.895,
+      "step": 37
+    },
+    {
+      "epoch": 2.953020134228188,
+      "eval_accuracy": 0.8087248322147651,
+      "eval_f1": 0.7535236037076262,
+      "eval_loss": 0.43038079142570496,
+      "eval_precision": 0.7241626365959,
+      "eval_recall": 0.8087248322147651,
+      "eval_runtime": 0.8664,
+      "eval_samples_per_second": 343.963,
+      "eval_steps_per_second": 43.861,
+      "step": 55
+    },
+    {
+      "epoch": 3.9731543624161074,
+      "eval_accuracy": 0.8523489932885906,
+      "eval_f1": 0.8433916249277822,
+      "eval_loss": 0.4109182059764862,
+      "eval_precision": 0.8727817866814688,
+      "eval_recall": 0.8523489932885906,
+      "eval_runtime": 0.8712,
+      "eval_samples_per_second": 342.059,
+      "eval_steps_per_second": 43.618,
+      "step": 74
+    },
+    {
+      "epoch": 4.993288590604027,
+      "eval_accuracy": 0.87248322147651,
+      "eval_f1": 0.8717711524765707,
+      "eval_loss": 0.3263051509857178,
+      "eval_precision": 0.8718521382399975,
+      "eval_recall": 0.87248322147651,
+      "eval_runtime": 0.87,
+      "eval_samples_per_second": 342.548,
+      "eval_steps_per_second": 43.681,
+      "step": 93
+    },
+    {
+      "epoch": 5.959731543624161,
+      "eval_accuracy": 0.8825503355704698,
+      "eval_f1": 0.8824400125399595,
+      "eval_loss": 0.3035907447338104,
+      "eval_precision": 0.8824270850226767,
+      "eval_recall": 0.8825503355704698,
+      "eval_runtime": 0.8921,
+      "eval_samples_per_second": 334.055,
+      "eval_steps_per_second": 42.598,
+      "step": 111
+    },
+    {
+      "epoch": 6.97986577181208,
+      "eval_accuracy": 0.889261744966443,
+      "eval_f1": 0.8876321254746313,
+      "eval_loss": 0.3046204149723053,
+      "eval_precision": 0.8891935449502327,
+      "eval_recall": 0.889261744966443,
+      "eval_runtime": 0.894,
+      "eval_samples_per_second": 333.317,
+      "eval_steps_per_second": 42.504,
+      "step": 130
+    },
+    {
+      "epoch": 8.0,
+      "eval_accuracy": 0.8758389261744967,
+      "eval_f1": 0.8770158544888631,
+      "eval_loss": 0.32443463802337646,
+      "eval_precision": 0.8787167286554325,
+      "eval_recall": 0.8758389261744967,
+      "eval_runtime": 0.9094,
+      "eval_samples_per_second": 327.69,
+      "eval_steps_per_second": 41.786,
+      "step": 149
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 216,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 12,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "EarlyStoppingCallback": {
+      "args": {
+        "early_stopping_patience": 3,
+        "early_stopping_threshold": 0.0
+      },
+      "attributes": {
+        "early_stopping_patience_counter": 0
+      }
+    },
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 2.16506368512e+16,
+  "train_batch_size": 8,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-149/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:296be9afae72ab3934d873f0cf92f87ef76899c18b11651de670afb49aa1a5d6
+size 5240

checkpoint-167/config.json ADDED Viewed

	@@ -0,0 +1,84 @@

+{
+  "_name_or_path": "ntu-spml/distilhubert",
+  "activation_dropout": 0.1,
+  "apply_spec_augment": false,
+  "architectures": [
+    "HubertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "bos_token_id": 1,
+  "classifier_proj_size": 256,
+  "conv_bias": false,
+  "conv_dim": [
+    512,
+    512,
+    512,
+    512,
+    512,
+    512,
+    512
+  ],
+  "conv_kernel": [
+    10,
+    3,
+    3,
+    3,
+    3,
+    2,
+    2
+  ],
+  "conv_stride": [
+    5,
+    2,
+    2,
+    2,
+    2,
+    2,
+    2
+  ],
+  "ctc_loss_reduction": "sum",
+  "ctc_zero_infinity": false,
+  "do_stable_layer_norm": false,
+  "eos_token_id": 2,
+  "feat_extract_activation": "gelu",
+  "feat_extract_norm": "group",
+  "feat_proj_dropout": 0.0,
+  "feat_proj_layer_norm": false,
+  "final_dropout": 0.0,
+  "hidden_act": "gelu",
+  "hidden_dropout": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "1s_asphyxia",
+    "1": "1s_hunger",
+    "2": "1s_normal",
+    "3": "1s_pain"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "1s_asphyxia": "0",
+    "1s_hunger": "1",
+    "1s_normal": "2",
+    "1s_pain": "3"
+  },
+  "layer_norm_eps": 1e-05,
+  "layerdrop": 0.0,
+  "mask_feature_length": 10,
+  "mask_feature_min_masks": 0,
+  "mask_feature_prob": 0.0,
+  "mask_time_length": 10,
+  "mask_time_min_masks": 2,
+  "mask_time_prob": 0.05,
+  "model_type": "hubert",
+  "num_attention_heads": 12,
+  "num_conv_pos_embedding_groups": 16,
+  "num_conv_pos_embeddings": 128,
+  "num_feat_extract_layers": 7,
+  "num_hidden_layers": 2,
+  "pad_token_id": 0,
+  "torch_dtype": "float32",
+  "transformers_version": "4.44.2",
+  "use_weighted_layer_sum": false,
+  "vocab_size": 32
+}

checkpoint-167/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:99cb84823dab9c2514de746659bd19475207dd5160180a21c19e06c9ee8923f4
+size 94765560

checkpoint-167/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c9a4ee5fa0c7807441f156f570af2346069baaf0c030dadec1c4ab4098330d91
+size 189556666

checkpoint-167/preprocessor_config.json ADDED Viewed

	@@ -0,0 +1,9 @@

+{
+  "do_normalize": false,
+  "feature_extractor_type": "Wav2Vec2FeatureExtractor",
+  "feature_size": 1,
+  "padding_side": "right",
+  "padding_value": 0,
+  "return_attention_mask": false,
+  "sampling_rate": 16000
+}

checkpoint-167/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f65b53d3587b97669b32f24817b54a83a0d7880d65d1fed7315353b45d1d4bc5
+size 14308

checkpoint-167/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:eceb16cd0387067793218afd9bb8832dfde9b5f16ebc34cc0e5baf4d23ab80ef
+size 1064

checkpoint-167/trainer_state.json ADDED Viewed

	@@ -0,0 +1,150 @@

+{
+  "best_metric": 0.9026845637583892,
+  "best_model_checkpoint": "distilhubert-finetuned-mixed-data/checkpoint-167",
+  "epoch": 8.966442953020135,
+  "eval_steps": 500,
+  "global_step": 167,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.9664429530201343,
+      "eval_accuracy": 0.7818791946308725,
+      "eval_f1": 0.7264205130236912,
+      "eval_loss": 0.669560968875885,
+      "eval_precision": 0.689807639599501,
+      "eval_recall": 0.7818791946308725,
+      "eval_runtime": 0.9033,
+      "eval_samples_per_second": 329.896,
+      "eval_steps_per_second": 42.067,
+      "step": 18
+    },
+    {
+      "epoch": 1.9865771812080537,
+      "eval_accuracy": 0.7751677852348994,
+      "eval_f1": 0.7202681570933687,
+      "eval_loss": 0.5067932605743408,
+      "eval_precision": 0.684911313518696,
+      "eval_recall": 0.7751677852348994,
+      "eval_runtime": 0.907,
+      "eval_samples_per_second": 328.546,
+      "eval_steps_per_second": 41.895,
+      "step": 37
+    },
+    {
+      "epoch": 2.953020134228188,
+      "eval_accuracy": 0.8087248322147651,
+      "eval_f1": 0.7535236037076262,
+      "eval_loss": 0.43038079142570496,
+      "eval_precision": 0.7241626365959,
+      "eval_recall": 0.8087248322147651,
+      "eval_runtime": 0.8664,
+      "eval_samples_per_second": 343.963,
+      "eval_steps_per_second": 43.861,
+      "step": 55
+    },
+    {
+      "epoch": 3.9731543624161074,
+      "eval_accuracy": 0.8523489932885906,
+      "eval_f1": 0.8433916249277822,
+      "eval_loss": 0.4109182059764862,
+      "eval_precision": 0.8727817866814688,
+      "eval_recall": 0.8523489932885906,
+      "eval_runtime": 0.8712,
+      "eval_samples_per_second": 342.059,
+      "eval_steps_per_second": 43.618,
+      "step": 74
+    },
+    {
+      "epoch": 4.993288590604027,
+      "eval_accuracy": 0.87248322147651,
+      "eval_f1": 0.8717711524765707,
+      "eval_loss": 0.3263051509857178,
+      "eval_precision": 0.8718521382399975,
+      "eval_recall": 0.87248322147651,
+      "eval_runtime": 0.87,
+      "eval_samples_per_second": 342.548,
+      "eval_steps_per_second": 43.681,
+      "step": 93
+    },
+    {
+      "epoch": 5.959731543624161,
+      "eval_accuracy": 0.8825503355704698,
+      "eval_f1": 0.8824400125399595,
+      "eval_loss": 0.3035907447338104,
+      "eval_precision": 0.8824270850226767,
+      "eval_recall": 0.8825503355704698,
+      "eval_runtime": 0.8921,
+      "eval_samples_per_second": 334.055,
+      "eval_steps_per_second": 42.598,
+      "step": 111
+    },
+    {
+      "epoch": 6.97986577181208,
+      "eval_accuracy": 0.889261744966443,
+      "eval_f1": 0.8876321254746313,
+      "eval_loss": 0.3046204149723053,
+      "eval_precision": 0.8891935449502327,
+      "eval_recall": 0.889261744966443,
+      "eval_runtime": 0.894,
+      "eval_samples_per_second": 333.317,
+      "eval_steps_per_second": 42.504,
+      "step": 130
+    },
+    {
+      "epoch": 8.0,
+      "eval_accuracy": 0.8758389261744967,
+      "eval_f1": 0.8770158544888631,
+      "eval_loss": 0.32443463802337646,
+      "eval_precision": 0.8787167286554325,
+      "eval_recall": 0.8758389261744967,
+      "eval_runtime": 0.9094,
+      "eval_samples_per_second": 327.69,
+      "eval_steps_per_second": 41.786,
+      "step": 149
+    },
+    {
+      "epoch": 8.966442953020135,
+      "eval_accuracy": 0.9026845637583892,
+      "eval_f1": 0.9018342908983529,
+      "eval_loss": 0.2961938679218292,
+      "eval_precision": 0.9012011861368664,
+      "eval_recall": 0.9026845637583892,
+      "eval_runtime": 0.8952,
+      "eval_samples_per_second": 332.88,
+      "eval_steps_per_second": 42.448,
+      "step": 167
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 216,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 12,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "EarlyStoppingCallback": {
+      "args": {
+        "early_stopping_patience": 3,
+        "early_stopping_threshold": 0.0
+      },
+      "attributes": {
+        "early_stopping_patience_counter": 0
+      }
+    },
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 2.43569664576e+16,
+  "train_batch_size": 8,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-167/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:296be9afae72ab3934d873f0cf92f87ef76899c18b11651de670afb49aa1a5d6
+size 5240

checkpoint-18/config.json ADDED Viewed

	@@ -0,0 +1,84 @@

+{
+  "_name_or_path": "ntu-spml/distilhubert",
+  "activation_dropout": 0.1,
+  "apply_spec_augment": false,
+  "architectures": [
+    "HubertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "bos_token_id": 1,
+  "classifier_proj_size": 256,
+  "conv_bias": false,
+  "conv_dim": [
+    512,
+    512,
+    512,
+    512,
+    512,
+    512,
+    512
+  ],
+  "conv_kernel": [
+    10,
+    3,
+    3,
+    3,
+    3,
+    2,
+    2
+  ],
+  "conv_stride": [
+    5,
+    2,
+    2,
+    2,
+    2,
+    2,
+    2
+  ],
+  "ctc_loss_reduction": "sum",
+  "ctc_zero_infinity": false,
+  "do_stable_layer_norm": false,
+  "eos_token_id": 2,
+  "feat_extract_activation": "gelu",
+  "feat_extract_norm": "group",
+  "feat_proj_dropout": 0.0,
+  "feat_proj_layer_norm": false,
+  "final_dropout": 0.0,
+  "hidden_act": "gelu",
+  "hidden_dropout": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "1s_asphyxia",
+    "1": "1s_hunger",
+    "2": "1s_normal",
+    "3": "1s_pain"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "1s_asphyxia": "0",
+    "1s_hunger": "1",
+    "1s_normal": "2",
+    "1s_pain": "3"
+  },
+  "layer_norm_eps": 1e-05,
+  "layerdrop": 0.0,
+  "mask_feature_length": 10,
+  "mask_feature_min_masks": 0,
+  "mask_feature_prob": 0.0,
+  "mask_time_length": 10,
+  "mask_time_min_masks": 2,
+  "mask_time_prob": 0.05,
+  "model_type": "hubert",
+  "num_attention_heads": 12,
+  "num_conv_pos_embedding_groups": 16,
+  "num_conv_pos_embeddings": 128,
+  "num_feat_extract_layers": 7,
+  "num_hidden_layers": 2,
+  "pad_token_id": 0,
+  "torch_dtype": "float32",
+  "transformers_version": "4.44.2",
+  "use_weighted_layer_sum": false,
+  "vocab_size": 32
+}