HamzaSidhu786 committed on
Commit
b787dd6
1 Parent(s): 4f1c682

Training in progress, epoch 1

Browse files
config.json CHANGED
@@ -1,13 +1,19 @@
1
  {
2
- "_name_or_path": "ntu-spml/distilhubert",
3
- "activation_dropout": 0.1,
4
- "apply_spec_augment": false,
 
 
 
 
5
  "architectures": [
6
- "HubertForSequenceClassification"
7
  ],
8
  "attention_dropout": 0.1,
9
  "bos_token_id": 1,
10
  "classifier_proj_size": 256,
 
 
11
  "conv_bias": false,
12
  "conv_dim": [
13
  512,
@@ -38,95 +44,135 @@
38
  ],
39
  "ctc_loss_reduction": "sum",
40
  "ctc_zero_infinity": false,
 
41
  "do_stable_layer_norm": false,
42
  "eos_token_id": 2,
43
  "feat_extract_activation": "gelu",
44
  "feat_extract_norm": "group",
45
- "feat_proj_dropout": 0.0,
46
- "feat_proj_layer_norm": false,
47
  "final_dropout": 0.0,
 
48
  "hidden_act": "gelu",
49
  "hidden_dropout": 0.1,
50
  "hidden_size": 768,
51
  "id2label": {
52
- "0": "\u062e\u0627\u0621",
53
- "1": "\u062b\u0627\u0621",
54
- "10": "\u0643\u0627\u0641",
55
- "11": "\u0627\u0644\u0641",
56
- "12": "\u0642\u0627\u0641",
57
- "13": "\u0641\u0627\u0621",
58
- "14": "\u0647\u0627\u0621",
59
- "15": "\u062f\u0627\u0644",
60
- "16": "\u0628\u0627\u0621",
61
- "17": "\u0637\u0627\u0621",
62
  "18": "\u063a\u064a\u0646",
63
- "19": "\u0633\u064a\u0646",
64
- "2": "\u0646\u0648\u0646",
65
- "20": "\u062a\u0627\u0621",
66
- "21": "\u0638\u0627\u0621",
67
- "22": "\u064a\u0627\u0621",
68
- "23": "\u0630\u0627\u0644",
69
- "24": "\u0644\u0627\u0645",
70
- "25": "\u062c\u064a\u0645",
71
- "26": "\u0639\u064a\u0646",
72
- "27": "\u0648\u0627\u0648",
73
- "3": "\u0645\u064a\u0645",
74
- "4": "\u0636\u0627\u062f",
75
- "5": "\u0631\u0627\u0621",
76
- "6": "\u0634\u064a\u0646",
77
- "7": "\u0632\u0627\u064a",
78
- "8": "\u0635\u0627\u062f",
79
- "9": "\u062d\u0627\u0621"
80
  },
81
  "initializer_range": 0.02,
82
  "intermediate_size": 3072,
83
  "label2id": {
84
- "\u0627\u0644\u0641": "11",
85
- "\u0628\u0627\u0621": "16",
86
- "\u062a\u0627\u0621": "20",
87
- "\u062b\u0627\u0621": "1",
88
- "\u062c\u064a\u0645": "25",
89
- "\u062d\u0627\u0621": "9",
90
- "\u062e\u0627\u0621": "0",
91
- "\u062f\u0627\u0644": "15",
92
- "\u0630\u0627\u0644": "23",
93
- "\u0631\u0627\u0621": "5",
94
- "\u0632\u0627\u064a": "7",
95
- "\u0633\u064a\u0646": "19",
96
- "\u0634\u064a\u0646": "6",
97
- "\u0635\u0627\u062f": "8",
98
- "\u0636\u0627\u062f": "4",
99
- "\u0637\u0627\u0621": "17",
100
- "\u0638\u0627\u0621": "21",
101
- "\u0639\u064a\u0646": "26",
102
  "\u063a\u064a\u0646": "18",
103
- "\u0641\u0627\u0621": "13",
104
- "\u0642\u0627\u0641": "12",
105
- "\u0643\u0627\u0641": "10",
106
- "\u0644\u0627\u0645": "24",
107
- "\u0645\u064a\u0645": "3",
108
- "\u0646\u0648\u0646": "2",
109
- "\u0647\u0627\u0621": "14",
110
- "\u0648\u0627\u0648": "27",
111
- "\u064a\u0627\u0621": "22"
112
  },
113
  "layer_norm_eps": 1e-05,
114
  "layerdrop": 0.0,
 
 
 
 
 
115
  "mask_feature_length": 10,
116
  "mask_feature_min_masks": 0,
117
  "mask_feature_prob": 0.0,
118
  "mask_time_length": 10,
119
  "mask_time_min_masks": 2,
 
 
120
  "mask_time_prob": 0.05,
121
- "model_type": "hubert",
 
 
 
 
122
  "num_attention_heads": 12,
 
 
123
  "num_conv_pos_embedding_groups": 16,
124
  "num_conv_pos_embeddings": 128,
125
  "num_feat_extract_layers": 7,
126
- "num_hidden_layers": 2,
 
 
127
  "pad_token_id": 0,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
128
  "torch_dtype": "float32",
129
  "transformers_version": "4.42.3",
130
  "use_weighted_layer_sum": false,
131
- "vocab_size": 32
 
132
  }
 
1
  {
2
+ "_name_or_path": "facebook/wav2vec2-base",
3
+ "activation_dropout": 0.0,
4
+ "adapter_attn_dim": null,
5
+ "adapter_kernel_size": 3,
6
+ "adapter_stride": 2,
7
+ "add_adapter": false,
8
+ "apply_spec_augment": true,
9
  "architectures": [
10
+ "Wav2Vec2ForSequenceClassification"
11
  ],
12
  "attention_dropout": 0.1,
13
  "bos_token_id": 1,
14
  "classifier_proj_size": 256,
15
+ "codevector_dim": 256,
16
+ "contrastive_logits_temperature": 0.1,
17
  "conv_bias": false,
18
  "conv_dim": [
19
  512,
 
44
  ],
45
  "ctc_loss_reduction": "sum",
46
  "ctc_zero_infinity": false,
47
+ "diversity_loss_weight": 0.1,
48
  "do_stable_layer_norm": false,
49
  "eos_token_id": 2,
50
  "feat_extract_activation": "gelu",
51
  "feat_extract_norm": "group",
52
+ "feat_proj_dropout": 0.1,
53
+ "feat_quantizer_dropout": 0.0,
54
  "final_dropout": 0.0,
55
+ "freeze_feat_extract_train": true,
56
  "hidden_act": "gelu",
57
  "hidden_dropout": 0.1,
58
  "hidden_size": 768,
59
  "id2label": {
60
+ "0": "\u0627\u0644\u0641",
61
+ "1": "\u0628\u0627\u0621",
62
+ "10": "\u0632\u0627\u064a",
63
+ "11": "\u0633\u064a\u0646",
64
+ "12": "\u0634\u064a\u0646",
65
+ "13": "\u0635\u0627\u062f",
66
+ "14": "\u0636\u0627\u062f",
67
+ "15": "\u0637\u0627\u0621",
68
+ "16": "\u0638\u0627\u0621",
69
+ "17": "\u0639\u064a\u0646",
70
  "18": "\u063a\u064a\u0646",
71
+ "19": "\u0641\u0627\u0621",
72
+ "2": "\u062a\u0627\u0621",
73
+ "20": "\u0642\u0627\u0641",
74
+ "21": "\u0643\u0627\u0641",
75
+ "22": "\u0644\u0627\u0645",
76
+ "23": "\u0645\u064a\u0645",
77
+ "24": "\u0646\u0648\u0646",
78
+ "25": "\u0647\u0627\u0621",
79
+ "26": "\u0648\u0627\u0648",
80
+ "27": "\u064a\u0627\u0621",
81
+ "3": "\u062b\u0627\u0621",
82
+ "4": "\u062c\u064a\u0645",
83
+ "5": "\u062d\u0627\u0621",
84
+ "6": "\u062e\u0627\u0621",
85
+ "7": "\u062f\u0627\u0644",
86
+ "8": "\u0630\u0627\u0644",
87
+ "9": "\u0631\u0627\u0621"
88
  },
89
  "initializer_range": 0.02,
90
  "intermediate_size": 3072,
91
  "label2id": {
92
+ "\u0627\u0644\u0641": "0",
93
+ "\u0628\u0627\u0621": "1",
94
+ "\u062a\u0627\u0621": "2",
95
+ "\u062b\u0627\u0621": "3",
96
+ "\u062c\u064a\u0645": "4",
97
+ "\u062d\u0627\u0621": "5",
98
+ "\u062e\u0627\u0621": "6",
99
+ "\u062f\u0627\u0644": "7",
100
+ "\u0630\u0627\u0644": "8",
101
+ "\u0631\u0627\u0621": "9",
102
+ "\u0632\u0627\u064a": "10",
103
+ "\u0633\u064a\u0646": "11",
104
+ "\u0634\u064a\u0646": "12",
105
+ "\u0635\u0627\u062f": "13",
106
+ "\u0636\u0627\u062f": "14",
107
+ "\u0637\u0627\u0621": "15",
108
+ "\u0638\u0627\u0621": "16",
109
+ "\u0639\u064a\u0646": "17",
110
  "\u063a\u064a\u0646": "18",
111
+ "\u0641\u0627\u0621": "19",
112
+ "\u0642\u0627\u0641": "20",
113
+ "\u0643\u0627\u0641": "21",
114
+ "\u0644\u0627\u0645": "22",
115
+ "\u0645\u064a\u0645": "23",
116
+ "\u0646\u0648\u0646": "24",
117
+ "\u0647\u0627\u0621": "25",
118
+ "\u0648\u0627\u0648": "26",
119
+ "\u064a\u0627\u0621": "27"
120
  },
121
  "layer_norm_eps": 1e-05,
122
  "layerdrop": 0.0,
123
+ "mask_channel_length": 10,
124
+ "mask_channel_min_space": 1,
125
+ "mask_channel_other": 0.0,
126
+ "mask_channel_prob": 0.0,
127
+ "mask_channel_selection": "static",
128
  "mask_feature_length": 10,
129
  "mask_feature_min_masks": 0,
130
  "mask_feature_prob": 0.0,
131
  "mask_time_length": 10,
132
  "mask_time_min_masks": 2,
133
+ "mask_time_min_space": 1,
134
+ "mask_time_other": 0.0,
135
  "mask_time_prob": 0.05,
136
+ "mask_time_selection": "static",
137
+ "model_type": "wav2vec2",
138
+ "no_mask_channel_overlap": false,
139
+ "no_mask_time_overlap": false,
140
+ "num_adapter_layers": 3,
141
  "num_attention_heads": 12,
142
+ "num_codevector_groups": 2,
143
+ "num_codevectors_per_group": 320,
144
  "num_conv_pos_embedding_groups": 16,
145
  "num_conv_pos_embeddings": 128,
146
  "num_feat_extract_layers": 7,
147
+ "num_hidden_layers": 12,
148
+ "num_negatives": 100,
149
+ "output_hidden_size": 768,
150
  "pad_token_id": 0,
151
+ "proj_codevector_dim": 256,
152
+ "tdnn_dilation": [
153
+ 1,
154
+ 2,
155
+ 3,
156
+ 1,
157
+ 1
158
+ ],
159
+ "tdnn_dim": [
160
+ 512,
161
+ 512,
162
+ 512,
163
+ 512,
164
+ 1500
165
+ ],
166
+ "tdnn_kernel": [
167
+ 5,
168
+ 3,
169
+ 3,
170
+ 1,
171
+ 1
172
+ ],
173
  "torch_dtype": "float32",
174
  "transformers_version": "4.42.3",
175
  "use_weighted_layer_sum": false,
176
+ "vocab_size": 32,
177
+ "xvector_output_dim": 512
178
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:149889981493cc6b6c86e1c1e0aca5000b11f3721278b924351f93c6ef8b5529
3
- size 94790240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:003114ba63e705676627cc1d192700bc80f14aeb5ffe8bd17ad7b28d4b1ae360
3
+ size 378329104
preprocessor_config.json CHANGED
@@ -3,7 +3,7 @@
3
  "feature_extractor_type": "Wav2Vec2FeatureExtractor",
4
  "feature_size": 1,
5
  "padding_side": "right",
6
- "padding_value": 0,
7
- "return_attention_mask": true,
8
  "sampling_rate": 16000
9
  }
 
3
  "feature_extractor_type": "Wav2Vec2FeatureExtractor",
4
  "feature_size": 1,
5
  "padding_side": "right",
6
+ "padding_value": 0.0,
7
+ "return_attention_mask": false,
8
  "sampling_rate": 16000
9
  }
runs/Aug03_20-00-25_e97ec11884da/events.out.tfevents.1722715290.e97ec11884da.34.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:72367e039faeaadc78cc465f029e60775f563ef3e23f1c6b0ce1d5d4461b03c2
3
+ size 16767
runs/Aug03_20-13-58_e97ec11884da/events.out.tfevents.1722716095.e97ec11884da.34.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:59455cad4592ee4948830932a3ed726372b34239a1f9ba5beefcec496136c8eb
3
+ size 32071
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dd8ff9d63785cfa9c21d5d3c102863736b3f94b93b5bddd53ff40dc74e745c2e
3
  size 5176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0df6344fdd92af6ed3162b79944db931ab54a5b1cad53703c97e1ce48a3e5a2b
3
  size 5176