Upload StyleTTS2 checkpoint epoch_2nd_00029.pth with all inference components

Browse files

Files changed (15) hide show

README.md +5 -5
bert.pth +1 -1
bert_encoder.pth +1 -1
checkpoint.pth +2 -2
config.json +128 -8
decoder.pth +1 -1
diffusion.pth +1 -1
mpd.pth +1 -1
msd.pth +1 -1
predictor.pth +1 -1
predictor_encoder.pth +1 -1
style_encoder.pth +1 -1
text_aligner.pth +1 -1
text_encoder.pth +1 -1
training_metrics.png +0 -0

README.md CHANGED Viewed

@@ -16,16 +16,16 @@ This model is a fine-tuned version of StyleTTS2, containing all necessary compon
 - **Base Model:** StyleTTS2-LibriTTS
 - **Architecture:** StyleTTS2
 - **Task:** Text-to-Speech
-- **Last Checkpoint:** epoch_2nd_00009.pth
 ## Training Details
 - **Total Epochs:** 30
-- **Completed Epochs:** 9
-- **Total Iterations:** 774
 - **Batch Size:** 2
-- **Max Length:** 120
 - **Learning Rate:** 0.0001
-- **Final Validation Loss:** 0.422153
 ## Model Components
 The repository includes all necessary components for inference:

 - **Base Model:** StyleTTS2-LibriTTS
 - **Architecture:** StyleTTS2
 - **Task:** Text-to-Speech
+- **Last Checkpoint:** epoch_2nd_00029.pth
 ## Training Details
 - **Total Epochs:** 30
+- **Completed Epochs:** 29
+- **Total Iterations:** 2341
 - **Batch Size:** 2
+- **Max Length:** 110
 - **Learning Rate:** 0.0001
+- **Final Validation Loss:** 0.405025
 ## Model Components
 The repository includes all necessary components for inference:

bert.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1413a5cdfa34300aed0fe9a718e19631cb65b632d9a672ac27ecffd0eb81675f
 size 25178740

 version https://git-lfs.github.com/spec/v1
+oid sha256:6158ffbde4828b5bd729e0d5d1f8759432bfdbf5f3923c7ac77ed88f1dad37ad
 size 25178740

bert_encoder.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:fffeaf7ea2ece022f6cc3abe7a40e902a60482e842ba4eaa5eb3a450fc0f6178
 size 1576502

 version https://git-lfs.github.com/spec/v1
+oid sha256:cb4c35a681712953ef701d4bedaa227908a5e5e57b20daa604649e6a293c7b1c
 size 1576502

checkpoint.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a6b1e42a03ddeab22116f039e0b819312600e496dd6882e74909f063083431c7
-size 2040092478

 version https://git-lfs.github.com/spec/v1
+oid sha256:50a108ca11a998e804ad4898c6d9e220101e6ff6ac0ef7f7eeeb10433ac1e50e
+size 2242747934

config.json CHANGED Viewed

@@ -74,7 +74,7 @@
   "training_config": {
     "epochs": 30,
     "batch_size": 2,
-    "max_len": 120,
     "optimizer": {
       "bert_lr": 1e-05,
       "ft_lr": 0.0001,
@@ -112,9 +112,9 @@
     "val_data": "Data/val_list.txt"
   },
   "model_state": {
-    "epoch": 9,
-    "iterations": 774,
-    "val_loss": 0.4221532940864563
   },
   "training_metrics": {
     "train_loss": [],
@@ -130,7 +130,37 @@
       39.0,
       34.0,
       53.0,
-      2.0
     ],
     "dur_loss": [
       0.434,
@@ -144,7 +174,37 @@
       0.437,
       0.422,
       0.432,
-      0.425
     ],
     "F0_loss": [
       1.093,
@@ -158,7 +218,37 @@
       1.048,
       0.998,
       1.156,
-      1.026
     ],
     "epochs": [
       1,
@@ -172,7 +262,37 @@
       9,
       10,
       11,
-      12
     ]
   }
 }

   "training_config": {
     "epochs": 30,
     "batch_size": 2,
+    "max_len": 110,
     "optimizer": {
       "bert_lr": 1e-05,
       "ft_lr": 0.0001,
     "val_data": "Data/val_list.txt"
   },
   "model_state": {
+    "epoch": 29,
+    "iterations": 2341,
+    "val_loss": 0.40502485632896423
   },
   "training_metrics": {
     "train_loss": [],
       39.0,
       34.0,
       53.0,
+      2.0,
+      5.0,
+      50.0,
+      38.0,
+      26.0,
+      13.0,
+      13.0,
+      2.0,
+      49.0,
+      37.0,
+      23.0,
+      41.0,
+      40.0,
+      42.0,
+      41.0,
+      39.0,
+      58.0,
+      55.0,
+      54.0,
+      51.0,
+      50.0,
+      3.0,
+      1.0,
+      0.0,
+      5.0,
+      3.0,
+      41.0,
+      39.0,
+      35.0,
+      32.0,
+      30.0
     ],
     "dur_loss": [
       0.434,
       0.437,
       0.422,
       0.432,
+      0.425,
+      0.456,
+      0.462,
+      0.45,
+      0.427,
+      0.456,
+      0.428,
+      0.438,
+      0.422,
+      0.428,
+      0.432,
+      0.44,
+      0.423,
+      0.431,
+      0.449,
+      0.414,
+      0.427,
+      0.447,
+      0.45,
+      0.435,
+      0.428,
+      0.426,
+      0.417,
+      0.425,
+      0.434,
+      0.412,
+      0.415,
+      0.422,
+      0.398,
+      0.416,
+      0.405
     ],
     "F0_loss": [
       1.093,
       1.048,
       0.998,
       1.156,
+      1.026,
+      1.196,
+      1.173,
+      1.148,
+      1.264,
+      1.266,
+      1.115,
+      1.089,
+      1.103,
+      1.178,
+      1.108,
+      1.106,
+      1.151,
+      1.217,
+      1.187,
+      1.04,
+      1.111,
+      1.17,
+      1.195,
+      1.087,
+      1.144,
+      1.121,
+      1.18,
+      1.206,
+      1.125,
+      1.101,
+      1.072,
+      1.099,
+      1.223,
+      1.188,
+      1.097
     ],
     "epochs": [
       1,
       9,
       10,
       11,
+      12,
+      13,
+      14,
+      15,
+      16,
+      17,
+      18,
+      19,
+      20,
+      21,
+      22,
+      23,
+      24,
+      25,
+      26,
+      27,
+      28,
+      29,
+      30,
+      31,
+      32,
+      33,
+      34,
+      35,
+      36,
+      37,
+      38,
+      39,
+      40,
+      41,
+      42
     ]
   }
 }

decoder.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9d6eb7d149bfb8cf2a0d927f30df312371b72b00e7959c3e6f3d7371d574a0f2
 size 217409318

 version https://git-lfs.github.com/spec/v1
+oid sha256:815400ba8f1bd08fd28db9ef9330ef2be5d5cac52224fd6d0914864831ae1102
 size 217409318

diffusion.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:69229a607b119bf2c180406e680c1e06acefc44ec4d51fe294040f5215cb8a68
 size 101337326

 version https://git-lfs.github.com/spec/v1
+oid sha256:bae1a9abccdb586c140a4c65231a7cc97766e8fbd9bb20e7b261ff7e2439baf0
 size 101337326

mpd.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7c84bd61e997bdd1adec21249172906274abfe395992735d202419000dd544c9
 size 164447824

 version https://git-lfs.github.com/spec/v1
+oid sha256:8ff78d274d70254f641c679ec166a7b664ef91710a7fce8f69538b493a6d69da
 size 164447824

msd.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b9f48c1161e725906d25583784a23a49091934b0e73edd2b1a024bb077bcabfe
 size 1139020

 version https://git-lfs.github.com/spec/v1
+oid sha256:2ddda48ce7bd021ebe7256cfe613cf17f69aba81c355cf6a37f36c6680956737
 size 1139020

predictor.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:eafafa34fa9d2b4a9268382dadc4a844c3f7dd900faf86a36fab3170c0e6f7bf
 size 64813639

 version https://git-lfs.github.com/spec/v1
+oid sha256:c01733aea2d2835e5ecfc8afe7ec1691bc8aaa0e651bc78d5dfdbe2cc028d556
 size 64813639

predictor_encoder.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3c92fae2c2b4fe19e8eb5c07176f9225a839e625e801acdcf0c16e22b75fe492
 size 55547155

 version https://git-lfs.github.com/spec/v1
+oid sha256:ccbce2062e8de35c1e925ffa808b7f18790cb4a35370d324b3782829768fa478
 size 55547155

style_encoder.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4ef0b741adf3b2b9b4e40cd4eaad7bfbd1ececb5681d72ded1f2ae0a09af6f1a
 size 55546871

 version https://git-lfs.github.com/spec/v1
+oid sha256:9bff0b6024b314cf39d629322e025f324872b77621e7eff3e4083359156ad64e
 size 55546871

text_aligner.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b8889fdb9194441fa54090c37b8d3e050a2d8904220c9db53bbef8f319c8cf25
 size 31531315

 version https://git-lfs.github.com/spec/v1
+oid sha256:4efc44b688aa089711691b7fae48767d3b8f461e519d749a5ed938d95b24a89c
 size 31531315

text_encoder.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:66fcdb1d2c4fac5943dca1326132d637bec7eb42f93ee1bfd5c8ee580a161aee
 size 22432460

 version https://git-lfs.github.com/spec/v1
+oid sha256:ce4cf0da486560c3370a74f2a06a9d025c61d2361d6a54bedea7b6b302455784
 size 22432460

training_metrics.png CHANGED Viewed