Upload StyleTTS2 checkpoint epoch_2nd_00009.pth with all inference components

Files changed (15) hide show

README.md CHANGED Viewed

@@ -16,16 +16,16 @@ This model is a fine-tuned version of StyleTTS2, containing all necessary compon
 - **Base Model:** StyleTTS2-LibriTTS
 - **Architecture:** StyleTTS2
 - **Task:** Text-to-Speech
-- **Last Checkpoint:** epoch_2nd_00014.pth
 ## Training Details
-- **Total Epochs:** 15
-- **Completed Epochs:** 14
-- **Total Iterations:** 1164
 - **Batch Size:** 2
 - **Max Length:** 120
 - **Learning Rate:** 0.0001
-- **Final Validation Loss:** 0.413268
 ## Model Components
 The repository includes all necessary components for inference:

 - **Base Model:** StyleTTS2-LibriTTS
 - **Architecture:** StyleTTS2
 - **Task:** Text-to-Speech
+- **Last Checkpoint:** epoch_2nd_00009.pth
 ## Training Details
+- **Total Epochs:** 30
+- **Completed Epochs:** 9
+- **Total Iterations:** 774
 - **Batch Size:** 2
 - **Max Length:** 120
 - **Learning Rate:** 0.0001
+- **Final Validation Loss:** 0.422153
 ## Model Components
 The repository includes all necessary components for inference:

bert.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f51aba710a80251e4b252b7b78396278dd072571850639d9a1e9715f16d52f5c
 size 25178740

 version https://git-lfs.github.com/spec/v1
+oid sha256:1413a5cdfa34300aed0fe9a718e19631cb65b632d9a672ac27ecffd0eb81675f
 size 25178740

bert_encoder.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a65fc879992544e8f23c6202f202b7faf97cf2dc10a04d28498394b2070c23a6
 size 1576502

 version https://git-lfs.github.com/spec/v1
+oid sha256:fffeaf7ea2ece022f6cc3abe7a40e902a60482e842ba4eaa5eb3a450fc0f6178
 size 1576502

checkpoint.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:29bb646b43d5c6a6837ef280ccfc81c9c9bcdc27edf2e48266e1356fa8793fb9
-size 2242747934

 version https://git-lfs.github.com/spec/v1
+oid sha256:a6b1e42a03ddeab22116f039e0b819312600e496dd6882e74909f063083431c7
+size 2040092478

config.json CHANGED Viewed

@@ -72,7 +72,7 @@
     "style_dim": 128
   },
   "training_config": {
-    "epochs": 15,
     "batch_size": 2,
     "max_len": 120,
     "optimizer": {
@@ -112,62 +112,53 @@
     "val_data": "Data/val_list.txt"
   },
   "model_state": {
-    "epoch": 14,
-    "iterations": 1164,
-    "val_loss": 0.41326767206192017
   },
   "training_metrics": {
     "train_loss": [],
     "val_loss": [
-      7.0,
-      1.0,
       56.0,
-      50.0,
-      47.0,
-      54.0,
       48.0,
-      47.0,
-      42.0,
-      41.0,
-      5.0,
-      8.0,
-      12.0,
-      19.0,
-      27.0
     ],
     "dur_loss": [
-      0.46,
-      0.443,
-      0.456,
       0.431,
-      0.433,
-      0.472,
-      0.45,
-      0.443,
-      0.429,
-      0.423,
-      0.445,
-      0.453,
-      0.428,
-      0.406,
-      0.413
     ],
     "F0_loss": [
-      1.32,
       1.218,
-      1.247,
-      1.179,
-      1.17,
-      1.045,
-      1.124,
-      1.138,
-      1.081,
-      1.116,
-      1.159,
-      1.134,
-      1.042,
-      1.115,
-      1.204
     ],
     "epochs": [
       1,
@@ -181,10 +172,7 @@
       9,
       10,
       11,
-      12,
-      13,
-      14,
-      15
     ]
   }
 }

     "style_dim": 128
   },
   "training_config": {
+    "epochs": 30,
     "batch_size": 2,
     "max_len": 120,
     "optimizer": {
     "val_data": "Data/val_list.txt"
   },
   "model_state": {
+    "epoch": 9,
+    "iterations": 774,
+    "val_loss": 0.4221532940864563
   },
   "training_metrics": {
     "train_loss": [],
     "val_loss": [
+      26.0,
+      21.0,
+      12.0,
+      5.0,
+      57.0,
+      4.0,
       56.0,
       48.0,
+      39.0,
+      34.0,
+      53.0,
+      2.0
     ],
     "dur_loss": [
+      0.434,
+      0.481,
+      0.437,
       0.431,
+      0.42,
+      0.43,
+      0.463,
+      0.436,
+      0.437,
+      0.422,
+      0.432,
+      0.425
     ],
     "F0_loss": [
+      1.093,
+      1.175,
+      1.097,
+      1.123,
+      1.108,
+      1.183,
       1.218,
+      1.246,
+      1.048,
+      0.998,
+      1.156,
+      1.026
     ],
     "epochs": [
       1,
       9,
       10,
       11,
+      12
     ]
   }
 }

decoder.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6e3bf502db9782b9c7417becf6e91fba743f04b554d62675240f8aa5a213ab0d
 size 217409318

 version https://git-lfs.github.com/spec/v1
+oid sha256:9d6eb7d149bfb8cf2a0d927f30df312371b72b00e7959c3e6f3d7371d574a0f2
 size 217409318

diffusion.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:cac9fa21ef2552bec66319719e8936e5bce7abdc8bbaadbd197c0aa72d7f5519
 size 101337326

 version https://git-lfs.github.com/spec/v1
+oid sha256:69229a607b119bf2c180406e680c1e06acefc44ec4d51fe294040f5215cb8a68
 size 101337326

mpd.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:dd845baaecf264fba32025d15740f2d70d8fd54c6da12424707e40c94b29519f
 size 164447824

 version https://git-lfs.github.com/spec/v1
+oid sha256:7c84bd61e997bdd1adec21249172906274abfe395992735d202419000dd544c9
 size 164447824

msd.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3b3a80730e8f644d0fe65c6d2dc647940257a876d9e49fc3938f2bf29ae0b17b
 size 1139020

 version https://git-lfs.github.com/spec/v1
+oid sha256:b9f48c1161e725906d25583784a23a49091934b0e73edd2b1a024bb077bcabfe
 size 1139020

predictor.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f60676a63a89488920921d77b523b0603992cb56f3bfcee3670a2ce6e5722200
 size 64813639

 version https://git-lfs.github.com/spec/v1
+oid sha256:eafafa34fa9d2b4a9268382dadc4a844c3f7dd900faf86a36fab3170c0e6f7bf
 size 64813639

predictor_encoder.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:393412704e6233e434ed3438130b4b1b4f8f826b708105d680dbd212c2b43ebc
 size 55547155

 version https://git-lfs.github.com/spec/v1
+oid sha256:3c92fae2c2b4fe19e8eb5c07176f9225a839e625e801acdcf0c16e22b75fe492
 size 55547155

style_encoder.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a06b3a76e5750aa287f15bac9fbaf55d2523f846204c8b8b727ea31e41be8771
 size 55546871

 version https://git-lfs.github.com/spec/v1
+oid sha256:4ef0b741adf3b2b9b4e40cd4eaad7bfbd1ececb5681d72ded1f2ae0a09af6f1a
 size 55546871

text_aligner.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7cbeb7e22a8744a7802858755f9c0f6e16d473ed97688e75d7f98e7947f444cb
 size 31531315

 version https://git-lfs.github.com/spec/v1
+oid sha256:b8889fdb9194441fa54090c37b8d3e050a2d8904220c9db53bbef8f319c8cf25
 size 31531315

text_encoder.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e7aef4141ba1fdfe9ee8c1acfd4535926ade21c288a23f48018c6a1f94d1d744
 size 22432460

 version https://git-lfs.github.com/spec/v1
+oid sha256:66fcdb1d2c4fac5943dca1326132d637bec7eb42f93ee1bfd5c8ee580a161aee
 size 22432460

training_metrics.png CHANGED Viewed