Upload StyleTTS2 checkpoint epoch_2nd_00003.pth with all inference components

Files changed (15) hide show

README.md CHANGED Viewed

@@ -16,16 +16,16 @@ This model is a fine-tuned version of StyleTTS2, containing all necessary compon
 - **Base Model:** StyleTTS2-LibriTTS
 - **Architecture:** StyleTTS2
 - **Task:** Text-to-Speech
-- **Last Checkpoint:** epoch_2nd_00009.pth
 ## Training Details
-- **Total Epochs:** 10
-- **Completed Epochs:** 9
-- **Total Iterations:** 4080
 - **Batch Size:** 2
-- **Max Length:** 630
 - **Learning Rate:** 0.0001
-- **Final Validation Loss:** 0.407607
 ## Model Components
 The repository includes all necessary components for inference:

 - **Base Model:** StyleTTS2-LibriTTS
 - **Architecture:** StyleTTS2
 - **Task:** Text-to-Speech
+- **Last Checkpoint:** epoch_2nd_00003.pth
 ## Training Details
+- **Total Epochs:** 5
+- **Completed Epochs:** 3
+- **Total Iterations:** 3384
 - **Batch Size:** 2
+- **Max Length:** 600
 - **Learning Rate:** 0.0001
+- **Final Validation Loss:** 0.399824
 ## Model Components
 The repository includes all necessary components for inference:

bert.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2f0264bc954462e498ae0affe1c4161b36e8029bbc76c869087c9b40917b95f8
 size 25178740

 version https://git-lfs.github.com/spec/v1
+oid sha256:f8547df3d46173d36f32153f6f5d0536a98bd9cd06ac53026946ff89dafdbf5d
 size 25178740

bert_encoder.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:987897733e7e7b710f6833233801b8545f9677397725acc79ee5cae34debf7cd
 size 1576502

 version https://git-lfs.github.com/spec/v1
+oid sha256:51a5c0ae501ee18c60230d9194c1666312297aab3f56961968ba1915efe81e95
 size 1576502

checkpoint.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8abbfa93106ef4950644e1de293e7fae3383911059f2ec110c641843b74bb420
 size 2242747934

 version https://git-lfs.github.com/spec/v1
+oid sha256:4867d7892552a55810009454aa79bed07670a40e5ebc03e3d1f1848fc3650f5b
 size 2242747934

config.json CHANGED Viewed

@@ -72,9 +72,9 @@
     "style_dim": 128
   },
   "training_config": {
-    "epochs": 10,
     "batch_size": 2,
-    "max_len": 630,
     "optimizer": {
       "bert_lr": 1e-05,
       "ft_lr": 0.0001,
@@ -112,9 +112,9 @@
     "val_data": "Data/val_list.txt"
   },
   "model_state": {
-    "epoch": 9,
-    "iterations": 4080,
-    "val_loss": 0.40760722756385803
   },
   "training_metrics": {
     "train_loss": [],
@@ -135,7 +135,12 @@
       29.0,
       11.0,
       52.0,
-      48.0
     ],
     "dur_loss": [
       0.44,
@@ -154,7 +159,12 @@
       0.399,
       0.409,
       0.397,
-      0.408
     ],
     "F0_loss": [
       2.865,
@@ -173,7 +183,12 @@
       2.515,
       2.663,
       2.66,
-      2.477
     ],
     "epochs": [
       1,
@@ -192,7 +207,12 @@
       14,
       15,
       16,
-      17
     ]
   }
 }

     "style_dim": 128
   },
   "training_config": {
+    "epochs": 5,
     "batch_size": 2,
+    "max_len": 600,
     "optimizer": {
       "bert_lr": 1e-05,
       "ft_lr": 0.0001,
     "val_data": "Data/val_list.txt"
   },
   "model_state": {
+    "epoch": 3,
+    "iterations": 3384,
+    "val_loss": 0.39982396364212036
   },
   "training_metrics": {
     "train_loss": [],
       29.0,
       11.0,
       52.0,
+      48.0,
+      18.0,
+      5.0,
+      4.0,
+      57.0,
+      9.0
     ],
     "dur_loss": [
       0.44,
       0.399,
       0.409,
       0.397,
+      0.408,
+      0.432,
+      0.404,
+      0.406,
+      0.4,
+      0.403
     ],
     "F0_loss": [
       2.865,
       2.515,
       2.663,
       2.66,
+      2.477,
+      1.751,
+      1.739,
+      1.76,
+      1.691,
+      1.72
     ],
     "epochs": [
       1,
       14,
       15,
       16,
+      17,
+      18,
+      19,
+      20,
+      21,
+      22
     ]
   }
 }

decoder.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:93e8cad16f38b082ebd13c2f75c41ee8165fd4533241ca8f5df61368c0a3587c
 size 217409318

 version https://git-lfs.github.com/spec/v1
+oid sha256:8385ec0be347a4251cddfd7391ac2e3a468c77967caddb023f13d5c5d2232343
 size 217409318

diffusion.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e51e3b27078fa10c2fc80c502567edaf2d8355aa287683b4d4915d7a2c4f3913
 size 101337326

 version https://git-lfs.github.com/spec/v1
+oid sha256:8324d4c337027ced9ac87fe0018ff90cb74fa8d2652ea6cdf2a9d3f0ed232a3f
 size 101337326

mpd.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a140e610e83ccd6e9407be6b13f9ddff5121525ff3af9319713adb8d6861cc17
 size 164447824

 version https://git-lfs.github.com/spec/v1
+oid sha256:0a7cc86c797abefbcb2b5f60c8f5416f5366d1bbde05c203d5828266655fe974
 size 164447824

msd.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1bd53c1bb0b77a649e2208095f2828d71ed57ac4b9bdbebebc93f4b2cc5550ec
 size 1139020

 version https://git-lfs.github.com/spec/v1
+oid sha256:19d2b444de08e4e33b867114da66af862cc9a20f3ee2778a147bf4689395f15d
 size 1139020

predictor.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:37bf44866e70d0c11616661ce4a02c1a8d172f1c222cf246684ba1c4ad57f6df
 size 64813639

 version https://git-lfs.github.com/spec/v1
+oid sha256:a7fcdf269e32fe125ca2bc3095a4c8a591b1034d886ccbcc7bc6cc808722cacc
 size 64813639

predictor_encoder.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ac439c809ecffef6cf8d130be1888781916358489101f9d1b0f967ad3f5337e2
 size 55547155

 version https://git-lfs.github.com/spec/v1
+oid sha256:ef15e2dcf88df69ec0e3b324f481de2c1b387c047e0a2375ab9219b924594aca
 size 55547155

style_encoder.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:478c67e53980c87515d613b9afd79055584930cf00c56266b938a6b432d16902
 size 55546871

 version https://git-lfs.github.com/spec/v1
+oid sha256:66f099fbedb7cd0cc47fa849f9efa2bd076a70285fd36062ed89b97725d2ce03
 size 55546871

text_aligner.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:dad7dc341e2e7b8095f29aa7513f01ddec5d1be410f09fbd3adb6b41b2f27b52
 size 31531315

 version https://git-lfs.github.com/spec/v1
+oid sha256:1e8d32afb6ff2248713b03d1e73d5fbe6ada4f50be8575e86fb537a189f9d080
 size 31531315

text_encoder.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6d611064414bd8a986460aad4f93666b5f7fa98aa131de2bdbe3dd27ee430332
 size 22432460

 version https://git-lfs.github.com/spec/v1
+oid sha256:11cad4fab0fd34170fdd88a62129dac783dbd25eedaba045a65f2d760030462a
 size 22432460

training_metrics.png CHANGED Viewed