mrq committed on
Commit
d606fd5
·
1 Parent(s): 96dc9c7
ckpt/ar+nar-double-retnet-4/fp32.pth DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:2a9a4537d4ccfff0f5ececdb46d2342b0de2879837417ef11e23fc028f3d3f99
3
- size 827624127
 
 
 
 
ckpt/ar+nar-retnet-4/fp32.pth DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:548246e8f11ed3cb13ec3f520a665e02fe6227d979f63b832a8bc036f0c0a67b
3
- size 424338659
 
 
 
 
ckpt/ar-retnet-4/fp32.pth DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:e042d05f14f21a166cd5f5c16b9c9c4ac9ce18af2a4c285c7f0d3ef3ea6729bf
3
- size 418040575
 
 
 
 
ckpt/nar-retnet-4/fp32.pth DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:18027cafe3c077cb8786a5665f04f732f4e3fcacff17844182f9383a1dca640f
3
- size 422230719
 
 
 
 
config.ar_nar_double.yaml DELETED
@@ -1,105 +0,0 @@
1
- dataset:
2
- training: [
3
- ]
4
- validation: [
5
- ]
6
- noise: [
7
- ]
8
-
9
- speaker_name_getter: "lambda p: f'{p.parts[-3]}_{p.parts[-2]}'"
10
-
11
- use_hdf5: True
12
- use_metadata: True
13
- hdf5_flag: r
14
- validate: True
15
-
16
- workers: 4
17
- cache: True
18
-
19
- phones_range: [4, 256]
20
- duration_range: [1.0, 16.0]
21
-
22
- random_utterance: 1.0
23
- max_prompts: 3
24
- prompt_duration: 3.0
25
-
26
- sample_type: speaker
27
-
28
- tasks_list: ["tts"] # , "ns", "sr", "tse", "cse", "nse", "tts"]
29
-
30
- models:
31
- _prom_levels: 4
32
- _max_levels: 8
33
-
34
- _models:
35
- - name: "ar+nar"
36
- size: "double"
37
- resp_levels: 4
38
- prom_levels: 4
39
- tasks: 8
40
- arch_type: "retnet"
41
- training: True
42
-
43
- hyperparameters:
44
- batch_size: 8
45
- gradient_accumulation_steps: 1
46
- gradient_clipping: 100
47
-
48
- optimizer: AdamW
49
- learning_rate: 1.0e-5
50
-
51
- scheduler_type: ""
52
-
53
- evaluation:
54
- batch_size: 16
55
- frequency: 500
56
- size: 16
57
-
58
- steps: 300
59
- ar_temperature: 0.95
60
- nar_temperature: 0.25
61
- load_disabled_engines: True
62
-
63
- trainer:
64
- iterations: 1_000_000
65
-
66
- save_tag: step
67
- save_on_oom: True
68
- save_on_quit: True
69
- save_frequency: 500
70
- export_on_save: True
71
-
72
- keep_last_checkpoints: 4
73
-
74
- aggressive_optimizations: False
75
- load_disabled_engines: False
76
-
77
- load_state_dict: True
78
-
79
- gc_mode: None # "global_step"
80
-
81
- weight_dtype: float32
82
- amp: False
83
-
84
- backend: local
85
- deepspeed:
86
- zero_optimization_level: 0
87
- use_compression_training: True
88
-
89
- inference:
90
- weight_dtype: float32
91
- amp: False
92
-
93
- use_vocos: True
94
- normalize: False
95
-
96
- recurrent_chunk_size: 0
97
- recurrent_forward: False
98
-
99
- bitsandbytes:
100
- enabled: False
101
- injects: True
102
- linear: True
103
- embedding: True
104
-
105
- device: cpu