bghira committed on
Commit
3b244a5
1 Parent(s): cdc99cd

Model card auto-generated by SimpleTuner

Browse files
Files changed (1) hide show
  1. README.md +5 -8
README.md CHANGED
@@ -143,13 +143,13 @@ You may reuse the base model text encoder for inference.
143
  - Training steps: 100
144
  - Learning rate: 1e-05
145
  - Max grad norm: 0.01
146
- - Effective batch size: 12
147
- - Micro-batch size: 4
148
  - Gradient accumulation steps: 1
149
  - Number of GPUs: 3
150
  - Prediction type: flow-matching
151
  - Rescaled betas zero SNR: False
152
- - Optimizer: optimi-lion
153
  - Precision: Pure BF16
154
  - Quantised: Yes: int8-quanto
155
  - Xformers: Not used
@@ -165,14 +165,11 @@ You may reuse the base model text encoder for inference.
165
  "factor": 12,
166
  "apply_preset": {
167
  "target_module": [
168
- "JointTransformerBlock"
169
  ],
170
  "module_algo_map": {
171
- "FeedForward": {
172
  "factor": 6
173
- },
174
- "JointTransformerBlock": {
175
- "factor": 12
176
  }
177
  }
178
  }
 
143
  - Training steps: 100
144
  - Learning rate: 1e-05
145
  - Max grad norm: 0.01
146
+ - Effective batch size: 3
147
+ - Micro-batch size: 1
148
  - Gradient accumulation steps: 1
149
  - Number of GPUs: 3
150
  - Prediction type: flow-matching
151
  - Rescaled betas zero SNR: False
152
+ - Optimizer: optimi-stableadamw
153
  - Precision: Pure BF16
154
  - Quantised: Yes: int8-quanto
155
  - Xformers: Not used
 
165
  "factor": 12,
166
  "apply_preset": {
167
  "target_module": [
168
+ "Attention"
169
  ],
170
  "module_algo_map": {
171
+ "Attention": {
172
  "factor": 6
 
 
 
173
  }
174
  }
175
  }