{
"codebook_embed_dim": 64,
"codebook_l2_norm": true,
"codebook_show_usage": true,
"codebook_size": 8192,
"commit_loss_beta": 0.25,
"dec_drop_path_rate": 0.0,
"dec_patch_size": 16,
"dec_pretrained": false,
"dec_tuning_method": "full",
"dec_type": "vit",
"decoder_ch_mult": [
1,
1,
2,
2,
4
],
"decoder_model": "vit_large_patch14_dinov2.lvd142m",
"dropout_p": 0.0,
"enc_drop_path_rate": 0.0,
"enc_patch_size": 16,
"enc_pretrained": true,
"enc_tuning_method": "full",
"enc_type": "vit",
"encoder_ch_mult": [
1,
1,
2,
2,
4
],
"encoder_model": "vit_base_patch14_dinov2.lvd142m",
"entropy_loss_ratio": 0.0,
"image_size": 256,
"kl_loss_weight": 1e-06,
"num_codebooks": 4,
"num_latent_tokens": 32,
"repa": false,
"repa_align": "global",
"repa_layer_indices": [
8
],
"repa_loss_weight": 0.1,
"repa_model": "vit_base_patch16_224",
"repa_patch_size": 16,
"repa_proj_dim": 2048,
"tau": 0.07,
"vq_loss_ratio": 1.0,
"vq_mean": 0.0010870857,
"vq_std": 0.028672216,
"z_channels": 256
}