nielsgl committed on
Commit
a2e9761
1 Parent(s): 16cacad

Push Keras model using huggingface_hub.

Browse files
.gitattributes CHANGED
@@ -32,3 +32,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
32
  *.zip filter=lfs diff=lfs merge=lfs -text
33
  *.zst filter=lfs diff=lfs merge=lfs -text
34
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
32
  *.zip filter=lfs diff=lfs merge=lfs -text
33
  *.zst filter=lfs diff=lfs merge=lfs -text
34
  *tfevents* filter=lfs diff=lfs merge=lfs -text
35
+ variables/variables.data-00000-of-00001 filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,41 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ library_name: keras
3
+ ---
4
+
5
+ ## Model description
6
+
7
+ More information needed
8
+
9
+ ## Intended uses & limitations
10
+
11
+ More information needed
12
+
13
+ ## Training and evaluation data
14
+
15
+ More information needed
16
+
17
+ ## Training procedure
18
+
19
+ ### Training hyperparameters
20
+
21
+ The following hyperparameters were used during training:
22
+
23
+ | Hyperparameters | Value |
24
+ | :-- | :-- |
25
+ | name | RMSprop |
26
+ | weight_decay | None |
27
+ | clipnorm | None |
28
+ | global_clipnorm | None |
29
+ | clipvalue | None |
30
+ | use_ema | False |
31
+ | ema_momentum | 0.99 |
32
+ | ema_overwrite_frequency | 100 |
33
+ | jit_compile | True |
34
+ | is_legacy_optimizer | False |
35
+ | learning_rate | 0.0010000000474974513 |
36
+ | rho | 0.9 |
37
+ | momentum | 0.0 |
38
+ | epsilon | 1e-07 |
39
+ | centered | False |
40
+ | training_precision | float32 |
41
+
config.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"name": "diffusion_model_v2_1", "layers": [{"class_name": "InputLayer", "config": {"batch_input_shape": [null, 320], "dtype": "float32", "sparse": false, "ragged": false, "name": "input_5"}, "name": "input_5", "inbound_nodes": []}, {"class_name": "Dense", "config": {"name": "dense_216", "trainable": true, "dtype": "float32", "units": 1280, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}}, "bias_initializer": {"class_name": "Zeros", "config": {}}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "name": "dense_216", "inbound_nodes": [[["input_5", 0, 0, {}]]]}, {"class_name": "InputLayer", "config": {"batch_input_shape": [null, 64, 64, 4], "dtype": "float32", "sparse": false, "ragged": false, "name": "input_6"}, "name": "input_6", "inbound_nodes": []}, {"class_name": "Activation", "config": {"name": "activation_68", "trainable": true, "dtype": "float32", "activation": "swish"}, "name": "activation_68", "inbound_nodes": [[["dense_216", 0, 0, {}]]]}, {"class_name": "PaddedConv2D", "config": {"name": "padded_conv2d_52", "trainable": true, "dtype": "float32", "kernel_size": 3, "padding": 1, "filters": 320}, "name": "padded_conv2d_52", "inbound_nodes": [[["input_6", 0, 0, {}]]]}, {"class_name": "Dense", "config": {"name": "dense_217", "trainable": true, "dtype": "float32", "units": 1280, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}}, "bias_initializer": {"class_name": "Zeros", "config": {}}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "name": "dense_217", "inbound_nodes": [[["activation_68", 0, 0, {}]]]}, {"class_name": "ResBlock", "config": {"name": "res_block_22", "trainable": true, "dtype": "float32", "output_dim": 320}, "name": 
"res_block_22", "inbound_nodes": [[["padded_conv2d_52", 0, 0, {}], ["dense_217", 0, 0, {}]]]}, {"class_name": "InputLayer", "config": {"batch_input_shape": [null, 77, 1024], "dtype": "float32", "sparse": false, "ragged": false, "name": "input_4"}, "name": "input_4", "inbound_nodes": []}, {"class_name": "SpatialTransformer", "config": {"name": "spatial_transformer_16", "trainable": true, "dtype": "float32", "fully_connected": true, "num_heads": 5, "head_size": 64}, "name": "spatial_transformer_16", "inbound_nodes": [[["res_block_22", 0, 0, {}], ["input_4", 0, 0, {}]]]}, {"class_name": "ResBlock", "config": {"name": "res_block_23", "trainable": true, "dtype": "float32", "output_dim": 320}, "name": "res_block_23", "inbound_nodes": [[["spatial_transformer_16", 0, 0, {}], ["dense_217", 0, 0, {}]]]}, {"class_name": "SpatialTransformer", "config": {"name": "spatial_transformer_17", "trainable": true, "dtype": "float32", "fully_connected": true, "num_heads": 5, "head_size": 64}, "name": "spatial_transformer_17", "inbound_nodes": [[["res_block_23", 0, 0, {}], ["input_4", 0, 0, {}]]]}, {"class_name": "PaddedConv2D", "config": {"name": "padded_conv2d_57", "trainable": true, "dtype": "float32", "strides": 2, "padding": 1, "filters": 320, "kernel_size": 3}, "name": "padded_conv2d_57", "inbound_nodes": [[["spatial_transformer_17", 0, 0, {}]]]}, {"class_name": "ResBlock", "config": {"name": "res_block_24", "trainable": true, "dtype": "float32", "output_dim": 640}, "name": "res_block_24", "inbound_nodes": [[["padded_conv2d_57", 0, 0, {}], ["dense_217", 0, 0, {}]]]}, {"class_name": "SpatialTransformer", "config": {"name": "spatial_transformer_18", "trainable": true, "dtype": "float32", "fully_connected": true, "num_heads": 10, "head_size": 64}, "name": "spatial_transformer_18", "inbound_nodes": [[["res_block_24", 0, 0, {}], ["input_4", 0, 0, {}]]]}, {"class_name": "ResBlock", "config": {"name": "res_block_25", "trainable": true, "dtype": "float32", "output_dim": 640}, "name": 
"res_block_25", "inbound_nodes": [[["spatial_transformer_18", 0, 0, {}], ["dense_217", 0, 0, {}]]]}, {"class_name": "SpatialTransformer", "config": {"name": "spatial_transformer_19", "trainable": true, "dtype": "float32", "fully_connected": true, "num_heads": 10, "head_size": 64}, "name": "spatial_transformer_19", "inbound_nodes": [[["res_block_25", 0, 0, {}], ["input_4", 0, 0, {}]]]}, {"class_name": "PaddedConv2D", "config": {"name": "padded_conv2d_62", "trainable": true, "dtype": "float32", "strides": 2, "padding": 1, "filters": 640, "kernel_size": 3}, "name": "padded_conv2d_62", "inbound_nodes": [[["spatial_transformer_19", 0, 0, {}]]]}, {"class_name": "ResBlock", "config": {"name": "res_block_26", "trainable": true, "dtype": "float32", "output_dim": 1280}, "name": "res_block_26", "inbound_nodes": [[["padded_conv2d_62", 0, 0, {}], ["dense_217", 0, 0, {}]]]}, {"class_name": "SpatialTransformer", "config": {"name": "spatial_transformer_20", "trainable": true, "dtype": "float32", "fully_connected": true, "num_heads": 20, "head_size": 64}, "name": "spatial_transformer_20", "inbound_nodes": [[["res_block_26", 0, 0, {}], ["input_4", 0, 0, {}]]]}, {"class_name": "ResBlock", "config": {"name": "res_block_27", "trainable": true, "dtype": "float32", "output_dim": 1280}, "name": "res_block_27", "inbound_nodes": [[["spatial_transformer_20", 0, 0, {}], ["dense_217", 0, 0, {}]]]}, {"class_name": "SpatialTransformer", "config": {"name": "spatial_transformer_21", "trainable": true, "dtype": "float32", "fully_connected": true, "num_heads": 20, "head_size": 64}, "name": "spatial_transformer_21", "inbound_nodes": [[["res_block_27", 0, 0, {}], ["input_4", 0, 0, {}]]]}, {"class_name": "PaddedConv2D", "config": {"name": "padded_conv2d_67", "trainable": true, "dtype": "float32", "strides": 2, "padding": 1, "filters": 1280, "kernel_size": 3}, "name": "padded_conv2d_67", "inbound_nodes": [[["spatial_transformer_21", 0, 0, {}]]]}, {"class_name": "ResBlock", "config": {"name": 
"res_block_28", "trainable": true, "dtype": "float32", "output_dim": 1280}, "name": "res_block_28", "inbound_nodes": [[["padded_conv2d_67", 0, 0, {}], ["dense_217", 0, 0, {}]]]}, {"class_name": "ResBlock", "config": {"name": "res_block_29", "trainable": true, "dtype": "float32", "output_dim": 1280}, "name": "res_block_29", "inbound_nodes": [[["res_block_28", 0, 0, {}], ["dense_217", 0, 0, {}]]]}, {"class_name": "ResBlock", "config": {"name": "res_block_30", "trainable": true, "dtype": "float32", "output_dim": 1280}, "name": "res_block_30", "inbound_nodes": [[["res_block_29", 0, 0, {}], ["dense_217", 0, 0, {}]]]}, {"class_name": "SpatialTransformer", "config": {"name": "spatial_transformer_22", "trainable": true, "dtype": "float32", "fully_connected": true, "num_heads": 20, "head_size": 64}, "name": "spatial_transformer_22", "inbound_nodes": [[["res_block_30", 0, 0, {}], ["input_4", 0, 0, {}]]]}, {"class_name": "ResBlock", "config": {"name": "res_block_31", "trainable": true, "dtype": "float32", "output_dim": 1280}, "name": "res_block_31", "inbound_nodes": [[["spatial_transformer_22", 0, 0, {}], ["dense_217", 0, 0, {}]]]}, {"class_name": "Concatenate", "config": {"name": "concatenate_12", "trainable": true, "dtype": "float32", "axis": -1}, "name": "concatenate_12", "inbound_nodes": [[["res_block_31", 0, 0, {}], ["res_block_29", 0, 0, {}]]]}, {"class_name": "ResBlock", "config": {"name": "res_block_32", "trainable": true, "dtype": "float32", "output_dim": 1280}, "name": "res_block_32", "inbound_nodes": [[["concatenate_12", 0, 0, {}], ["dense_217", 0, 0, {}]]]}, {"class_name": "Concatenate", "config": {"name": "concatenate_13", "trainable": true, "dtype": "float32", "axis": -1}, "name": "concatenate_13", "inbound_nodes": [[["res_block_32", 0, 0, {}], ["res_block_28", 0, 0, {}]]]}, {"class_name": "ResBlock", "config": {"name": "res_block_33", "trainable": true, "dtype": "float32", "output_dim": 1280}, "name": "res_block_33", "inbound_nodes": [[["concatenate_13", 0, 0, 
{}], ["dense_217", 0, 0, {}]]]}, {"class_name": "Concatenate", "config": {"name": "concatenate_14", "trainable": true, "dtype": "float32", "axis": -1}, "name": "concatenate_14", "inbound_nodes": [[["res_block_33", 0, 0, {}], ["padded_conv2d_67", 0, 0, {}]]]}, {"class_name": "ResBlock", "config": {"name": "res_block_34", "trainable": true, "dtype": "float32", "output_dim": 1280}, "name": "res_block_34", "inbound_nodes": [[["concatenate_14", 0, 0, {}], ["dense_217", 0, 0, {}]]]}, {"class_name": "Upsample", "config": {"name": "upsample_3", "trainable": true, "dtype": "float32", "channels": 1280}, "name": "upsample_3", "inbound_nodes": [[["res_block_34", 0, 0, {}]]]}, {"class_name": "Concatenate", "config": {"name": "concatenate_15", "trainable": true, "dtype": "float32", "axis": -1}, "name": "concatenate_15", "inbound_nodes": [[["upsample_3", 0, 0, {}], ["spatial_transformer_21", 0, 0, {}]]]}, {"class_name": "ResBlock", "config": {"name": "res_block_35", "trainable": true, "dtype": "float32", "output_dim": 1280}, "name": "res_block_35", "inbound_nodes": [[["concatenate_15", 0, 0, {}], ["dense_217", 0, 0, {}]]]}, {"class_name": "SpatialTransformer", "config": {"name": "spatial_transformer_23", "trainable": true, "dtype": "float32", "fully_connected": true, "num_heads": 20, "head_size": 64}, "name": "spatial_transformer_23", "inbound_nodes": [[["res_block_35", 0, 0, {}], ["input_4", 0, 0, {}]]]}, {"class_name": "Concatenate", "config": {"name": "concatenate_16", "trainable": true, "dtype": "float32", "axis": -1}, "name": "concatenate_16", "inbound_nodes": [[["spatial_transformer_23", 0, 0, {}], ["spatial_transformer_20", 0, 0, {}]]]}, {"class_name": "ResBlock", "config": {"name": "res_block_36", "trainable": true, "dtype": "float32", "output_dim": 1280}, "name": "res_block_36", "inbound_nodes": [[["concatenate_16", 0, 0, {}], ["dense_217", 0, 0, {}]]]}, {"class_name": "SpatialTransformer", "config": {"name": "spatial_transformer_24", "trainable": true, "dtype": 
"float32", "fully_connected": true, "num_heads": 20, "head_size": 64}, "name": "spatial_transformer_24", "inbound_nodes": [[["res_block_36", 0, 0, {}], ["input_4", 0, 0, {}]]]}, {"class_name": "Concatenate", "config": {"name": "concatenate_17", "trainable": true, "dtype": "float32", "axis": -1}, "name": "concatenate_17", "inbound_nodes": [[["spatial_transformer_24", 0, 0, {}], ["padded_conv2d_62", 0, 0, {}]]]}, {"class_name": "ResBlock", "config": {"name": "res_block_37", "trainable": true, "dtype": "float32", "output_dim": 1280}, "name": "res_block_37", "inbound_nodes": [[["concatenate_17", 0, 0, {}], ["dense_217", 0, 0, {}]]]}, {"class_name": "SpatialTransformer", "config": {"name": "spatial_transformer_25", "trainable": true, "dtype": "float32", "fully_connected": true, "num_heads": 20, "head_size": 64}, "name": "spatial_transformer_25", "inbound_nodes": [[["res_block_37", 0, 0, {}], ["input_4", 0, 0, {}]]]}, {"class_name": "Upsample", "config": {"name": "upsample_4", "trainable": true, "dtype": "float32", "channels": 1280}, "name": "upsample_4", "inbound_nodes": [[["spatial_transformer_25", 0, 0, {}]]]}, {"class_name": "Concatenate", "config": {"name": "concatenate_18", "trainable": true, "dtype": "float32", "axis": -1}, "name": "concatenate_18", "inbound_nodes": [[["upsample_4", 0, 0, {}], ["spatial_transformer_19", 0, 0, {}]]]}, {"class_name": "ResBlock", "config": {"name": "res_block_38", "trainable": true, "dtype": "float32", "output_dim": 640}, "name": "res_block_38", "inbound_nodes": [[["concatenate_18", 0, 0, {}], ["dense_217", 0, 0, {}]]]}, {"class_name": "SpatialTransformer", "config": {"name": "spatial_transformer_26", "trainable": true, "dtype": "float32", "fully_connected": true, "num_heads": 10, "head_size": 64}, "name": "spatial_transformer_26", "inbound_nodes": [[["res_block_38", 0, 0, {}], ["input_4", 0, 0, {}]]]}, {"class_name": "Concatenate", "config": {"name": "concatenate_19", "trainable": true, "dtype": "float32", "axis": -1}, "name": 
"concatenate_19", "inbound_nodes": [[["spatial_transformer_26", 0, 0, {}], ["spatial_transformer_18", 0, 0, {}]]]}, {"class_name": "ResBlock", "config": {"name": "res_block_39", "trainable": true, "dtype": "float32", "output_dim": 640}, "name": "res_block_39", "inbound_nodes": [[["concatenate_19", 0, 0, {}], ["dense_217", 0, 0, {}]]]}, {"class_name": "SpatialTransformer", "config": {"name": "spatial_transformer_27", "trainable": true, "dtype": "float32", "fully_connected": true, "num_heads": 10, "head_size": 64}, "name": "spatial_transformer_27", "inbound_nodes": [[["res_block_39", 0, 0, {}], ["input_4", 0, 0, {}]]]}, {"class_name": "Concatenate", "config": {"name": "concatenate_20", "trainable": true, "dtype": "float32", "axis": -1}, "name": "concatenate_20", "inbound_nodes": [[["spatial_transformer_27", 0, 0, {}], ["padded_conv2d_57", 0, 0, {}]]]}, {"class_name": "ResBlock", "config": {"name": "res_block_40", "trainable": true, "dtype": "float32", "output_dim": 640}, "name": "res_block_40", "inbound_nodes": [[["concatenate_20", 0, 0, {}], ["dense_217", 0, 0, {}]]]}, {"class_name": "SpatialTransformer", "config": {"name": "spatial_transformer_28", "trainable": true, "dtype": "float32", "fully_connected": true, "num_heads": 10, "head_size": 64}, "name": "spatial_transformer_28", "inbound_nodes": [[["res_block_40", 0, 0, {}], ["input_4", 0, 0, {}]]]}, {"class_name": "Upsample", "config": {"name": "upsample_5", "trainable": true, "dtype": "float32", "channels": 640}, "name": "upsample_5", "inbound_nodes": [[["spatial_transformer_28", 0, 0, {}]]]}, {"class_name": "Concatenate", "config": {"name": "concatenate_21", "trainable": true, "dtype": "float32", "axis": -1}, "name": "concatenate_21", "inbound_nodes": [[["upsample_5", 0, 0, {}], ["spatial_transformer_17", 0, 0, {}]]]}, {"class_name": "ResBlock", "config": {"name": "res_block_41", "trainable": true, "dtype": "float32", "output_dim": 320}, "name": "res_block_41", "inbound_nodes": [[["concatenate_21", 0, 0, {}], 
["dense_217", 0, 0, {}]]]}, {"class_name": "SpatialTransformer", "config": {"name": "spatial_transformer_29", "trainable": true, "dtype": "float32", "fully_connected": true, "num_heads": 5, "head_size": 64}, "name": "spatial_transformer_29", "inbound_nodes": [[["res_block_41", 0, 0, {}], ["input_4", 0, 0, {}]]]}, {"class_name": "Concatenate", "config": {"name": "concatenate_22", "trainable": true, "dtype": "float32", "axis": -1}, "name": "concatenate_22", "inbound_nodes": [[["spatial_transformer_29", 0, 0, {}], ["spatial_transformer_16", 0, 0, {}]]]}, {"class_name": "ResBlock", "config": {"name": "res_block_42", "trainable": true, "dtype": "float32", "output_dim": 320}, "name": "res_block_42", "inbound_nodes": [[["concatenate_22", 0, 0, {}], ["dense_217", 0, 0, {}]]]}, {"class_name": "SpatialTransformer", "config": {"name": "spatial_transformer_30", "trainable": true, "dtype": "float32", "fully_connected": true, "num_heads": 5, "head_size": 64}, "name": "spatial_transformer_30", "inbound_nodes": [[["res_block_42", 0, 0, {}], ["input_4", 0, 0, {}]]]}, {"class_name": "Concatenate", "config": {"name": "concatenate_23", "trainable": true, "dtype": "float32", "axis": -1}, "name": "concatenate_23", "inbound_nodes": [[["spatial_transformer_30", 0, 0, {}], ["padded_conv2d_52", 0, 0, {}]]]}, {"class_name": "ResBlock", "config": {"name": "res_block_43", "trainable": true, "dtype": "float32", "output_dim": 320}, "name": "res_block_43", "inbound_nodes": [[["concatenate_23", 0, 0, {}], ["dense_217", 0, 0, {}]]]}, {"class_name": "SpatialTransformer", "config": {"name": "spatial_transformer_31", "trainable": true, "dtype": "float32", "fully_connected": true, "num_heads": 5, "head_size": 64}, "name": "spatial_transformer_31", "inbound_nodes": [[["res_block_43", 0, 0, {}], ["input_4", 0, 0, {}]]]}, {"class_name": "GroupNormalization", "config": {"name": "group_normalization_121", "trainable": true, "dtype": "float32", "groups": 32, "axis": -1, "epsilon": 1e-05, "center": true, 
"scale": true, "beta_initializer": {"class_name": "Zeros", "config": {}}, "gamma_initializer": {"class_name": "Ones", "config": {}}, "beta_regularizer": null, "gamma_regularizer": null, "beta_constraint": null, "gamma_constraint": null}, "name": "group_normalization_121", "inbound_nodes": [[["spatial_transformer_31", 0, 0, {}]]]}, {"class_name": "Activation", "config": {"name": "activation_135", "trainable": true, "dtype": "float32", "activation": "swish"}, "name": "activation_135", "inbound_nodes": [[["group_normalization_121", 0, 0, {}]]]}, {"class_name": "PaddedConv2D", "config": {"name": "padded_conv2d_103", "trainable": true, "dtype": "float32", "kernel_size": 3, "padding": 1, "filters": 4}, "name": "padded_conv2d_103", "inbound_nodes": [[["activation_135", 0, 0, {}]]]}], "input_layers": [["input_6", 0, 0], ["input_5", 0, 0], ["input_4", 0, 0]], "output_layers": [["padded_conv2d_103", 0, 0]]}
fingerprint.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0b16228531a786827ee203eed188b8e00f36d61e894b08d5d5fdd0ff29cbaba8
3
+ size 54
keras_metadata.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f080a2c6ffad79698a6b4d2c93a939991d91927960c71f0a0c2e643279c4b135
3
+ size 680264
saved_model.pb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:85e67012c303c6ba80b2c0a9d32432f398c47214086da9fdbb66425a3c464635
3
+ size 20050011
variables/variables.data-00000-of-00001 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f658ba99dab1708e941a903da7baf568da401e300a6ddb13b909b7cc1fb6c0ad
3
+ size 3464157998
variables/variables.index ADDED
Binary file (40.3 kB). View file