Joosep Pata committed on
Commit
fd4e297
•
1 Parent(s): 18d58e0

add CMS benchmark model

Browse files
.gitattributes CHANGED
@@ -34,3 +34,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
  weights-96-5.346523.hdf5 filter=lfs diff=lfs merge=lfs -text
 
 
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
  weights-96-5.346523.hdf5 filter=lfs diff=lfs merge=lfs -text
37
+ *.hdf5 filter=lfs diff=lfs merge=lfs -text
opt-96-5.346523.pkl → clic/clusters/v1.6/opt-96-5.346523.pkl RENAMED
File without changes
weights-96-5.346523.hdf5 → clic/clusters/v1.6/weights-96-5.346523.hdf5 RENAMED
File without changes
cms/2023_10_12/config.yaml ADDED
@@ -0,0 +1,323 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ backend: tensorflow
2
+
3
+ cache: caches/cms_gen
4
+
5
+ dataset:
6
+ schema: cms
7
+ target_particles: gen
8
+ num_input_features: 42
9
+ # NONE = 0,
10
+ # TRACK = 1,
11
+ # PS1 = 2,
12
+ # PS2 = 3,
13
+ # ECAL = 4,
14
+ # HCAL = 5,
15
+ # GSF = 6,
16
+ # BREM = 7,
17
+ # HFEM = 8,
18
+ # HFHAD = 9,
19
+ # SC = 10,
20
+ # HO = 11,
21
+ num_input_classes: 12
22
+ #(none=0, ch.had=1, n.had=2, hfem=3, hfhad=4, gamma=5, e=6, mu=7)
23
+ num_output_classes: 8
24
+ padded_num_elem_size: 6400
25
+ cls_weight_by_pt: no
26
+ reg_weight_by_pt: no
27
+ enable_tfds_caching: no
28
+
29
+ loss:
30
+ classification_loss_coef: 100.0
31
+ charge_loss_coef: 1.0
32
+ pt_loss_coef: 1.0
33
+ eta_loss_coef: 1.0
34
+ sin_phi_loss_coef: 1.0
35
+ cos_phi_loss_coef: 1.0
36
+ energy_loss_coef: 1.0
37
+ cls_loss:
38
+ type: SigmoidFocalCrossEntropy
39
+ from_logits: yes
40
+ gamma: 2.0
41
+ charge_loss:
42
+ type: CategoricalCrossentropy
43
+ from_logits: yes
44
+ energy_loss:
45
+ type: Huber
46
+ pt_loss:
47
+ type: Huber
48
+ sin_phi_loss:
49
+ type: Huber
50
+ delta: 0.1
51
+ cos_phi_loss:
52
+ type: Huber
53
+ delta: 0.1
54
+ eta_loss:
55
+ type: Huber
56
+ delta: 0.1
57
+ event_loss: none #none, sliced_wasserstein, gen_jet_logcosh, gen_jet_mse, hist_2d
58
+ event_loss_coef: 1.0
59
+ met_loss: none
60
+ met_loss_coef: 1.0
61
+
62
+ tensorflow:
63
+ eager: no
64
+
65
+ setup:
66
+ train: yes
67
+ weights:
68
+ weights_config:
69
+ lr: 0.00005
70
+ num_epochs: 55
71
+ dtype: float32
72
+ trainable:
73
+ lr_schedule: none # cosinedecay, exponentialdecay, onecycle, none
74
+ optimizer: adam # adam, adamw, sgd
75
+ horovod_enabled: no
76
+ cls_output_as_logits: yes
77
+ #if enabled, do not create LSH bins for small graphs (less than one bin size)
78
+ #enabling results in some speedup for gun samples, but must be disabled for XLA
79
+ small_graph_opt: yes
80
+ use_normalizer: no
81
+
82
+ batching:
83
+ # if enabled, use dynamic batching instead of the fixed-size batches configured in batch_per_gpu
84
+ bucket_by_sequence_length: yes
85
+ bucket_batch_sizes: auto
86
+ batch_multiplier: 1
87
+
88
+ optimizer:
89
+ adam:
90
+ amsgrad: no
91
+ adamw:
92
+ amsgrad: yes
93
+ weight_decay: 0.001
94
+ sgd:
95
+ nesterov: no
96
+ momentum: 0.9
97
+
98
+ # LR Schedules
99
+ exponentialdecay:
100
+ decay_steps: 2000
101
+ decay_rate: 0.99
102
+ staircase: yes
103
+ onecycle:
104
+ mom_min: 0.85
105
+ mom_max: 0.95
106
+ warmup_ratio: 0.3
107
+ div_factor: 25.0
108
+ final_div: 100000.0
109
+
110
+ parameters:
111
+ model: gnn_dense
112
+ input_encoding: cms
113
+ node_update_mode: additive
114
+ do_node_encoding: yes
115
+ node_encoding_hidden_dim: 512
116
+
117
+ combined_graph_layer:
118
+ bin_size: 640
119
+ max_num_bins: 200
120
+ distance_dim: 128
121
+ layernorm: yes
122
+ dropout: 0.0
123
+ dist_activation: elu
124
+ ffn_dist_num_layers: 2
125
+ ffn_dist_hidden_dim: 128
126
+
127
+ # GCN
128
+ kernel:
129
+ type: NodePairGaussianKernel
130
+ dist_mult: 0.1
131
+ clip_value_low: 0.0
132
+ dist_norm: l2
133
+ num_node_messages: 2
134
+ node_message:
135
+ type: GHConvDense
136
+ output_dim: 512
137
+ activation: elu
138
+ #if this is enabled, it will break float16 training
139
+ normalize_degrees: no
140
+ activation: elu
141
+
142
+ num_graph_layers_id: 3
143
+ num_graph_layers_reg: 3
144
+ output_decoding:
145
+ activation: elu
146
+ regression_use_classification: yes
147
+ dropout: 0.1
148
+
149
+ pt_as_correction: yes
150
+
151
+ id_dim_decrease: yes
152
+ charge_dim_decrease: yes
153
+ pt_dim_decrease: yes
154
+ eta_dim_decrease: yes
155
+ phi_dim_decrease: yes
156
+ energy_dim_decrease: yes
157
+
158
+ id_hidden_dim: 512
159
+ charge_hidden_dim: 256
160
+ pt_hidden_dim: 512
161
+ eta_hidden_dim: 256
162
+ phi_hidden_dim: 256
163
+ energy_hidden_dim: 512
164
+
165
+ id_num_layers: 3
166
+ charge_num_layers: 2
167
+ pt_num_layers: 2
168
+ eta_num_layers: 2
169
+ phi_num_layers: 2
170
+ energy_num_layers: 2
171
+ layernorm: yes
172
+ mask_reg_cls0: yes
173
+
174
+ skip_connection: no
175
+ debug: no
176
+
177
+ timing:
178
+ num_ev: 100
179
+ num_iter: 3
180
+
181
+ callbacks:
182
+ checkpoint:
183
+ monitor: "val_loss"
184
+ plot_freq: 1
185
+ tensorboard:
186
+ dump_history: yes
187
+ hist_freq: 1
188
+
189
+ hypertune:
190
+ algorithm: hyperband # random, bayesian, hyperband
191
+ random:
192
+ objective: val_loss
193
+ max_trials: 100
194
+ bayesian:
195
+ objective: val_loss
196
+ max_trials: 100
197
+ num_initial_points: 2
198
+ hyperband:
199
+ objective: val_loss
200
+ max_epochs: 10
201
+ factor: 3
202
+ iterations: 1
203
+ executions_per_trial: 1
204
+
205
+ raytune:
206
+ local_dir: # Note: please specify an absolute path
207
+ sched: asha # asha, hyperband
208
+ search_alg: # bayes, bohb, hyperopt, nevergrad, scikit
209
+ default_metric: "val_loss"
210
+ default_mode: "min"
211
+ # Tune schedule specific parameters
212
+ asha:
213
+ max_t: 200
214
+ reduction_factor: 4
215
+ brackets: 1
216
+ grace_period: 10
217
+ hyperband:
218
+ max_t: 200
219
+ reduction_factor: 4
220
+ hyperopt:
221
+ n_random_steps: 10
222
+ nevergrad:
223
+ n_random_steps: 10
224
+
225
+ train_test_datasets:
226
+ multiparticlegun:
227
+ batch_per_gpu: 1
228
+ event_pad_size: -1
229
+ datasets:
230
+ - cms_pf_multi_particle_gun
231
+ physical:
232
+ batch_per_gpu: 1
233
+ event_pad_size: -1
234
+ datasets:
235
+ - cms_pf_ttbar
236
+ - cms_pf_ztt
237
+ - cms_pf_qcd
238
+ - cms_pf_qcd_high_pt
239
+ - cms_pf_sms_t1tttt
240
+ gun:
241
+ batch_per_gpu: 50
242
+ event_pad_size: -1
243
+ datasets:
244
+ - cms_pf_single_electron
245
+ - cms_pf_single_gamma
246
+ - cms_pf_single_neutron
247
+ - cms_pf_single_pi0
248
+ - cms_pf_single_pi
249
+ - cms_pf_single_tau
250
+ - cms_pf_single_mu
251
+ - cms_pf_single_proton
252
+
253
+ evaluation_datasets:
254
+ cms_pf_qcd_high_pt:
255
+ batch_size: 5
256
+ num_events: -1
257
+ cms_pf_single_neutron:
258
+ batch_size: 100
259
+ num_events: -1
260
+
261
+ validation_dataset: cms_pf_qcd_high_pt
262
+ validation_batch_size: 5
263
+ validation_num_events: 500
264
+
265
+ evaluation_jet_algo: antikt_algorithm
266
+
267
+ datasets:
268
+ cms_pf_ttbar:
269
+ version: 1.6.0
270
+ data_dir:
271
+ manual_dir:
272
+ cms_pf_ztt:
273
+ version: 1.6.0
274
+ data_dir:
275
+ manual_dir:
276
+ cms_pf_qcd:
277
+ version: 1.6.0
278
+ data_dir:
279
+ manual_dir:
280
+ cms_pf_qcd_high_pt:
281
+ version: 1.6.0
282
+ data_dir:
283
+ manual_dir:
284
+ cms_pf_single_electron:
285
+ version: 1.6.0
286
+ data_dir:
287
+ manual_dir:
288
+ cms_pf_single_gamma:
289
+ version: 1.6.0
290
+ data_dir:
291
+ manual_dir:
292
+ cms_pf_single_pi0:
293
+ version: 1.6.0
294
+ data_dir:
295
+ manual_dir:
296
+ cms_pf_single_neutron:
297
+ version: 1.6.0
298
+ data_dir:
299
+ manual_dir:
300
+ cms_pf_single_pi:
301
+ version: 1.6.0
302
+ data_dir:
303
+ manual_dir:
304
+ cms_pf_single_tau:
305
+ version: 1.6.0
306
+ data_dir:
307
+ manual_dir:
308
+ cms_pf_single_mu:
309
+ version: 1.6.0
310
+ data_dir:
311
+ manual_dir:
312
+ cms_pf_single_proton:
313
+ version: 1.6.0
314
+ data_dir:
315
+ manual_dir:
316
+ cms_pf_multi_particle_gun:
317
+ version: 1.6.0
318
+ data_dir:
319
+ manual_dir:
320
+ cms_pf_sms_t1tttt:
321
+ version: 1.6.0
322
+ data_dir:
323
+ manual_dir:
cms/2023_10_12/model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6809bca035cac27e8f5d7ec43daf577902df9ec87a3ecb7cc5f524f5f9a1ca32
3
+ size 51061251
cms/2023_10_12/opt-51-1.401646.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ae8a3bc9a2f9dfb2d61cbb4cac572298d13fb19ad13bcb55046c9a2f3b1550d
3
+ size 100770916
cms/2023_10_12/weights-51-1.401646.hdf5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:17dd37ff89dac79c3b9185814cb1c4c669959fa320a254264a35394786ac06ed
3
+ size 50828328