# File size: 2,442 Bytes
# 652e089
# Top-level run settings. Notes below marked as assumptions are inferred from
# key names only and should be confirmed against the code that reads this file.
backend: pytorch
checkpoint_freq: 1
# Comet-related keys (presumably experiment logging -- TODO confirm).
comet: true
comet_name: particleflow-pt
comet_offline: false
comet_step_freq: 10
# Path of another configuration file; how it relates to this one is not
# visible here.
config: parameters/pytorch/pyg-cms.yaml
# Same value as `model.attention.conv_type` further down; presumably selects
# which `model.<name>` sub-section is active -- TODO confirm.
conv_type: attention
# NOTE(review): absolute, user-specific path; will likely need changing when
# this configuration is used on another machine.
data_dir: /scratch/persistent/joosep/tensorflow_datasets
dataset: cms
dtype: bfloat16
gpu_batch_multiplier: 20
gpus: 1
load: null
lr: 0.0001
lr_schedule: cosinedecay
# NOTE(review): `lr_schedule` is `cosinedecay`, but the only entry configured
# here is `onecycle`; confirm whether this entry is read for the selected
# schedule.
lr_schedule_config:
  onecycle:
    pct_start: 0.3
# Model hyperparameters. Four architecture sub-sections are present
# (`attention`, `gnn_lsh`, `gravnet`, `mamba`); each repeats its own name under
# its `conv_type` key. The remaining keys are scalar settings shared at the
# `model` level.
model:
  # Attention sub-section: 6 convs, 32 heads, head_dim 16; every dropout value
  # in this sub-section is 0.0.
  attention:
    activation: relu
    attention_type: flash
    conv_type: attention
    dropout_conv_id_ff: 0.0
    dropout_conv_id_mha: 0.0
    dropout_conv_reg_ff: 0.0
    dropout_conv_reg_mha: 0.0
    dropout_ff: 0.0
    head_dim: 16
    num_convs: 6
    num_heads: 32
  # The five `*_mode` keys at this level (cos_phi, energy, eta, pt, sin_phi)
  # are all set to `linear`.
  cos_phi_mode: linear
  energy_mode: linear
  eta_mode: linear
  # gnn_lsh sub-section: 3 convs, width and embedding_dim both 512.
  gnn_lsh:
    activation: elu
    bin_size: 640
    conv_type: gnn_lsh
    distance_dim: 128
    dropout_ff: 0.0
    embedding_dim: 512
    ffn_dist_hidden_dim: 128
    ffn_dist_num_layers: 2
    layernorm: true
    max_num_bins: 200
    num_convs: 3
    num_node_messages: 2
    width: 512
  # gravnet sub-section: the only sub-section with a non-zero dropout_ff (0.1).
  gravnet:
    activation: elu
    conv_type: gravnet
    dropout_ff: 0.1
    embedding_dim: 512
    k: 16
    num_convs: 3
    propagate_dimensions: 32
    space_dimensions: 4
    width: 512
  input_encoding: joint
  learned_representation_mode: last
  # mamba sub-section: 4 convs, width and embedding_dim both 1024.
  mamba:
    activation: elu
    conv_type: mamba
    d_conv: 4
    d_state: 32
    dropout_ff: 0.0
    embedding_dim: 1024
    expand: 2
    num_convs: 4
    width: 1024
  pt_mode: linear
  sin_phi_mode: linear
  trainable: all
# Sample-count, epoch and data-loading settings.
# `ntest`, `ntrain` and `nvalid` are all null here (presumably "no limit on the
# number of samples" -- TODO confirm against the consumer).
ntest: null
ntrain: null
num_epochs: 100
num_workers: 4
nvalid: null
# Presumably an early-stopping patience measured in epochs -- TODO confirm.
patience: 20
prefetch_factor: 50
ray_train: false
# Hyperparameter-tuning settings. `sched` is `asha` and `search_alg` is
# `hyperopt`, matching the names of two of the sub-sections below; the
# `hyperband` and `nevergrad` sub-sections are also present (presumably unused
# with the current selection -- TODO confirm).
raytune:
  asha:
    brackets: 1
    grace_period: 10
    max_t: 200
    reduction_factor: 4
  # Metric name and direction: `val_loss`, `min`.
  default_metric: val_loss
  default_mode: min
  # Same `max_t` / `reduction_factor` values as the `asha` sub-section.
  hyperband:
    max_t: 200
    reduction_factor: 4
  hyperopt:
    n_random_steps: 10
  local_dir: null
  nevergrad:
    n_random_steps: 10
  sched: asha
  search_alg: hyperopt
# Dataset selection for testing, training and validation.
# Version identifiers are quoted so they always load as strings; an unquoted
# two-component version (for example 1.10) would otherwise be read as a float.
sort_data: true
# Test samples. `cms_pf_ttbar` is pinned to 1.7.1; the other four samples are
# pinned to 1.7.0.
test_dataset:
  cms_pf_qcd:
    version: '1.7.0'
  cms_pf_qcd_high_pt:
    version: '1.7.0'
  cms_pf_sms_t1tttt:
    version: '1.7.0'
  cms_pf_ttbar:
    version: '1.7.1'
  cms_pf_ztt:
    version: '1.7.0'
# NOTE(review): this empty list sits next to the similarly named
# `test_dataset` mapping above; confirm which of the two keys the consumer
# reads.
test_datasets: []
train: true
# Training data: a single sample, `cms_pf_ttbar` at version 1.7.1, with
# batch_size 1.
train_dataset:
  cms:
    physical:
      batch_size: 1
      samples:
        cms_pf_ttbar:
          version: '1.7.1'
val_freq: null
# Validation data: lists the same sample, version and batch_size as
# `train_dataset` (presumably split into train/valid portions downstream --
# TODO confirm).
valid_dataset:
  cms:
    physical:
      batch_size: 1
      samples:
        cms_pf_ttbar:
          version: '1.7.1'