---
# Training configuration (dataset: clic, conv_type: attention).
#
# NOTE(review): this file was restored from a copy in which every line was
# wrapped in table-cell pipes ("|") and all indentation had been stripped.
# The nesting below was reconstructed from the (alphabetical) key order and
# from the key names; confirm it against the schema the consumer expects.
# Keys are kept in their original order.

checkpoint_freq: 1
comet: true
comet_name: particleflow-pt
comet_offline: false
comet_step_freq: 100
conv_type: attention
data_dir: /scratch/persistent/joosep/tensorflow_datasets
dataset: clic
dtype: float32
enabled_test_datasets:
  - clic_edm_qq_pf
gpu_batch_multiplier: 256
gpus: 1
load: experiments/pyg-clic_20250106_193536_269746/checkpoints/checkpoint-01-2.431203.pth
lr: 0.0001
lr_schedule: cosinedecay

# NOTE(review): only "onecycle" options are present here although
# lr_schedule is "cosinedecay"; presumably unused for this run — confirm.
lr_schedule_config:
  onecycle:
    pct_start: 0.3

make_plots: null

# One sub-section per backbone type (attention, gnn_lsh, mamba); each repeats
# its own conv_type. The top-level conv_type above is "attention".
model:
  attention:
    activation: relu
    attention_type: math
    conv_type: attention
    dropout_conv_id_ff: 0.0
    dropout_conv_id_mha: 0.0
    dropout_conv_reg_ff: 0.0
    dropout_conv_reg_mha: 0.0
    dropout_ff: 0.0
    head_dim: 32
    num_convs: 3
    num_heads: 32
    use_pre_layernorm: true
  cos_phi_mode: linear
  energy_mode: direct-elemtype-split
  eta_mode: linear
  gnn_lsh:
    activation: elu
    bin_size: 32
    conv_type: gnn_lsh
    distance_dim: 128
    embedding_dim: 512
    ffn_dist_hidden_dim: 128
    ffn_dist_num_layers: 2
    layernorm: true
    max_num_bins: 200
    num_convs: 8
    num_node_messages: 2
    width: 512
  input_encoding: split
  learned_representation_mode: last
  mamba:
    activation: elu
    conv_type: mamba
    d_conv: 4
    d_state: 16
    dropout: 0.0
    embedding_dim: 128
    expand: 2
    num_convs: 2
    num_heads: 2
    width: 128
  pt_mode: direct-elemtype-split
  sin_phi_mode: linear
  trainable: all

ntest: 2000
ntrain: null
num_epochs: 10
num_workers: 8
nvalid: null
patience: 20
prefetch_factor: 100

# NOTE(review): sched and search_alg are placed directly under raytune
# (not under nevergrad); key order alone does not decide this — confirm.
raytune:
  asha:
    brackets: 1
    grace_period: 10
    max_t: 200
    reduction_factor: 4
  default_metric: val_loss
  default_mode: min
  hyperband:
    max_t: 200
    reduction_factor: 4
  hyperopt:
    n_random_steps: 10
  local_dir: null
  nevergrad:
    n_random_steps: 10
  sched: null
  search_alg: null

save_attention: true
sort_data: false
test: null

# Version strings are quoted so they can never be re-typed as numbers.
test_dataset:
  clic_edm_qq_pf:
    splits:
      - 1
      - 2
      - 3
      - 4
      - 5
      - 6
      - 7
      - 8
      - 9
      - 10
    version: '2.5.0'
  clic_edm_ttbar_pf:
    splits:
      - 1
      - 2
      - 3
      - 4
      - 5
      - 6
      - 7
      - 8
      - 9
      - 10
    version: '2.5.0'
  clic_edm_ww_fullhad_pf:
    splits:
      - 1
      - 2
      - 3
      - 4
      - 5
      - 6
      - 7
      - 8
      - 9
      - 10
    version: '2.5.0'

train: true

train_dataset:
  clic:
    physical:
      batch_size: 1
      samples:
        clic_edm_qq_pf:
          splits:
            - 1
            - 2
            - 3
            - 4
            - 5
            - 6
            - 7
            - 8
            - 9
            - 10
          version: '2.5.0'
        clic_edm_ttbar_pf:
          splits:
            - 1
            - 2
            - 3
            - 4
            - 5
            - 6
            - 7
            - 8
            - 9
            - 10
          version: '2.5.0'
        clic_edm_ww_fullhad_pf:
          splits:
            - 1
            - 2
            - 3
            - 4
            - 5
            - 6
            - 7
            - 8
            - 9
            - 10
          version: '2.5.0'

val_freq: null

valid_dataset:
  clic:
    physical:
      batch_size: 1
      samples:
        clic_edm_qq_pf:
          splits:
            - 1
            - 2
            - 3
            - 4
            - 5
            - 6
            - 7
            - 8
            - 9
            - 10
          version: '2.5.0'
        clic_edm_ttbar_pf:
          splits:
            - 1
            - 2
            - 3
            - 4
            - 5
            - 6
            - 7
            - 8
            - 9
            - 10
          version: '2.5.0'
        clic_edm_ww_fullhad_pf:
          splits:
            - 1
            - 2
            - 3
            - 4
            - 5
            - 6
            - 7
            - 8
            - 9
            - 10
          version: '2.5.0'