backend: pytorch | |
checkpoint_freq: null | |
comet: false | |
comet_name: particleflow-pt | |
comet_offline: false | |
comet_step_freq: 100 | |
config: parameters/pytorch/pyg-clic.yaml | |
conv_type: attention | |
data_dir: /scratch/persistent/joosep/tensorflow_datasets | |
dataset: clic | |
dtype: bfloat16 | |
gpu_batch_multiplier: 100 | |
gpus: 1 | |
load: experiments/pyg-clic_20241001_215132_345408/checkpoints/checkpoint-26-2.004527.pth | |
lr: 0.0001 | |
lr_schedule: cosinedecay | |
lr_schedule_config: | |
onecycle: | |
pct_start: 0.3 | |
make_plots: true | |
model: | |
attention: | |
activation: gelu | |
attention_type: math | |
conv_type: attention | |
dropout_conv_id_ff: 0.0 | |
dropout_conv_id_mha: 0.0 | |
dropout_conv_reg_ff: 0.1 | |
dropout_conv_reg_mha: 0.1 | |
dropout_ff: 0.1 | |
head_dim: 32 | |
num_convs: 4 | |
num_heads: 32 | |
use_pre_layernorm: true | |
cos_phi_mode: linear | |
energy_mode: direct-elemtype-split | |
eta_mode: linear | |
gnn_lsh: | |
activation: elu | |
bin_size: 32 | |
conv_type: gnn_lsh | |
distance_dim: 128 | |
embedding_dim: 512 | |
ffn_dist_hidden_dim: 128 | |
ffn_dist_num_layers: 2 | |
layernorm: true | |
max_num_bins: 200 | |
num_convs: 8 | |
num_node_messages: 2 | |
width: 512 | |
input_encoding: split | |
learned_representation_mode: last | |
mamba: | |
activation: elu | |
conv_type: mamba | |
d_conv: 4 | |
d_state: 16 | |
dropout: 0.0 | |
embedding_dim: 128 | |
expand: 2 | |
num_convs: 2 | |
num_heads: 2 | |
width: 128 | |
pt_mode: direct-elemtype-split | |
sin_phi_mode: linear | |
trainable: all | |
ntest: null | |
ntrain: null | |
num_epochs: 100 | |
num_workers: 8 | |
nvalid: null | |
patience: 20 | |
prefetch_factor: 10 | |
ray_train: false | |
raytune: | |
asha: | |
brackets: 1 | |
grace_period: 10 | |
max_t: 200 | |
reduction_factor: 4 | |
default_metric: val_loss | |
default_mode: min | |
hyperband: | |
max_t: 200 | |
reduction_factor: 4 | |
hyperopt: | |
n_random_steps: 10 | |
local_dir: null | |
nevergrad: | |
n_random_steps: 10 | |
sched: null | |
search_alg: null | |
save_attention: true | |
sort_data: false | |
test: true | |
test_dataset: | |
clic_edm_qq_pf: | |
version: 2.2.0 | |
clic_edm_ttbar_pf: | |
version: 2.2.0 | |
clic_edm_ww_fullhad_pf: | |
version: 2.2.0 | |
test_datasets: [] | |
train_dataset: | |
clic: | |
physical: | |
batch_size: 1 | |
samples: | |
clic_edm_qq_pf: | |
version: 2.2.0 | |
clic_edm_ttbar_pf: | |
version: 2.2.0 | |
clic_edm_ww_fullhad_pf: | |
version: 2.2.0 | |
val_freq: null | |
valid_dataset: | |
clic: | |
physical: | |
batch_size: 1 | |
samples: | |
clic_edm_qq_pf: | |
version: 2.2.0 | |
clic_edm_ttbar_pf: | |
version: 2.2.0 | |
clic_edm_ww_fullhad_pf: | |
version: 2.2.0 | |