---
# Training configuration (backend: pytorch, dataset: clic).
#
# NOTE(review): this file was rebuilt from a copy whose line breaks and
# indentation had been lost. Nesting was inferred from the alphabetical key
# ordering visible at every level; all keys, values and their order are
# unchanged. Confirm the structure against the consuming code's schema.

backend: pytorch
checkpoint_freq: null
comet: false
comet_name: particleflow-pt
comet_offline: false
comet_step_freq: 100
config: parameters/pytorch/pyg-clic.yaml
conv_type: attention
data_dir: /scratch/persistent/joosep/tensorflow_datasets
dataset: clic
dtype: bfloat16
gpu_batch_multiplier: 100
gpus: 1
load: experiments/pyg-clic_20241001_215132_345408/checkpoints/checkpoint-26-2.004527.pth
lr: 0.0001
lr_schedule: cosinedecay

# Only `onecycle` options are present here while lr_schedule is `cosinedecay`.
# NOTE(review): presumably unused for this run - confirm.
lr_schedule_config:
  onecycle:
    pct_start: 0.3

make_plots: true

# Model settings: one sub-mapping per conv type (attention, gnn_lsh, mamba)
# next to scalar keys shared at the model level.
# NOTE(review): top-level conv_type is `attention`; presumably only that
# sub-mapping is read - confirm.
model:
  attention:
    activation: gelu
    attention_type: math
    conv_type: attention
    dropout_conv_id_ff: 0.0
    dropout_conv_id_mha: 0.0
    dropout_conv_reg_ff: 0.1
    dropout_conv_reg_mha: 0.1
    dropout_ff: 0.1
    head_dim: 32
    num_convs: 4
    num_heads: 32
    use_pre_layernorm: true
  cos_phi_mode: linear
  energy_mode: direct-elemtype-split
  eta_mode: linear
  gnn_lsh:
    activation: elu
    bin_size: 32
    conv_type: gnn_lsh
    distance_dim: 128
    embedding_dim: 512
    ffn_dist_hidden_dim: 128
    ffn_dist_num_layers: 2
    layernorm: true
    max_num_bins: 200
    num_convs: 8
    num_node_messages: 2
    width: 512
  input_encoding: split
  learned_representation_mode: last
  mamba:
    activation: elu
    conv_type: mamba
    d_conv: 4
    d_state: 16
    dropout: 0.0
    embedding_dim: 128
    expand: 2
    num_convs: 2
    num_heads: 2
    width: 128
  pt_mode: direct-elemtype-split
  sin_phi_mode: linear
  trainable: all

ntest: null
ntrain: null
num_epochs: 100
num_workers: 8
nvalid: null
patience: 20
prefetch_factor: 10
ray_train: false

# Hyperparameter-search settings; `sched` and `search_alg` are both null here.
raytune:
  asha:
    brackets: 1
    grace_period: 10
    max_t: 200
    reduction_factor: 4
  default_metric: val_loss
  default_mode: min
  hyperband:
    max_t: 200
    reduction_factor: 4
  hyperopt:
    n_random_steps: 10
  local_dir: null
  nevergrad:
    n_random_steps: 10
  sched: null
  search_alg: null

save_attention: true
sort_data: false
test: true

# NOTE(review): both `test_dataset` (mapping) and `test_datasets` (empty list)
# are present - confirm which one the consumer reads.
# Version values are quoted so they always load as strings.
test_dataset:
  clic_edm_qq_pf:
    version: "2.2.0"
  clic_edm_ttbar_pf:
    version: "2.2.0"
  clic_edm_ww_fullhad_pf:
    version: "2.2.0"
test_datasets: []

train_dataset:
  clic:
    physical:
      batch_size: 1
      samples:
        clic_edm_qq_pf:
          version: "2.2.0"
        clic_edm_ttbar_pf:
          version: "2.2.0"
        clic_edm_ww_fullhad_pf:
          version: "2.2.0"

val_freq: null

# Same sample list and batch size as train_dataset.
valid_dataset:
  clic:
    physical:
      batch_size: 1
      samples:
        clic_edm_qq_pf:
          version: "2.2.0"
        clic_edm_ttbar_pf:
          version: "2.2.0"
        clic_edm_ww_fullhad_pf:
          version: "2.2.0"