| backend: pytorch | |
| checkpoint_freq: 1 | |
| comet: false | |
| comet_name: particleflow-pt | |
| comet_offline: false | |
| comet_step_freq: 100 | |
| config: parameters/pytorch/pyg-clic.yaml | |
| conv_type: attention | |
| data_dir: /scratch/project_465000301/tensorflow_datasets | |
| dataset: clic | |
| dtype: bfloat16 | |
| gpu_batch_multiplier: 128 | |
| gpus: 8 | |
| load: experiments/pyg-clic_20241011_102451_167094/checkpoints/checkpoint-22-1.913142.pth | |
| lr: 0.0001 | |
| lr_schedule: cosinedecay | |
| lr_schedule_config: | |
| onecycle: | |
| pct_start: 0.3 | |
| model: | |
| attention: | |
| activation: gelu | |
| attention_type: math | |
| conv_type: attention | |
| dropout_conv_id_ff: 0.0 | |
| dropout_conv_id_mha: 0.0 | |
| dropout_conv_reg_ff: 0.1 | |
| dropout_conv_reg_mha: 0.1 | |
| dropout_ff: 0.1 | |
| head_dim: 32 | |
| num_convs: 6 | |
| num_heads: 32 | |
| use_pre_layernorm: true | |
| cos_phi_mode: linear | |
| energy_mode: direct-elemtype-split | |
| eta_mode: linear | |
| gnn_lsh: | |
| activation: elu | |
| bin_size: 32 | |
| conv_type: gnn_lsh | |
| distance_dim: 128 | |
| embedding_dim: 512 | |
| ffn_dist_hidden_dim: 128 | |
| ffn_dist_num_layers: 2 | |
| layernorm: true | |
| max_num_bins: 200 | |
| num_convs: 8 | |
| num_node_messages: 2 | |
| width: 512 | |
| input_encoding: split | |
| learned_representation_mode: last | |
| mamba: | |
| activation: elu | |
| conv_type: mamba | |
| d_conv: 4 | |
| d_state: 16 | |
| dropout: 0.0 | |
| embedding_dim: 128 | |
| expand: 2 | |
| num_convs: 2 | |
| num_heads: 2 | |
| width: 128 | |
| pt_mode: direct-elemtype-split | |
| sin_phi_mode: linear | |
| trainable: all | |
| ntest: null | |
| ntrain: null | |
| num_epochs: 30 | |
| num_workers: 8 | |
| nvalid: null | |
| patience: 20 | |
| prefetch_factor: 100 | |
| ray_train: false | |
| raytune: | |
| asha: | |
| brackets: 1 | |
| grace_period: 10 | |
| max_t: 200 | |
| reduction_factor: 4 | |
| default_metric: val_loss | |
| default_mode: min | |
| hyperband: | |
| max_t: 200 | |
| reduction_factor: 4 | |
| hyperopt: | |
| n_random_steps: 10 | |
| local_dir: null | |
| nevergrad: | |
| n_random_steps: 10 | |
| sched: null | |
| search_alg: null | |
| save_attention: true | |
| sort_data: false | |
| test_dataset: | |
| clic_edm_qq_pf: | |
| version: 2.3.0 | |
| clic_edm_ttbar_pf: | |
| version: 2.3.0 | |
| clic_edm_ww_fullhad_pf: | |
| version: 2.3.0 | |
| test_datasets: [] | |
| train: true | |
| train_dataset: | |
| clic: | |
| physical: | |
| batch_size: 1 | |
| samples: | |
| clic_edm_qq_pf: | |
| version: 2.3.0 | |
| clic_edm_ttbar_pf: | |
| version: 2.3.0 | |
| clic_edm_ww_fullhad_pf: | |
| version: 2.3.0 | |
| val_freq: null | |
| valid_dataset: | |
| clic: | |
| physical: | |
| batch_size: 1 | |
| samples: | |
| clic_edm_qq_pf: | |
| version: 2.3.0 | |
| clic_edm_ttbar_pf: | |
| version: 2.3.0 | |
| clic_edm_ww_fullhad_pf: | |
| version: 2.3.0 | |