---
# Resolved configuration for one training run (backend: pytorch, dataset: cld).
# Keys are in alphabetical order at every nesting level.
# NOTE(review): looks like a serialized dump of the file named in `config`
# plus run-time overrides -- confirm with whatever tool writes this file.

# NOTE(review): `attention_type` also appears under `model.attention`; both
# are `math` here. Confirm which one the consumer actually reads.
attention_type: math
backend: pytorch
checkpoint_freq: 1

comet: false
comet_name: particleflow-pt
comet_offline: false
comet_step_freq: 100

config: parameters/pytorch/pyg-cld.yaml
# Matches the `model.attention` sub-section below.
conv_type: attention
data_dir: tensorflow_datasets
dataset: cld
dtype: float32
gpu_batch_multiplier: 10
gpus: 2
load: null

lr: 0.0001
lr_schedule: constant
# Per-schedule settings. Only `onecycle` has an entry, while `lr_schedule`
# is `constant`; presumably this entry is unused for this run -- TODO confirm.
lr_schedule_config:
  onecycle:
    pct_start: 0.3

# Model settings. The three nested mappings (`attention`, `gnn_lsh`, `mamba`)
# each carry their own `conv_type` equal to their key; presumably the
# top-level `conv_type` selects which one is used -- TODO confirm.
model:
  attention:
    activation: relu
    attention_type: math
    conv_type: attention
    dropout_conv_id_ff: 0.0
    dropout_conv_id_mha: 0.0
    dropout_conv_reg_ff: 0.0
    dropout_conv_reg_mha: 0.0
    dropout_ff: 0.0
    head_dim: 16
    num_convs: 3
    num_heads: 32
  cos_phi_mode: linear
  energy_mode: linear
  eta_mode: linear
  gnn_lsh:
    activation: elu
    bin_size: 640
    conv_type: gnn_lsh
    distance_dim: 128
    dropout: 0.0
    embedding_dim: 512
    ffn_dist_hidden_dim: 128
    ffn_dist_num_layers: 2
    layernorm: true
    max_num_bins: 200
    num_convs: 3
    num_node_messages: 2
    width: 512
  input_encoding: joint
  learned_representation_mode: last
  mamba:
    activation: elu
    conv_type: mamba
    d_conv: 4
    d_state: 16
    dropout: 0.0
    embedding_dim: 128
    expand: 2
    num_convs: 2
    num_heads: 2
    width: 128
  pt_mode: linear
  sin_phi_mode: linear
  trainable: all

# Sample counts; `ntest` is null while `ntrain` and `nvalid` are 1000.
ntest: null
ntrain: 1000
num_epochs: 100
num_workers: 2
nvalid: 1000
patience: 20
prefetch_factor: 2
# Ends with an underscore; presumably a suffix is appended by the consumer
# to form the experiment directory name -- TODO confirm.
prefix: /pfvol/experiments/Aug26_CLD_fromscratch_1k_

ray_train: false
# Hyperparameter-search settings. `sched` is `asha`, which matches the
# `asha` sub-section; `search_alg` and `local_dir` are unset (null).
raytune:
  asha:
    brackets: 1
    grace_period: 10
    max_t: 200
    reduction_factor: 4
  default_metric: val_loss
  default_mode: min
  hyperband:
    max_t: 200
    reduction_factor: 4
  hyperopt:
    n_random_steps: 10
  local_dir: null
  nevergrad:
    n_random_steps: 10
  sched: asha
  search_alg: null

sort_data: false

# NOTE(review): `test_dataset` maps sample names directly to a version,
# unlike `train_dataset` / `valid_dataset`, which nest samples under
# `cld.physical.samples` next to a `batch_size`. A separate, empty
# `test_datasets` list also exists -- confirm which key the consumer reads.
test_dataset:
  cld_edm_ttbar_pf:
    # Quoted so the version is unambiguously a string.
    version: '2.0.0'
test_datasets: []

train: true
train_dataset:
  cld:
    physical:
      batch_size: 1
      samples:
        cld_edm_ttbar_pf:
          version: '2.0.0'

val_freq: null
valid_dataset:
  cld:
    physical:
      batch_size: 1
      samples:
        cld_edm_ttbar_pf:
          version: '2.0.0'