Joosep Pata
committed on
Commit
·
fc1d937
1
Parent(s):
8d52f2c
added 2.6.0pre1
Browse files
- cms/v2.6.0pre1/pyg-cms_20250722_101813_274478/.gitattributes +6 -0
- cms/v2.6.0pre1/pyg-cms_20250722_101813_274478/checkpoints/checkpoint-10-3.812332.pth +3 -0
- cms/v2.6.0pre1/pyg-cms_20250722_101813_274478/checkpoints/mlpf_5M_attn2x3x256_bm12_relu_checkpoint10_8xmi250_fp32_fused_20250722.onnx +1 -0
- cms/v2.6.0pre1/pyg-cms_20250722_101813_274478/checkpoints/test_fp32_fused.onnx +3 -0
- cms/v2.6.0pre1/pyg-cms_20250722_101813_274478/checkpoints/test_fp32_unfused.onnx +3 -0
- cms/v2.6.0pre1/pyg-cms_20250722_101813_274478/history/epoch_1.json +1 -0
- cms/v2.6.0pre1/pyg-cms_20250722_101813_274478/history/epoch_10.json +1 -0
- cms/v2.6.0pre1/pyg-cms_20250722_101813_274478/history/epoch_2.json +1 -0
- cms/v2.6.0pre1/pyg-cms_20250722_101813_274478/history/epoch_3.json +1 -0
- cms/v2.6.0pre1/pyg-cms_20250722_101813_274478/history/epoch_4.json +1 -0
- cms/v2.6.0pre1/pyg-cms_20250722_101813_274478/history/epoch_5.json +1 -0
- cms/v2.6.0pre1/pyg-cms_20250722_101813_274478/history/epoch_6.json +1 -0
- cms/v2.6.0pre1/pyg-cms_20250722_101813_274478/history/epoch_7.json +1 -0
- cms/v2.6.0pre1/pyg-cms_20250722_101813_274478/history/epoch_8.json +1 -0
- cms/v2.6.0pre1/pyg-cms_20250722_101813_274478/history/epoch_9.json +1 -0
- cms/v2.6.0pre1/pyg-cms_20250722_101813_274478/hyperparameters.json +1 -0
- cms/v2.6.0pre1/pyg-cms_20250722_101813_274478/model_kwargs.pkl +3 -0
- cms/v2.6.0pre1/pyg-cms_20250722_101813_274478/runs/train/events.out.tfevents.1752995498.nid006475.109881.0 +3 -0
- cms/v2.6.0pre1/pyg-cms_20250722_101813_274478/runs/train/events.out.tfevents.1753086081.nid006574.78721.0 +3 -0
- cms/v2.6.0pre1/pyg-cms_20250722_101813_274478/runs/train/events.out.tfevents.1753168805.nid005223.61027.0 +3 -0
- cms/v2.6.0pre1/pyg-cms_20250722_101813_274478/runs/valid/events.out.tfevents.1752995498.nid006475.109881.1 +3 -0
- cms/v2.6.0pre1/pyg-cms_20250722_101813_274478/runs/valid/events.out.tfevents.1753086081.nid006574.78721.1 +3 -0
- cms/v2.6.0pre1/pyg-cms_20250722_101813_274478/runs/valid/events.out.tfevents.1753168805.nid005223.61027.1 +3 -0
- cms/v2.6.0pre1/pyg-cms_20250722_101813_274478/test-config.yaml +350 -0
- cms/v2.6.0pre1/pyg-cms_20250722_101813_274478/test.log +3 -0
- cms/v2.6.0pre1/pyg-cms_20250722_101813_274478/train-config.yaml +350 -0
- cms/v2.6.0pre1/pyg-cms_20250722_101813_274478/train.log +3 -0
cms/v2.6.0pre1/pyg-cms_20250722_101813_274478/.gitattributes
ADDED
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
plots_checkpoint*/** filter=lfs diff=lfs merge=lfs -text
|
2 |
+
preds_checkpoint*/** filter=lfs diff=lfs merge=lfs -text
|
3 |
+
runs/** filter=lfs diff=lfs merge=lfs -text
|
4 |
+
checkpoints/** filter=lfs diff=lfs merge=lfs -text
|
5 |
+
test.log filter=lfs diff=lfs merge=lfs -text
|
6 |
+
train.log filter=lfs diff=lfs merge=lfs -text
|
cms/v2.6.0pre1/pyg-cms_20250722_101813_274478/checkpoints/checkpoint-10-3.812332.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:110fcbe0fa3688f30413c470f1b32bc83e1ec6867f9ed4bc6b78890f46e4a779
|
3 |
+
size 61986481
|
cms/v2.6.0pre1/pyg-cms_20250722_101813_274478/checkpoints/mlpf_5M_attn2x3x256_bm12_relu_checkpoint10_8xmi250_fp32_fused_20250722.onnx
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
test_fp32_fused.onnx
|
cms/v2.6.0pre1/pyg-cms_20250722_101813_274478/checkpoints/test_fp32_fused.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bff46e3bc918bff466686e41f81530364f80a28af5a98e041d1bf726ea5c071a
|
3 |
+
size 20618493
|
cms/v2.6.0pre1/pyg-cms_20250722_101813_274478/checkpoints/test_fp32_unfused.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3e8316ae25aba290b9914b8167090927cb3888f15312d156575011869f748735
|
3 |
+
size 20683040
|
cms/v2.6.0pre1/pyg-cms_20250722_101813_274478/history/epoch_1.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"train": {"Regression_pt": 0.3307875779200771, "Regression_eta": 0.0011008226799534677, "Regression_sin_phi": 0.0005952758953016243, "Regression_cos_phi": 0.0005989178986433796, "Regression_energy": 0.3821685668532535, "Classification_binary": 3.248547763328382, "Classification": 0.04140520995461081, "ispu": 0.06480694103454951, "MET": 32.3271596403628, "Sliced_Wasserstein_Loss": 141.8395379704832, "Total": 4.070012522516828}, "valid": {"Regression_pt": 0.3268018078071672, "Regression_eta": 0.0012236929862029994, "Regression_sin_phi": 0.0006016330100570523, "Regression_cos_phi": 0.0006014759630066543, "Regression_energy": 0.3711106926372298, "Classification_binary": 3.4719263278583616, "Classification": 0.04142742135283348, "ispu": 0.0847156685231353, "MET": 37.31766833759954, "Sliced_Wasserstein_Loss": 156.67726109215016, "Total": 4.298407336550768}, "epoch_train_time": 20054.613397359848, "epoch_valid_time": 522.0448796749115, "epoch_total_time": 20576.658277511597, "epoch/cms_pf_qcd/jet_ratio/jet_ratio_target_to_pred_pt/med": 1.0948642752582765, "epoch/cms_pf_qcd/jet_ratio/jet_ratio_target_to_pred_pt/iqr": 0.5352987897077894, "epoch/cms_pf_qcd/jet_ratio/jet_ratio_target_to_pred_pt/match_frac": 0.16369763171345816}
|
cms/v2.6.0pre1/pyg-cms_20250722_101813_274478/history/epoch_10.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"train": {"Regression_pt": 0.2945935354482034, "Regression_eta": 0.0010225383844258975, "Regression_sin_phi": 0.0005781889014534465, "Regression_cos_phi": 0.0005797894395897505, "Regression_energy": 0.34112146273464905, "Classification_binary": 3.0700406685522865, "Classification": 0.039839293544385805, "ispu": 0.05623641537153754, "MET": 22.359190816294284, "Sliced_Wasserstein_Loss": 135.51501121891098, "Total": 3.804006316562905}, "valid": {"Regression_pt": 0.2862994440315255, "Regression_eta": 0.001033568545006241, "Regression_sin_phi": 0.0005867550397488851, "Regression_cos_phi": 0.0005881994521929814, "Regression_energy": 0.333562753306314, "Classification_binary": 3.08993290715657, "Classification": 0.0398360199217639, "ispu": 0.060491833128077446, "MET": 22.22408720847554, "Sliced_Wasserstein_Loss": 136.78769375711036, "Total": 3.8123322401166098}, "epoch_train_time": 19872.13973236084, "epoch_valid_time": 463.1235797405243, "epoch_total_time": 20335.263313293457, "epoch/cms_pf_qcd/jet_ratio/jet_ratio_target_to_pred_pt/med": 1.0302197649429803, "epoch/cms_pf_qcd/jet_ratio/jet_ratio_target_to_pred_pt/iqr": 0.383474815733057, "epoch/cms_pf_qcd/jet_ratio/jet_ratio_target_to_pred_pt/match_frac": 0.19645482712707218}
|
cms/v2.6.0pre1/pyg-cms_20250722_101813_274478/history/epoch_2.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"train": {"Regression_pt": 0.3079458973943684, "Regression_eta": 0.0010340496249247586, "Regression_sin_phi": 0.0005833114312029109, "Regression_cos_phi": 0.0005848920176153752, "Regression_energy": 0.35468723458782353, "Classification_binary": 3.154964664380748, "Classification": 0.040555948855937725, "ispu": 0.0599413340331985, "MET": 26.020664127927187, "Sliced_Wasserstein_Loss": 137.99379009575577, "Total": 3.9203067226558796}, "valid": {"Regression_pt": 0.30669377905245665, "Regression_eta": 0.001126315542184181, "Regression_sin_phi": 0.0005949170109355003, "Regression_cos_phi": 0.000597158389693641, "Regression_energy": 0.35285923668142066, "Classification_binary": 3.364243091847981, "Classification": 0.04147878306175119, "ispu": 0.08028483038198148, "MET": 28.145975540386804, "Sliced_Wasserstein_Loss": 146.79876813139933, "Total": 4.147878392971417}, "epoch_train_time": 19856.485914468765, "epoch_valid_time": 460.6217374801636, "epoch_total_time": 20317.107652902603, "epoch/cms_pf_qcd/jet_ratio/jet_ratio_target_to_pred_pt/med": 1.0729023270328226, "epoch/cms_pf_qcd/jet_ratio/jet_ratio_target_to_pred_pt/iqr": 0.4602440467878818, "epoch/cms_pf_qcd/jet_ratio/jet_ratio_target_to_pred_pt/match_frac": 0.180521111384561}
|
cms/v2.6.0pre1/pyg-cms_20250722_101813_274478/history/epoch_3.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"train": {"Regression_pt": 0.3045270182188794, "Regression_eta": 0.0010309290788728452, "Regression_sin_phi": 0.0005820336769976094, "Regression_cos_phi": 0.0005835714666610519, "Regression_energy": 0.35119206484254023, "Classification_binary": 3.1324693158834496, "Classification": 0.040351018250728836, "ispu": 0.05891611392009093, "MET": 25.34442846759157, "Sliced_Wasserstein_Loss": 137.38605694782416, "Total": 3.8896569245172707}, "valid": {"Regression_pt": 0.30029078148330846, "Regression_eta": 0.001092079759864677, "Regression_sin_phi": 0.0005932266530458973, "Regression_cos_phi": 0.000595279317667053, "Regression_energy": 0.3470300667928754, "Classification_binary": 3.23416057842719, "Classification": 0.04083564853776708, "ispu": 0.07730574710919724, "MET": 25.860210466439135, "Sliced_Wasserstein_Loss": 141.70434264789534, "Total": 4.001901741592008}, "epoch_train_time": 19534.897091150284, "epoch_valid_time": 465.58784461021423, "epoch_total_time": 20000.484936475754, "epoch/cms_pf_qcd/jet_ratio/jet_ratio_target_to_pred_pt/med": 1.0693435605624253, "epoch/cms_pf_qcd/jet_ratio/jet_ratio_target_to_pred_pt/iqr": 0.42782200050126884, "epoch/cms_pf_qcd/jet_ratio/jet_ratio_target_to_pred_pt/match_frac": 0.19049782607323829}
|
cms/v2.6.0pre1/pyg-cms_20250722_101813_274478/history/epoch_4.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"train": {"Regression_pt": 0.3025986444474291, "Regression_eta": 0.001029179595994523, "Regression_sin_phi": 0.0005812856983235086, "Regression_cos_phi": 0.0005828826801102461, "Regression_energy": 0.3492268728470752, "Classification_binary": 3.114506219780046, "Classification": 0.04019495357632415, "ispu": 0.05913604339945841, "MET": 24.570153746484216, "Sliced_Wasserstein_Loss": 136.89236165976678, "Total": 3.867858313845084}, "valid": {"Regression_pt": 0.29682375546608364, "Regression_eta": 0.0010816555923704944, "Regression_sin_phi": 0.0005919490522356435, "Regression_cos_phi": 0.0005935601406943676, "Regression_energy": 0.3437563882074801, "Classification_binary": 3.20154766824872, "Classification": 0.04039814312167813, "ispu": 0.07327430212999503, "MET": 26.365443241609785, "Sliced_Wasserstein_Loss": 141.56762834186577, "Total": 3.9580697503377418}, "epoch_train_time": 19348.155507326126, "epoch_valid_time": 474.4926815032959, "epoch_total_time": 19822.64818930626}
|
cms/v2.6.0pre1/pyg-cms_20250722_101813_274478/history/epoch_5.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"train": {"Regression_pt": 0.3008837114448693, "Regression_eta": 0.0010277300520220212, "Regression_sin_phi": 0.0005806082438696268, "Regression_cos_phi": 0.0005822392219471366, "Regression_energy": 0.34748910205258665, "Classification_binary": 3.1040650282052904, "Classification": 0.040099416766000776, "ispu": 0.058651585164965395, "MET": 24.15997416490219, "Sliced_Wasserstein_Loss": 136.58896122365135, "Total": 3.853378413077142}, "valid": {"Regression_pt": 0.29453597866227604, "Regression_eta": 0.0010673589538253072, "Regression_sin_phi": 0.0005911822611968265, "Regression_cos_phi": 0.0005926040252321002, "Regression_energy": 0.341474826018558, "Classification_binary": 3.1659934051478955, "Classification": 0.0402924990084391, "ispu": 0.07058737085405335, "MET": 24.798499271188852, "Sliced_Wasserstein_Loss": 140.04769269055745, "Total": 3.915133496871445}, "epoch_train_time": 20167.10527420044, "epoch_valid_time": 523.8193292617798, "epoch_total_time": 20690.92460513115, "epoch/cms_pf_qcd/jet_ratio/jet_ratio_target_to_pred_pt/med": 1.0586366443631134, "epoch/cms_pf_qcd/jet_ratio/jet_ratio_target_to_pred_pt/iqr": 0.41284306168634477, "epoch/cms_pf_qcd/jet_ratio/jet_ratio_target_to_pred_pt/match_frac": 0.1960951353261521}
|
cms/v2.6.0pre1/pyg-cms_20250722_101813_274478/history/epoch_6.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"train": {"Regression_pt": 0.29915671144684447, "Regression_eta": 0.0010262925634717788, "Regression_sin_phi": 0.0005799154790294753, "Regression_cos_phi": 0.0005815568247701284, "Regression_energy": 0.345743523202209, "Classification_binary": 3.095661214565623, "Classification": 0.040032978851710886, "ispu": 0.05820238277176232, "MET": 23.825565685933697, "Sliced_Wasserstein_Loss": 136.30262617324527, "Total": 3.8409852692538635}, "valid": {"Regression_pt": 0.2910126912851518, "Regression_eta": 0.0010557338781866739, "Regression_sin_phi": 0.0005897295759806454, "Regression_cos_phi": 0.0005914229174929674, "Regression_energy": 0.3379818999862237, "Classification_binary": 3.1455622511376564, "Classification": 0.040132090771428826, "ispu": 0.06920997003375196, "MET": 23.448378839590443, "Sliced_Wasserstein_Loss": 139.2403210324232, "Total": 3.886136589874858}, "epoch_train_time": 19725.950634002686, "epoch_valid_time": 466.2866563796997, "epoch_total_time": 20192.237290859222, "epoch/cms_pf_qcd/jet_ratio/jet_ratio_target_to_pred_pt/med": 1.044025788854369, "epoch/cms_pf_qcd/jet_ratio/jet_ratio_target_to_pred_pt/iqr": 0.3949686501767835, "epoch/cms_pf_qcd/jet_ratio/jet_ratio_target_to_pred_pt/match_frac": 0.19607620417873528}
|
cms/v2.6.0pre1/pyg-cms_20250722_101813_274478/history/epoch_7.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"train": {"Regression_pt": 0.2979130702288026, "Regression_eta": 0.0010253341574021357, "Regression_sin_phi": 0.0005795831110377765, "Regression_cos_phi": 0.0005812216237541985, "Regression_energy": 0.34448935808275133, "Classification_binary": 3.086900637581772, "Classification": 0.039961001229784236, "ispu": 0.05761859557331993, "MET": 23.28802578769396, "Sliced_Wasserstein_Loss": 136.08633821066272, "Total": 3.8290639418670795}, "valid": {"Regression_pt": 0.289853561453445, "Regression_eta": 0.0010497221496460517, "Regression_sin_phi": 0.0005894578628843826, "Regression_cos_phi": 0.0005905249148641159, "Regression_energy": 0.33739359468323377, "Classification_binary": 3.125193868209613, "Classification": 0.040057480674283635, "ispu": 0.06435159503125222, "MET": 24.003648499715585, "Sliced_Wasserstein_Loss": 137.53261874288964, "Total": 3.859078642722554}, "epoch_train_time": 19885.2097158432, "epoch_valid_time": 464.0820517539978, "epoch_total_time": 20349.291768312454, "epoch/cms_pf_qcd/jet_ratio/jet_ratio_target_to_pred_pt/med": 1.0340979732246063, "epoch/cms_pf_qcd/jet_ratio/jet_ratio_target_to_pred_pt/iqr": 0.39475386966068204, "epoch/cms_pf_qcd/jet_ratio/jet_ratio_target_to_pred_pt/match_frac": 0.19663782821876835}
|
cms/v2.6.0pre1/pyg-cms_20250722_101813_274478/history/epoch_8.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"train": {"Regression_pt": 0.29638917226953826, "Regression_eta": 0.001024053148232824, "Regression_sin_phi": 0.0005789030646681088, "Regression_cos_phi": 0.0005805300644562729, "Regression_energy": 0.3429501526305186, "Classification_binary": 3.0810462622064914, "Classification": 0.039926486073637926, "ispu": 0.05706106026239018, "MET": 22.824935609771515, "Sliced_Wasserstein_Loss": 135.85837309989572, "Total": 3.81955280393768}, "valid": {"Regression_pt": 0.28767507854717717, "Regression_eta": 0.0010383879772225338, "Regression_sin_phi": 0.0005877603849860181, "Regression_cos_phi": 0.0005892623677866722, "Regression_energy": 0.3350746059309229, "Classification_binary": 3.118374040102389, "Classification": 0.04010707607855162, "ispu": 0.06560502903995796, "MET": 22.4821041311149, "Sliced_Wasserstein_Loss": 137.08809726962457, "Total": 3.849050545719568}, "epoch_train_time": 19759.637872457504, "epoch_valid_time": 486.9554784297943, "epoch_total_time": 20246.593351602554, "epoch/cms_pf_qcd/jet_ratio/jet_ratio_target_to_pred_pt/med": 1.0254536889917758, "epoch/cms_pf_qcd/jet_ratio/jet_ratio_target_to_pred_pt/iqr": 0.3853243023961308, "epoch/cms_pf_qcd/jet_ratio/jet_ratio_target_to_pred_pt/match_frac": 0.19533788942947833}
|
cms/v2.6.0pre1/pyg-cms_20250722_101813_274478/history/epoch_9.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"train": {"Regression_pt": 0.29520074295657805, "Regression_eta": 0.0010230615897519667, "Regression_sin_phi": 0.0005784931803112804, "Regression_cos_phi": 0.0005800879318448998, "Regression_energy": 0.34173996569146414, "Classification_binary": 3.074905982365768, "Classification": 0.03988037070797649, "ispu": 0.056557402080189535, "MET": 22.240485652434977, "Sliced_Wasserstein_Loss": 135.66468097209494, "Total": 3.8104636096451032}, "valid": {"Regression_pt": 0.2866791604728829, "Regression_eta": 0.0010337590900026219, "Regression_sin_phi": 0.0005868364112775887, "Regression_cos_phi": 0.0005883360885515961, "Regression_energy": 0.33379224271633245, "Classification_binary": 3.0966746880332763, "Classification": 0.03988657876493174, "ispu": 0.060137621778676945, "MET": 22.687517775881684, "Sliced_Wasserstein_Loss": 136.82399210750853, "Total": 3.8193806549523606}, "epoch_train_time": 20148.605546474457, "epoch_valid_time": 495.0250635147095, "epoch_total_time": 20643.63061094284, "epoch/cms_pf_qcd/jet_ratio/jet_ratio_target_to_pred_pt/med": 1.029867311652949, "epoch/cms_pf_qcd/jet_ratio/jet_ratio_target_to_pred_pt/iqr": 0.3849996061325255, "epoch/cms_pf_qcd/jet_ratio/jet_ratio_target_to_pred_pt/match_frac": 0.19766642056175024}
|
cms/v2.6.0pre1/pyg-cms_20250722_101813_274478/hyperparameters.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"num_mlpf_params": 5133603, "train": true, "test": null, "make_plots": null, "comet": false, "save_attention": false, "dataset": "cms", "sort_data": true, "data_dir": "/scratch/project_465001293/joosep/tensorflow_datasets", "gpus": 8, "gpu_batch_multiplier": 12, "load": "experiments/pyg-cms_20250721_111927_308632/checkpoints/checkpoint-08-3.849051.pth", "finetune": null, "num_epochs": 10, "patience": 20, "lr": 0.002, "lr_schedule": "cosinedecay", "conv_type": "attention", "ntrain": null, "ntest": 1000, "nvalid": null, "num_workers": 4, "prefetch_factor": 10, "checkpoint_freq": 1, "comet_name": "particleflow-pt", "comet_offline": false, "comet_step_freq": 10, "dtype": "bfloat16", "val_freq": null, "pad_to_multiple": 256, "model": {"trainable": "all", "learned_representation_mode": "last", "input_encoding": "split", "pt_mode": "direct-elemtype-split", "eta_mode": "linear", "sin_phi_mode": "linear", "cos_phi_mode": "linear", "energy_mode": "direct-elemtype-split", "gnn_lsh": {"conv_type": "gnn_lsh", "embedding_dim": 512, "width": 512, "num_convs": 8, "dropout_ff": 0.0, "activation": "elu", "bin_size": 320, "max_num_bins": 200, "distance_dim": 128, "layernorm": true, "num_node_messages": 2, "ffn_dist_hidden_dim": 128, "ffn_dist_num_layers": 2}, "attention": {"conv_type": "attention", "num_convs": 3, "dropout_ff": 0.0, "dropout_conv_id_mha": 0.0, "dropout_conv_id_ff": 0.0, "dropout_conv_reg_mha": 0.0, "dropout_conv_reg_ff": 0.0, "activation": "relu", "head_dim": 16, "num_heads": 16, "attention_type": "flash", "use_pre_layernorm": true}, "mamba": {"conv_type": "mamba", "embedding_dim": 1024, "width": 1024, "num_convs": 4, "dropout_ff": 0.0, "activation": "elu", "d_state": 32, "d_conv": 4, "expand": 2}}, "lr_schedule_config": {"onecycle": {"pct_start": 0.3}}, "raytune": {"local_dir": null, "sched": "asha", "search_alg": "hyperopt", "default_metric": "val_loss", "default_mode": "min", "asha": {"max_t": 200, "reduction_factor": 4, "brackets": 1, "grace_period": 10}, 
"hyperband": {"max_t": 200, "reduction_factor": 4}, "hyperopt": {"n_random_steps": 10}, "nevergrad": {"n_random_steps": 10}}, "train_dataset": {"cms": {"physical_pu": {"batch_size": 1, "samples": {"cms_pf_ttbar": {"version": "2.7.1", "splits": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10]}, "cms_pf_qcd": {"version": "2.7.1", "splits": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10]}, "cms_pf_ztt": {"version": "2.7.1", "splits": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10]}}}, "physical_nopu": {"batch_size": 8, "samples": {"cms_pf_ttbar_nopu": {"version": "2.7.1", "splits": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10]}, "cms_pf_qcd_nopu": {"version": "2.7.1", "splits": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10]}, "cms_pf_ztt_nopu": {"version": "2.7.1", "splits": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10]}}}}}, "valid_dataset": {"cms": {"physical_pu": {"batch_size": 1, "samples": {"cms_pf_ttbar": {"version": "2.7.1", "splits": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10]}, "cms_pf_qcd": {"version": "2.7.1", "splits": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10]}, "cms_pf_ztt": {"version": "2.7.1", "splits": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10]}}}, "physical_nopu": {"batch_size": 8, "samples": {"cms_pf_ttbar_nopu": {"version": "2.7.1", "splits": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10]}, "cms_pf_qcd_nopu": {"version": "2.7.1", "splits": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10]}, "cms_pf_ztt_nopu": {"version": "2.7.1", "splits": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10]}}}}}, "test_dataset": {"cms_pf_ttbar": {"version": "2.7.1", "splits": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10]}, "cms_pf_qcd": {"version": "2.7.1", "splits": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10]}, "cms_pf_ztt": {"version": "2.7.1", "splits": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10]}, "cms_pf_ttbar_nopu": {"version": "2.7.1", "splits": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10]}, "cms_pf_qcd_nopu": {"version": "2.7.1", "splits": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10]}, "cms_pf_ztt_nopu": {"version": "2.7.1", "splits": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10]}}, "enabled_test_datasets": ["cms_pf_qcd"], "start_epoch": null}
|
cms/v2.6.0pre1/pyg-cms_20250722_101813_274478/model_kwargs.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6e67fcae0627f6e53393e8e0fa2949bc8a5b1c1c58dfe79969dffa548562f600
|
3 |
+
size 565
|
cms/v2.6.0pre1/pyg-cms_20250722_101813_274478/runs/train/events.out.tfevents.1752995498.nid006475.109881.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:afcffb97de1476a19daf8630fd219d7b93801e971b7ccbb4304c95b7cae97cc8
|
3 |
+
size 638382
|
cms/v2.6.0pre1/pyg-cms_20250722_101813_274478/runs/train/events.out.tfevents.1753086081.nid006574.78721.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:826393d4a8ce579b343679d22fb6313860379ae650dda31d00df64d4b1092c72
|
3 |
+
size 640538
|
cms/v2.6.0pre1/pyg-cms_20250722_101813_274478/runs/train/events.out.tfevents.1753168805.nid005223.61027.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0af92882e8bbf9825eafe6a0ed47dc46be5f887b66691bcbc3d8150896275184
|
3 |
+
size 380747
|
cms/v2.6.0pre1/pyg-cms_20250722_101813_274478/runs/valid/events.out.tfevents.1752995498.nid006475.109881.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7a5cec49826a87f0f291bd04475bf0ff3dd4d64f622e770389a7343b35904b77
|
3 |
+
size 5846251
|
cms/v2.6.0pre1/pyg-cms_20250722_101813_274478/runs/valid/events.out.tfevents.1753086081.nid006574.78721.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:952b20f3fc897398122758db2fc7b8eae1a48350402fc4542ba2bb2c62448038
|
3 |
+
size 5872263
|
cms/v2.6.0pre1/pyg-cms_20250722_101813_274478/runs/valid/events.out.tfevents.1753168805.nid005223.61027.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:38131e617abc29ec34d51545114e06383608e0941018c335d1a70c5ef5486000
|
3 |
+
size 2767234
|
cms/v2.6.0pre1/pyg-cms_20250722_101813_274478/test-config.yaml
ADDED
@@ -0,0 +1,350 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
checkpoint_freq: 1
|
2 |
+
comet: false
|
3 |
+
comet_name: particleflow-pt
|
4 |
+
comet_offline: false
|
5 |
+
comet_step_freq: 10
|
6 |
+
conv_type: attention
|
7 |
+
data_dir: /scratch/persistent/joosep/tensorflow_datasets
|
8 |
+
dataset: cms
|
9 |
+
dtype: bfloat16
|
10 |
+
enabled_test_datasets:
|
11 |
+
- cms_pf_ttbar
|
12 |
+
finetune: null
|
13 |
+
gpu_batch_multiplier: 2
|
14 |
+
gpus: 1
|
15 |
+
load: experiments/pyg-cms_20250722_101813_274478/checkpoints/checkpoint-10-3.812332.pth
|
16 |
+
lr: 0.0002
|
17 |
+
lr_schedule: cosinedecay
|
18 |
+
lr_schedule_config:
|
19 |
+
onecycle:
|
20 |
+
pct_start: 0.3
|
21 |
+
make_plots: true
|
22 |
+
model:
|
23 |
+
attention:
|
24 |
+
activation: relu
|
25 |
+
attention_type: flash
|
26 |
+
conv_type: attention
|
27 |
+
dropout_conv_id_ff: 0.0
|
28 |
+
dropout_conv_id_mha: 0.0
|
29 |
+
dropout_conv_reg_ff: 0.0
|
30 |
+
dropout_conv_reg_mha: 0.0
|
31 |
+
dropout_ff: 0.0
|
32 |
+
head_dim: 16
|
33 |
+
num_convs: 3
|
34 |
+
num_heads: 16
|
35 |
+
use_pre_layernorm: true
|
36 |
+
cos_phi_mode: linear
|
37 |
+
energy_mode: direct-elemtype-split
|
38 |
+
eta_mode: linear
|
39 |
+
gnn_lsh:
|
40 |
+
activation: elu
|
41 |
+
bin_size: 320
|
42 |
+
conv_type: gnn_lsh
|
43 |
+
distance_dim: 128
|
44 |
+
dropout_ff: 0.0
|
45 |
+
embedding_dim: 512
|
46 |
+
ffn_dist_hidden_dim: 128
|
47 |
+
ffn_dist_num_layers: 2
|
48 |
+
layernorm: true
|
49 |
+
max_num_bins: 200
|
50 |
+
num_convs: 8
|
51 |
+
num_node_messages: 2
|
52 |
+
width: 512
|
53 |
+
input_encoding: split
|
54 |
+
learned_representation_mode: last
|
55 |
+
mamba:
|
56 |
+
activation: elu
|
57 |
+
conv_type: mamba
|
58 |
+
d_conv: 4
|
59 |
+
d_state: 32
|
60 |
+
dropout_ff: 0.0
|
61 |
+
embedding_dim: 1024
|
62 |
+
expand: 2
|
63 |
+
num_convs: 4
|
64 |
+
width: 1024
|
65 |
+
pt_mode: direct-elemtype-split
|
66 |
+
sin_phi_mode: linear
|
67 |
+
trainable: all
|
68 |
+
ntest: 5000
|
69 |
+
ntrain: null
|
70 |
+
num_epochs: 10
|
71 |
+
num_workers: 1
|
72 |
+
nvalid: null
|
73 |
+
pad_to_multiple: 256
|
74 |
+
patience: 20
|
75 |
+
prefetch_factor: 10
|
76 |
+
raytune:
|
77 |
+
asha:
|
78 |
+
brackets: 1
|
79 |
+
grace_period: 10
|
80 |
+
max_t: 200
|
81 |
+
reduction_factor: 4
|
82 |
+
default_metric: val_loss
|
83 |
+
default_mode: min
|
84 |
+
hyperband:
|
85 |
+
max_t: 200
|
86 |
+
reduction_factor: 4
|
87 |
+
hyperopt:
|
88 |
+
n_random_steps: 10
|
89 |
+
local_dir: null
|
90 |
+
nevergrad:
|
91 |
+
n_random_steps: 10
|
92 |
+
sched: asha
|
93 |
+
search_alg: hyperopt
|
94 |
+
save_attention: false
|
95 |
+
sort_data: true
|
96 |
+
start_epoch: null
|
97 |
+
test: true
|
98 |
+
test_dataset:
|
99 |
+
cms_pf_qcd:
|
100 |
+
splits:
|
101 |
+
- 1
|
102 |
+
- 2
|
103 |
+
- 3
|
104 |
+
- 4
|
105 |
+
- 5
|
106 |
+
- 6
|
107 |
+
- 7
|
108 |
+
- 8
|
109 |
+
- 9
|
110 |
+
- 10
|
111 |
+
version: 2.7.1
|
112 |
+
cms_pf_qcd_nopu:
|
113 |
+
splits:
|
114 |
+
- 1
|
115 |
+
- 2
|
116 |
+
- 3
|
117 |
+
- 4
|
118 |
+
- 5
|
119 |
+
- 6
|
120 |
+
- 7
|
121 |
+
- 8
|
122 |
+
- 9
|
123 |
+
- 10
|
124 |
+
version: 2.7.1
|
125 |
+
cms_pf_ttbar:
|
126 |
+
splits:
|
127 |
+
- 1
|
128 |
+
- 2
|
129 |
+
- 3
|
130 |
+
- 4
|
131 |
+
- 5
|
132 |
+
- 6
|
133 |
+
- 7
|
134 |
+
- 8
|
135 |
+
- 9
|
136 |
+
- 10
|
137 |
+
version: 2.7.1
|
138 |
+
cms_pf_ttbar_nopu:
|
139 |
+
splits:
|
140 |
+
- 1
|
141 |
+
- 2
|
142 |
+
- 3
|
143 |
+
- 4
|
144 |
+
- 5
|
145 |
+
- 6
|
146 |
+
- 7
|
147 |
+
- 8
|
148 |
+
- 9
|
149 |
+
- 10
|
150 |
+
version: 2.7.1
|
151 |
+
cms_pf_ztt:
|
152 |
+
splits:
|
153 |
+
- 1
|
154 |
+
- 2
|
155 |
+
- 3
|
156 |
+
- 4
|
157 |
+
- 5
|
158 |
+
- 6
|
159 |
+
- 7
|
160 |
+
- 8
|
161 |
+
- 9
|
162 |
+
- 10
|
163 |
+
version: 2.7.1
|
164 |
+
cms_pf_ztt_nopu:
|
165 |
+
splits:
|
166 |
+
- 1
|
167 |
+
- 2
|
168 |
+
- 3
|
169 |
+
- 4
|
170 |
+
- 5
|
171 |
+
- 6
|
172 |
+
- 7
|
173 |
+
- 8
|
174 |
+
- 9
|
175 |
+
- 10
|
176 |
+
version: 2.7.1
|
177 |
+
train: null
|
178 |
+
train_dataset:
|
179 |
+
cms:
|
180 |
+
physical_nopu:
|
181 |
+
batch_size: 8
|
182 |
+
samples:
|
183 |
+
cms_pf_qcd_nopu:
|
184 |
+
splits:
|
185 |
+
- 1
|
186 |
+
- 2
|
187 |
+
- 3
|
188 |
+
- 4
|
189 |
+
- 5
|
190 |
+
- 6
|
191 |
+
- 7
|
192 |
+
- 8
|
193 |
+
- 9
|
194 |
+
- 10
|
195 |
+
version: 2.7.1
|
196 |
+
cms_pf_ttbar_nopu:
|
197 |
+
splits:
|
198 |
+
- 1
|
199 |
+
- 2
|
200 |
+
- 3
|
201 |
+
- 4
|
202 |
+
- 5
|
203 |
+
- 6
|
204 |
+
- 7
|
205 |
+
- 8
|
206 |
+
- 9
|
207 |
+
- 10
|
208 |
+
version: 2.7.1
|
209 |
+
cms_pf_ztt_nopu:
|
210 |
+
splits:
|
211 |
+
- 1
|
212 |
+
- 2
|
213 |
+
- 3
|
214 |
+
- 4
|
215 |
+
- 5
|
216 |
+
- 6
|
217 |
+
- 7
|
218 |
+
- 8
|
219 |
+
- 9
|
220 |
+
- 10
|
221 |
+
version: 2.7.1
|
222 |
+
physical_pu:
|
223 |
+
batch_size: 1
|
224 |
+
samples:
|
225 |
+
cms_pf_qcd:
|
226 |
+
splits:
|
227 |
+
- 1
|
228 |
+
- 2
|
229 |
+
- 3
|
230 |
+
- 4
|
231 |
+
- 5
|
232 |
+
- 6
|
233 |
+
- 7
|
234 |
+
- 8
|
235 |
+
- 9
|
236 |
+
- 10
|
237 |
+
version: 2.7.1
|
238 |
+
cms_pf_ttbar:
|
239 |
+
splits:
|
240 |
+
- 1
|
241 |
+
- 2
|
242 |
+
- 3
|
243 |
+
- 4
|
244 |
+
- 5
|
245 |
+
- 6
|
246 |
+
- 7
|
247 |
+
- 8
|
248 |
+
- 9
|
249 |
+
- 10
|
250 |
+
version: 2.7.1
|
251 |
+
cms_pf_ztt:
|
252 |
+
splits:
|
253 |
+
- 1
|
254 |
+
- 2
|
255 |
+
- 3
|
256 |
+
- 4
|
257 |
+
- 5
|
258 |
+
- 6
|
259 |
+
- 7
|
260 |
+
- 8
|
261 |
+
- 9
|
262 |
+
- 10
|
263 |
+
version: 2.7.1
|
264 |
+
val_freq: null
|
265 |
+
valid_dataset:
|
266 |
+
cms:
|
267 |
+
physical_nopu:
|
268 |
+
batch_size: 8
|
269 |
+
samples:
|
270 |
+
cms_pf_qcd_nopu:
|
271 |
+
splits:
|
272 |
+
- 1
|
273 |
+
- 2
|
274 |
+
- 3
|
275 |
+
- 4
|
276 |
+
- 5
|
277 |
+
- 6
|
278 |
+
- 7
|
279 |
+
- 8
|
280 |
+
- 9
|
281 |
+
- 10
|
282 |
+
version: 2.7.1
|
283 |
+
cms_pf_ttbar_nopu:
|
284 |
+
splits:
|
285 |
+
- 1
|
286 |
+
- 2
|
287 |
+
- 3
|
288 |
+
- 4
|
289 |
+
- 5
|
290 |
+
- 6
|
291 |
+
- 7
|
292 |
+
- 8
|
293 |
+
- 9
|
294 |
+
- 10
|
295 |
+
version: 2.7.1
|
296 |
+
cms_pf_ztt_nopu:
|
297 |
+
splits:
|
298 |
+
- 1
|
299 |
+
- 2
|
300 |
+
- 3
|
301 |
+
- 4
|
302 |
+
- 5
|
303 |
+
- 6
|
304 |
+
- 7
|
305 |
+
- 8
|
306 |
+
- 9
|
307 |
+
- 10
|
308 |
+
version: 2.7.1
|
309 |
+
physical_pu:
|
310 |
+
batch_size: 1
|
311 |
+
samples:
|
312 |
+
cms_pf_qcd:
|
313 |
+
splits:
|
314 |
+
- 1
|
315 |
+
- 2
|
316 |
+
- 3
|
317 |
+
- 4
|
318 |
+
- 5
|
319 |
+
- 6
|
320 |
+
- 7
|
321 |
+
- 8
|
322 |
+
- 9
|
323 |
+
- 10
|
324 |
+
version: 2.7.1
|
325 |
+
cms_pf_ttbar:
|
326 |
+
splits:
|
327 |
+
- 1
|
328 |
+
- 2
|
329 |
+
- 3
|
330 |
+
- 4
|
331 |
+
- 5
|
332 |
+
- 6
|
333 |
+
- 7
|
334 |
+
- 8
|
335 |
+
- 9
|
336 |
+
- 10
|
337 |
+
version: 2.7.1
|
338 |
+
cms_pf_ztt:
|
339 |
+
splits:
|
340 |
+
- 1
|
341 |
+
- 2
|
342 |
+
- 3
|
343 |
+
- 4
|
344 |
+
- 5
|
345 |
+
- 6
|
346 |
+
- 7
|
347 |
+
- 8
|
348 |
+
- 9
|
349 |
+
- 10
|
350 |
+
version: 2.7.1
|
cms/v2.6.0pre1/pyg-cms_20250722_101813_274478/test.log
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4b2e5114f18e6b371655aa34bf391c52d7636c78f838bb858815aa31bead4381
|
3 |
+
size 2709546
|
cms/v2.6.0pre1/pyg-cms_20250722_101813_274478/train-config.yaml
ADDED
@@ -0,0 +1,350 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
checkpoint_freq: 1
|
2 |
+
comet: false
|
3 |
+
comet_name: particleflow-pt
|
4 |
+
comet_offline: false
|
5 |
+
comet_step_freq: 10
|
6 |
+
conv_type: attention
|
7 |
+
data_dir: /scratch/project_465001293/joosep/tensorflow_datasets
|
8 |
+
dataset: cms
|
9 |
+
dtype: bfloat16
|
10 |
+
enabled_test_datasets:
|
11 |
+
- cms_pf_qcd
|
12 |
+
finetune: null
|
13 |
+
gpu_batch_multiplier: 12
|
14 |
+
gpus: 8
|
15 |
+
load: experiments/pyg-cms_20250721_111927_308632/checkpoints/checkpoint-08-3.849051.pth
|
16 |
+
lr: 0.002
|
17 |
+
lr_schedule: cosinedecay
|
18 |
+
lr_schedule_config:
|
19 |
+
onecycle:
|
20 |
+
pct_start: 0.3
|
21 |
+
make_plots: null
|
22 |
+
model:
|
23 |
+
attention:
|
24 |
+
activation: relu
|
25 |
+
attention_type: flash
|
26 |
+
conv_type: attention
|
27 |
+
dropout_conv_id_ff: 0.0
|
28 |
+
dropout_conv_id_mha: 0.0
|
29 |
+
dropout_conv_reg_ff: 0.0
|
30 |
+
dropout_conv_reg_mha: 0.0
|
31 |
+
dropout_ff: 0.0
|
32 |
+
head_dim: 16
|
33 |
+
num_convs: 3
|
34 |
+
num_heads: 16
|
35 |
+
use_pre_layernorm: true
|
36 |
+
cos_phi_mode: linear
|
37 |
+
energy_mode: direct-elemtype-split
|
38 |
+
eta_mode: linear
|
39 |
+
gnn_lsh:
|
40 |
+
activation: elu
|
41 |
+
bin_size: 320
|
42 |
+
conv_type: gnn_lsh
|
43 |
+
distance_dim: 128
|
44 |
+
dropout_ff: 0.0
|
45 |
+
embedding_dim: 512
|
46 |
+
ffn_dist_hidden_dim: 128
|
47 |
+
ffn_dist_num_layers: 2
|
48 |
+
layernorm: true
|
49 |
+
max_num_bins: 200
|
50 |
+
num_convs: 8
|
51 |
+
num_node_messages: 2
|
52 |
+
width: 512
|
53 |
+
input_encoding: split
|
54 |
+
learned_representation_mode: last
|
55 |
+
mamba:
|
56 |
+
activation: elu
|
57 |
+
conv_type: mamba
|
58 |
+
d_conv: 4
|
59 |
+
d_state: 32
|
60 |
+
dropout_ff: 0.0
|
61 |
+
embedding_dim: 1024
|
62 |
+
expand: 2
|
63 |
+
num_convs: 4
|
64 |
+
width: 1024
|
65 |
+
pt_mode: direct-elemtype-split
|
66 |
+
sin_phi_mode: linear
|
67 |
+
trainable: all
|
68 |
+
ntest: 1000
|
69 |
+
ntrain: null
|
70 |
+
num_epochs: 10
|
71 |
+
num_workers: 4
|
72 |
+
nvalid: null
|
73 |
+
pad_to_multiple: 256
|
74 |
+
patience: 20
|
75 |
+
prefetch_factor: 10
|
76 |
+
raytune:
|
77 |
+
asha:
|
78 |
+
brackets: 1
|
79 |
+
grace_period: 10
|
80 |
+
max_t: 200
|
81 |
+
reduction_factor: 4
|
82 |
+
default_metric: val_loss
|
83 |
+
default_mode: min
|
84 |
+
hyperband:
|
85 |
+
max_t: 200
|
86 |
+
reduction_factor: 4
|
87 |
+
hyperopt:
|
88 |
+
n_random_steps: 10
|
89 |
+
local_dir: null
|
90 |
+
nevergrad:
|
91 |
+
n_random_steps: 10
|
92 |
+
sched: asha
|
93 |
+
search_alg: hyperopt
|
94 |
+
save_attention: false
|
95 |
+
sort_data: true
|
96 |
+
start_epoch: null
|
97 |
+
test: null
|
98 |
+
test_dataset:
|
99 |
+
cms_pf_qcd:
|
100 |
+
splits:
|
101 |
+
- 1
|
102 |
+
- 2
|
103 |
+
- 3
|
104 |
+
- 4
|
105 |
+
- 5
|
106 |
+
- 6
|
107 |
+
- 7
|
108 |
+
- 8
|
109 |
+
- 9
|
110 |
+
- 10
|
111 |
+
version: 2.7.1
|
112 |
+
cms_pf_qcd_nopu:
|
113 |
+
splits:
|
114 |
+
- 1
|
115 |
+
- 2
|
116 |
+
- 3
|
117 |
+
- 4
|
118 |
+
- 5
|
119 |
+
- 6
|
120 |
+
- 7
|
121 |
+
- 8
|
122 |
+
- 9
|
123 |
+
- 10
|
124 |
+
version: 2.7.1
|
125 |
+
cms_pf_ttbar:
|
126 |
+
splits:
|
127 |
+
- 1
|
128 |
+
- 2
|
129 |
+
- 3
|
130 |
+
- 4
|
131 |
+
- 5
|
132 |
+
- 6
|
133 |
+
- 7
|
134 |
+
- 8
|
135 |
+
- 9
|
136 |
+
- 10
|
137 |
+
version: 2.7.1
|
138 |
+
cms_pf_ttbar_nopu:
|
139 |
+
splits:
|
140 |
+
- 1
|
141 |
+
- 2
|
142 |
+
- 3
|
143 |
+
- 4
|
144 |
+
- 5
|
145 |
+
- 6
|
146 |
+
- 7
|
147 |
+
- 8
|
148 |
+
- 9
|
149 |
+
- 10
|
150 |
+
version: 2.7.1
|
151 |
+
cms_pf_ztt:
|
152 |
+
splits:
|
153 |
+
- 1
|
154 |
+
- 2
|
155 |
+
- 3
|
156 |
+
- 4
|
157 |
+
- 5
|
158 |
+
- 6
|
159 |
+
- 7
|
160 |
+
- 8
|
161 |
+
- 9
|
162 |
+
- 10
|
163 |
+
version: 2.7.1
|
164 |
+
cms_pf_ztt_nopu:
|
165 |
+
splits:
|
166 |
+
- 1
|
167 |
+
- 2
|
168 |
+
- 3
|
169 |
+
- 4
|
170 |
+
- 5
|
171 |
+
- 6
|
172 |
+
- 7
|
173 |
+
- 8
|
174 |
+
- 9
|
175 |
+
- 10
|
176 |
+
version: 2.7.1
|
177 |
+
train: true
|
178 |
+
train_dataset:
|
179 |
+
cms:
|
180 |
+
physical_nopu:
|
181 |
+
batch_size: 8
|
182 |
+
samples:
|
183 |
+
cms_pf_qcd_nopu:
|
184 |
+
splits:
|
185 |
+
- 1
|
186 |
+
- 2
|
187 |
+
- 3
|
188 |
+
- 4
|
189 |
+
- 5
|
190 |
+
- 6
|
191 |
+
- 7
|
192 |
+
- 8
|
193 |
+
- 9
|
194 |
+
- 10
|
195 |
+
version: 2.7.1
|
196 |
+
cms_pf_ttbar_nopu:
|
197 |
+
splits:
|
198 |
+
- 1
|
199 |
+
- 2
|
200 |
+
- 3
|
201 |
+
- 4
|
202 |
+
- 5
|
203 |
+
- 6
|
204 |
+
- 7
|
205 |
+
- 8
|
206 |
+
- 9
|
207 |
+
- 10
|
208 |
+
version: 2.7.1
|
209 |
+
cms_pf_ztt_nopu:
|
210 |
+
splits:
|
211 |
+
- 1
|
212 |
+
- 2
|
213 |
+
- 3
|
214 |
+
- 4
|
215 |
+
- 5
|
216 |
+
- 6
|
217 |
+
- 7
|
218 |
+
- 8
|
219 |
+
- 9
|
220 |
+
- 10
|
221 |
+
version: 2.7.1
|
222 |
+
physical_pu:
|
223 |
+
batch_size: 1
|
224 |
+
samples:
|
225 |
+
cms_pf_qcd:
|
226 |
+
splits:
|
227 |
+
- 1
|
228 |
+
- 2
|
229 |
+
- 3
|
230 |
+
- 4
|
231 |
+
- 5
|
232 |
+
- 6
|
233 |
+
- 7
|
234 |
+
- 8
|
235 |
+
- 9
|
236 |
+
- 10
|
237 |
+
version: 2.7.1
|
238 |
+
cms_pf_ttbar:
|
239 |
+
splits:
|
240 |
+
- 1
|
241 |
+
- 2
|
242 |
+
- 3
|
243 |
+
- 4
|
244 |
+
- 5
|
245 |
+
- 6
|
246 |
+
- 7
|
247 |
+
- 8
|
248 |
+
- 9
|
249 |
+
- 10
|
250 |
+
version: 2.7.1
|
251 |
+
cms_pf_ztt:
|
252 |
+
splits:
|
253 |
+
- 1
|
254 |
+
- 2
|
255 |
+
- 3
|
256 |
+
- 4
|
257 |
+
- 5
|
258 |
+
- 6
|
259 |
+
- 7
|
260 |
+
- 8
|
261 |
+
- 9
|
262 |
+
- 10
|
263 |
+
version: 2.7.1
|
264 |
+
val_freq: null
|
265 |
+
valid_dataset:
|
266 |
+
cms:
|
267 |
+
physical_nopu:
|
268 |
+
batch_size: 8
|
269 |
+
samples:
|
270 |
+
cms_pf_qcd_nopu:
|
271 |
+
splits:
|
272 |
+
- 1
|
273 |
+
- 2
|
274 |
+
- 3
|
275 |
+
- 4
|
276 |
+
- 5
|
277 |
+
- 6
|
278 |
+
- 7
|
279 |
+
- 8
|
280 |
+
- 9
|
281 |
+
- 10
|
282 |
+
version: 2.7.1
|
283 |
+
cms_pf_ttbar_nopu:
|
284 |
+
splits:
|
285 |
+
- 1
|
286 |
+
- 2
|
287 |
+
- 3
|
288 |
+
- 4
|
289 |
+
- 5
|
290 |
+
- 6
|
291 |
+
- 7
|
292 |
+
- 8
|
293 |
+
- 9
|
294 |
+
- 10
|
295 |
+
version: 2.7.1
|
296 |
+
cms_pf_ztt_nopu:
|
297 |
+
splits:
|
298 |
+
- 1
|
299 |
+
- 2
|
300 |
+
- 3
|
301 |
+
- 4
|
302 |
+
- 5
|
303 |
+
- 6
|
304 |
+
- 7
|
305 |
+
- 8
|
306 |
+
- 9
|
307 |
+
- 10
|
308 |
+
version: 2.7.1
|
309 |
+
physical_pu:
|
310 |
+
batch_size: 1
|
311 |
+
samples:
|
312 |
+
cms_pf_qcd:
|
313 |
+
splits:
|
314 |
+
- 1
|
315 |
+
- 2
|
316 |
+
- 3
|
317 |
+
- 4
|
318 |
+
- 5
|
319 |
+
- 6
|
320 |
+
- 7
|
321 |
+
- 8
|
322 |
+
- 9
|
323 |
+
- 10
|
324 |
+
version: 2.7.1
|
325 |
+
cms_pf_ttbar:
|
326 |
+
splits:
|
327 |
+
- 1
|
328 |
+
- 2
|
329 |
+
- 3
|
330 |
+
- 4
|
331 |
+
- 5
|
332 |
+
- 6
|
333 |
+
- 7
|
334 |
+
- 8
|
335 |
+
- 9
|
336 |
+
- 10
|
337 |
+
version: 2.7.1
|
338 |
+
cms_pf_ztt:
|
339 |
+
splits:
|
340 |
+
- 1
|
341 |
+
- 2
|
342 |
+
- 3
|
343 |
+
- 4
|
344 |
+
- 5
|
345 |
+
- 6
|
346 |
+
- 7
|
347 |
+
- 8
|
348 |
+
- 9
|
349 |
+
- 10
|
350 |
+
version: 2.7.1
|
cms/v2.6.0pre1/pyg-cms_20250722_101813_274478/train.log
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:97a7c8fc9d73e3e1682b906b6f5cb48d2c0ea60e812e3961e6f3499c743f0407
|
3 |
+
size 45724
|