diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/0_client_model_round10.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/0_client_model_round10.pth new file mode 100644 index 0000000000000000000000000000000000000000..edbd08b8677ca3b7845a0d234b093b7fe22eab2d --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/0_client_model_round10.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3c80aea373e684b0b0e1fdaa29f5086d9850282713d9fb54a967bdaf0d5656b +size 184221358 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/0_client_model_round12.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/0_client_model_round12.pth new file mode 100644 index 0000000000000000000000000000000000000000..f8d6afd366582291fd73ef2dfa8f59939d048e65 --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/0_client_model_round12.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6e88b9022098d98fa9cfa027d936d0d4b833d12ba6a0b477a40df90c1a2acc6 +size 184221358 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/0_client_model_round15.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/0_client_model_round15.pth new file mode 100644 index 0000000000000000000000000000000000000000..e56f0b4b4a7aa550a78ac385c15fe56f2a357d2c --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/0_client_model_round15.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd38f4d921820662348aedb4fbadfbfbf98c971a9e60ab0866e5270c3a302ee4 +size 184221358 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/0_client_model_round17.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/0_client_model_round17.pth new file mode 100644 index 0000000000000000000000000000000000000000..ea9444ed86d003a649da66a2ae335cf5ca2859fe --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/0_client_model_round17.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a5f6b6de4aaf9d17c11baf939132bea16b62f9038995958983f45f6e4dd84db +size 184221358 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/0_client_model_round2.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/0_client_model_round2.pth new file mode 100644 index 0000000000000000000000000000000000000000..8869f1066f2f129ecfe8a00697164c07255e153c --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/0_client_model_round2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b343498a2a39af749f7cbbad7c8ee7a9cfdfcc0a6849b2024c3c2ee452f5c30e +size 184220842 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/0_client_model_round20.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/0_client_model_round20.pth new file mode 100644 index 0000000000000000000000000000000000000000..bbcecf8b9a017aaa9e535ffc9834b4976e6a43ba --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/0_client_model_round20.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84f76a291a929057829ffce7c02c24512babfad8e0d70ee53c39fd9a1d6225fb +size 184221358 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/0_client_model_round5.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/0_client_model_round5.pth new file mode 100644 index 0000000000000000000000000000000000000000..a9927d36e27709d1a250c72bde3aa81a07abf58a --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/0_client_model_round5.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4dfa4e7135faf8d522fa123c083db3cdf90c7510216734f3610f2ab72757f9f9 +size 184220842 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/0_client_model_round7.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/0_client_model_round7.pth new file mode 100644 index 0000000000000000000000000000000000000000..892aa6c381d4c3d4b2b08c36dff4f9dbcb955c6c --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/0_client_model_round7.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f14762c67038e79e68c786be9fa97f0a65e97fcde6d3a08aec4a845cc8761c7 +size 184220842 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/0_trainer_state.json b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/0_trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..5b3e1caa27218d2ebbd283177f23d42e6b088a74 --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/0_trainer_state.json @@ -0,0 +1,392 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 1.0, + "eval_steps": 500, + "global_step": 100, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.02, + "grad_norm": 10.118582725524902, + "learning_rate": 2e-05, + "loss": 1.2595, + "step": 2 + }, + { + "epoch": 0.04, + "grad_norm": 6.118746280670166, + "learning_rate": 2e-05, + "loss": 1.1929, + "step": 4 + }, + { + "epoch": 0.06, + "grad_norm": 6.284697532653809, + "learning_rate": 2e-05, + "loss": 0.2971, + "step": 6 + }, + { + "epoch": 0.08, + "grad_norm": 0.7177035808563232, + "learning_rate": 2e-05, + "loss": 0.0715, + "step": 8 + }, + { + "epoch": 0.1, + "grad_norm": 4.433117866516113, + "learning_rate": 2e-05, + "loss": 0.5271, + "step": 10 + }, + { + "epoch": 0.12, + "grad_norm": 11.228690147399902, + "learning_rate": 2e-05, + "loss": 0.7939, + "step": 12 + }, + { + "epoch": 0.14, + "grad_norm": 5.912347793579102, + "learning_rate": 2e-05, + "loss": 0.3741, + "step": 14 + }, + { + "epoch": 0.16, + "grad_norm": 10.805156707763672, + "learning_rate": 2e-05, + "loss": 1.2708, + "step": 16 + }, + { + "epoch": 0.18, + "grad_norm": 15.403585433959961, + "learning_rate": 2e-05, + "loss": 1.6731, + "step": 18 + }, + { + "epoch": 0.2, + "grad_norm": 9.482099533081055, + "learning_rate": 2e-05, + "loss": 0.9167, + "step": 20 + }, + { + "epoch": 0.22, + "grad_norm": 0.6143919229507446, + "learning_rate": 2e-05, + "loss": 0.019, + "step": 22 + }, + { + "epoch": 0.24, + "grad_norm": 10.184311866760254, + "learning_rate": 2e-05, + "loss": 0.8106, + "step": 24 + }, + { + "epoch": 0.26, + "grad_norm": 6.651106834411621, + "learning_rate": 2e-05, + "loss": 0.2174, + "step": 26 + }, + { + "epoch": 0.28, + "grad_norm": 0.7003784775733948, + "learning_rate": 2e-05, + "loss": 0.1429, + "step": 28 + }, + { + "epoch": 0.3, + "grad_norm": 2.259704351425171, + "learning_rate": 2e-05, + "loss": 0.7785, + "step": 30 + }, + { + "epoch": 0.32, + "grad_norm": 18.155855178833008, + "learning_rate": 2e-05, + "loss": 1.0938, + "step": 32 + }, + { + "epoch": 0.34, + "grad_norm": 5.880727291107178, + "learning_rate": 2e-05, + "loss": 0.276, + "step": 34 + }, + { + "epoch": 0.36, + "grad_norm": 11.953298568725586, + "learning_rate": 2e-05, + "loss": 0.6074, + "step": 36 + }, + { + "epoch": 0.38, + "grad_norm": 4.191051483154297, + "learning_rate": 2e-05, + "loss": 0.8617, + "step": 38 + }, + { + "epoch": 0.4, + "grad_norm": 4.7227277755737305, + "learning_rate": 2e-05, + "loss": 0.2521, + "step": 40 + }, + { + "epoch": 0.42, + "grad_norm": 1.4572652578353882, + "learning_rate": 2e-05, + "loss": 0.0813, + "step": 42 + }, + { + "epoch": 0.44, + "grad_norm": 7.992749214172363, + "learning_rate": 2e-05, + "loss": 1.4219, + "step": 44 + }, + { + "epoch": 0.46, + "grad_norm": 0.41965484619140625, + "learning_rate": 2e-05, + "loss": 0.2991, + "step": 46 + }, + { + "epoch": 0.48, + "grad_norm": 15.168863296508789, + "learning_rate": 2e-05, + "loss": 1.431, + "step": 48 + }, + { + "epoch": 0.5, + "grad_norm": 2.7082669734954834, + "learning_rate": 2e-05, + "loss": 0.1486, + "step": 50 + }, + { + "epoch": 0.52, + "grad_norm": 10.389884948730469, + "learning_rate": 2e-05, + "loss": 0.4073, + "step": 52 + }, + { + "epoch": 0.54, + "grad_norm": 2.2888519763946533, + "learning_rate": 2e-05, + "loss": 0.167, + "step": 54 + }, + { + "epoch": 0.56, + "grad_norm": 3.7965214252471924, + "learning_rate": 2e-05, + "loss": 0.153, + "step": 56 + }, + { + "epoch": 0.58, + "grad_norm": 12.314504623413086, + "learning_rate": 2e-05, + "loss": 1.9982, + "step": 58 + }, + { + "epoch": 0.6, + "grad_norm": 4.840147495269775, + "learning_rate": 2e-05, + "loss": 0.1507, + "step": 60 + }, + { + "epoch": 0.62, + "grad_norm": 2.2985310554504395, + "learning_rate": 2e-05, + "loss": 0.3894, + "step": 62 + }, + { + "epoch": 0.64, + "grad_norm": 3.943399667739868, + "learning_rate": 2e-05, + "loss": 0.1996, + "step": 64 + }, + { + "epoch": 0.66, + "grad_norm": 0.6128279566764832, + "learning_rate": 2e-05, + "loss": 0.1911, + "step": 66 + }, + { + "epoch": 0.68, + "grad_norm": 8.006756782531738, + "learning_rate": 2e-05, + "loss": 0.7514, + "step": 68 + }, + { + "epoch": 0.7, + "grad_norm": 12.730741500854492, + "learning_rate": 2e-05, + "loss": 0.7592, + "step": 70 + }, + { + "epoch": 0.72, + "grad_norm": 7.818113327026367, + "learning_rate": 2e-05, + "loss": 0.3167, + "step": 72 + }, + { + "epoch": 0.74, + "grad_norm": 11.865202903747559, + "learning_rate": 2e-05, + "loss": 2.6763, + "step": 74 + }, + { + "epoch": 0.76, + "grad_norm": 5.829477310180664, + "learning_rate": 2e-05, + "loss": 0.7548, + "step": 76 + }, + { + "epoch": 0.78, + "grad_norm": 0.4222329258918762, + "learning_rate": 2e-05, + "loss": 0.9183, + "step": 78 + }, + { + "epoch": 0.8, + "grad_norm": 6.740832805633545, + "learning_rate": 2e-05, + "loss": 1.1974, + "step": 80 + }, + { + "epoch": 0.82, + "grad_norm": 6.7113728523254395, + "learning_rate": 2e-05, + "loss": 0.5823, + "step": 82 + }, + { + "epoch": 0.84, + "grad_norm": 13.459867477416992, + "learning_rate": 2e-05, + "loss": 0.947, + "step": 84 + }, + { + "epoch": 0.86, + "grad_norm": 0.5863717198371887, + "learning_rate": 2e-05, + "loss": 0.1598, + "step": 86 + }, + { + "epoch": 0.88, + "grad_norm": 9.321941375732422, + "learning_rate": 2e-05, + "loss": 1.2366, + "step": 88 + }, + { + "epoch": 0.9, + "grad_norm": 4.117404937744141, + "learning_rate": 2e-05, + "loss": 0.403, + "step": 90 + }, + { + "epoch": 0.92, + "grad_norm": 0.7923697233200073, + "learning_rate": 2e-05, + "loss": 0.8784, + "step": 92 + }, + { + "epoch": 0.94, + "grad_norm": 9.964466094970703, + "learning_rate": 2e-05, + "loss": 1.9698, + "step": 94 + }, + { + "epoch": 0.96, + "grad_norm": 3.3292384147644043, + "learning_rate": 2e-05, + "loss": 1.5952, + "step": 96 + }, + { + "epoch": 0.98, + "grad_norm": 12.358708381652832, + "learning_rate": 2e-05, + "loss": 1.8824, + "step": 98 + }, + { + "epoch": 1.0, + "grad_norm": 0.8694202899932861, + "learning_rate": 2e-05, + "loss": 0.2218, + "step": 100 + }, + { + "epoch": 1.0, + "step": 100, + "total_flos": 2053257199353856.0, + "train_loss": 0.7544884479045868, + "train_runtime": 104.185, + "train_samples_per_second": 3.839, + "train_steps_per_second": 0.96 + } + ], + "logging_steps": 2, + "max_steps": 100, + "num_input_tokens_seen": 0, + "num_train_epochs": 1, + "save_steps": 500, + "stateful_callbacks": { + "TrainerControl": { + "args": { + "should_epoch_stop": false, + "should_evaluate": false, + "should_log": false, + "should_save": false, + "should_training_stop": false + }, + "attributes": {} + } + }, + "total_flos": 2053257199353856.0, + "train_batch_size": 1, + "trial_name": null, + "trial_params": null +} diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/1_client_model_round10.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/1_client_model_round10.pth new file mode 100644 index 0000000000000000000000000000000000000000..d5083d0dfb4694e0d5e31eb7dbf724c5f38d5bee --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/1_client_model_round10.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f0ac16fec9edf041d389c5bc6dd315670e98dca7a8355c19ee4a1b791eb6135 +size 184221358 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/1_client_model_round12.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/1_client_model_round12.pth new file mode 100644 index 0000000000000000000000000000000000000000..e9786a655c3b65821362af49c1f85c50745c90ce --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/1_client_model_round12.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97d4855863c1d2f4eea6cf30aa47ef34f4c334618724ad7e2894e05f243c9d09 +size 184221358 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/1_client_model_round15.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/1_client_model_round15.pth new file mode 100644 index 0000000000000000000000000000000000000000..b5f55507290884746396e278000af1fe3cd6ec18 --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/1_client_model_round15.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbfe4d0a3f072b16da77d77359969da3ec9dac57bd6ba9c87781fe28237622dc +size 184221358 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/1_client_model_round17.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/1_client_model_round17.pth new file mode 100644 index 0000000000000000000000000000000000000000..e46ff9cada27e1d03d096fc20cbe7216c691bd44 --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/1_client_model_round17.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed405c45843666cf944afa281a4b30b27575cff4f34767d3efb7ce3168ca8674 +size 184221358 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/1_client_model_round2.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/1_client_model_round2.pth new file mode 100644 index 0000000000000000000000000000000000000000..732ce75da7391b91ff2243b3a1f291d014b9065b --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/1_client_model_round2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7947d130f5da524a4b3c4cdb5fc89c08bfdeeb3cbf9a84c3a983ad0ec461c06d +size 184220842 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/1_client_model_round20.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/1_client_model_round20.pth new file mode 100644 index 0000000000000000000000000000000000000000..edb28cf8d3da2d4fb5717ef2da73350ae99dc182 --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/1_client_model_round20.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d028fff214c7d648c71a7a3c6aeac247aa071eae5fecee83d7f4cd501f25715 +size 184221358 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/1_client_model_round5.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/1_client_model_round5.pth new file mode 100644 index 0000000000000000000000000000000000000000..949ee1bb98b1632ab169d67bc3d301e9077d2881 --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/1_client_model_round5.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a233ae029e545a60633b16cd949410fa1d06d79f6799baaa3bb71f1ddc81bdc +size 184220842 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/1_client_model_round7.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/1_client_model_round7.pth new file mode 100644 index 0000000000000000000000000000000000000000..b28f80b382109765a3e2c797785cf58b0be9e9dc --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/1_client_model_round7.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1db6e06c7046e40a00de81a16c30f86bbc0efdb7a8a04ac38e98f85de5211b06 +size 184220842 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/1_trainer_state.json b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/1_trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..3e859b067b2c8b769942351d5bc7bcccf9d0d9a4 --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/1_trainer_state.json @@ -0,0 +1,392 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 1.0, + "eval_steps": 500, + "global_step": 100, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.02, + "grad_norm": 0.04393099993467331, + "learning_rate": 2e-05, + "loss": 0.1207, + "step": 2 + }, + { + "epoch": 0.04, + "grad_norm": 0.05937394127249718, + "learning_rate": 2e-05, + "loss": 0.0377, + "step": 4 + }, + { + "epoch": 0.06, + "grad_norm": 0.35762932896614075, + "learning_rate": 2e-05, + "loss": 0.0098, + "step": 6 + }, + { + "epoch": 0.08, + "grad_norm": 0.09789979457855225, + "learning_rate": 2e-05, + "loss": 0.0068, + "step": 8 + }, + { + "epoch": 0.1, + "grad_norm": 0.03392194211483002, + "learning_rate": 2e-05, + "loss": 0.0019, + "step": 10 + }, + { + "epoch": 0.12, + "grad_norm": 0.023007916286587715, + "learning_rate": 2e-05, + "loss": 0.0066, + "step": 12 + }, + { + "epoch": 0.14, + "grad_norm": 0.07225459069013596, + "learning_rate": 2e-05, + "loss": 0.0019, + "step": 14 + }, + { + "epoch": 0.16, + "grad_norm": 0.3029000461101532, + "learning_rate": 2e-05, + "loss": 0.0827, + "step": 16 + }, + { + "epoch": 0.18, + "grad_norm": 0.025219613686203957, + "learning_rate": 2e-05, + "loss": 0.0294, + "step": 18 + }, + { + "epoch": 0.2, + "grad_norm": 0.011582453735172749, + "learning_rate": 2e-05, + "loss": 0.001, + "step": 20 + }, + { + "epoch": 0.22, + "grad_norm": 0.04991193488240242, + "learning_rate": 2e-05, + "loss": 0.0077, + "step": 22 + }, + { + "epoch": 0.24, + "grad_norm": 0.05845927447080612, + "learning_rate": 2e-05, + "loss": 0.0019, + "step": 24 + }, + { + "epoch": 0.26, + "grad_norm": 1.4130098819732666, + "learning_rate": 2e-05, + "loss": 0.0395, + "step": 26 + }, + { + "epoch": 0.28, + "grad_norm": 0.016544118523597717, + "learning_rate": 2e-05, + "loss": 0.0007, + "step": 28 + }, + { + "epoch": 0.3, + "grad_norm": 1.08310067653656, + "learning_rate": 2e-05, + "loss": 0.0187, + "step": 30 + }, + { + "epoch": 0.32, + "grad_norm": 0.4315275549888611, + "learning_rate": 2e-05, + "loss": 0.2183, + "step": 32 + }, + { + "epoch": 0.34, + "grad_norm": 5.541749954223633, + "learning_rate": 2e-05, + "loss": 0.1588, + "step": 34 + }, + { + "epoch": 0.36, + "grad_norm": 0.005985849536955357, + "learning_rate": 2e-05, + "loss": 0.0003, + "step": 36 + }, + { + "epoch": 0.38, + "grad_norm": 0.15569433569908142, + "learning_rate": 2e-05, + "loss": 0.0049, + "step": 38 + }, + { + "epoch": 0.4, + "grad_norm": 6.249331474304199, + "learning_rate": 2e-05, + "loss": 0.2083, + "step": 40 + }, + { + "epoch": 0.42, + "grad_norm": 0.013107839040458202, + "learning_rate": 2e-05, + "loss": 0.0005, + "step": 42 + }, + { + "epoch": 0.44, + "grad_norm": 7.430248737335205, + "learning_rate": 2e-05, + "loss": 0.3365, + "step": 44 + }, + { + "epoch": 0.46, + "grad_norm": 0.007363118231296539, + "learning_rate": 2e-05, + "loss": 0.0007, + "step": 46 + }, + { + "epoch": 0.48, + "grad_norm": 0.22596396505832672, + "learning_rate": 2e-05, + "loss": 0.0028, + "step": 48 + }, + { + "epoch": 0.5, + "grad_norm": 0.011090992018580437, + "learning_rate": 2e-05, + "loss": 0.0082, + "step": 50 + }, + { + "epoch": 0.52, + "grad_norm": 0.002775605069473386, + "learning_rate": 2e-05, + "loss": 0.0144, + "step": 52 + }, + { + "epoch": 0.54, + "grad_norm": 0.12985211610794067, + "learning_rate": 2e-05, + "loss": 0.0036, + "step": 54 + }, + { + "epoch": 0.56, + "grad_norm": 0.00687048677355051, + "learning_rate": 2e-05, + "loss": 0.0506, + "step": 56 + }, + { + "epoch": 0.58, + "grad_norm": 0.1465214043855667, + "learning_rate": 2e-05, + "loss": 0.6757, + "step": 58 + }, + { + "epoch": 0.6, + "grad_norm": 0.008273234590888023, + "learning_rate": 2e-05, + "loss": 0.1315, + "step": 60 + }, + { + "epoch": 0.62, + "grad_norm": 0.004378190264105797, + "learning_rate": 2e-05, + "loss": 0.0005, + "step": 62 + }, + { + "epoch": 0.64, + "grad_norm": 0.01929680071771145, + "learning_rate": 2e-05, + "loss": 0.0199, + "step": 64 + }, + { + "epoch": 0.66, + "grad_norm": 0.08087120205163956, + "learning_rate": 2e-05, + "loss": 0.0018, + "step": 66 + }, + { + "epoch": 0.68, + "grad_norm": 0.59710294008255, + "learning_rate": 2e-05, + "loss": 0.0188, + "step": 68 + }, + { + "epoch": 0.7, + "grad_norm": 0.0036440733820199966, + "learning_rate": 2e-05, + "loss": 0.0007, + "step": 70 + }, + { + "epoch": 0.72, + "grad_norm": 1.1077224016189575, + "learning_rate": 2e-05, + "loss": 0.0233, + "step": 72 + }, + { + "epoch": 0.74, + "grad_norm": 0.230132058262825, + "learning_rate": 2e-05, + "loss": 0.0057, + "step": 74 + }, + { + "epoch": 0.76, + "grad_norm": 0.05570218339562416, + "learning_rate": 2e-05, + "loss": 0.0017, + "step": 76 + }, + { + "epoch": 0.78, + "grad_norm": 8.745405197143555, + "learning_rate": 2e-05, + "loss": 0.3285, + "step": 78 + }, + { + "epoch": 0.8, + "grad_norm": 0.024981992319226265, + "learning_rate": 2e-05, + "loss": 0.0147, + "step": 80 + }, + { + "epoch": 0.82, + "grad_norm": 0.031237130984663963, + "learning_rate": 2e-05, + "loss": 0.0012, + "step": 82 + }, + { + "epoch": 0.84, + "grad_norm": 0.0025312919169664383, + "learning_rate": 2e-05, + "loss": 0.0005, + "step": 84 + }, + { + "epoch": 0.86, + "grad_norm": 0.015429472550749779, + "learning_rate": 2e-05, + "loss": 1.1335, + "step": 86 + }, + { + "epoch": 0.88, + "grad_norm": 0.017283031716942787, + "learning_rate": 2e-05, + "loss": 0.3927, + "step": 88 + }, + { + "epoch": 0.9, + "grad_norm": 0.5121035575866699, + "learning_rate": 2e-05, + "loss": 0.0129, + "step": 90 + }, + { + "epoch": 0.92, + "grad_norm": 0.03509877249598503, + "learning_rate": 2e-05, + "loss": 0.0017, + "step": 92 + }, + { + "epoch": 0.94, + "grad_norm": 0.14815396070480347, + "learning_rate": 2e-05, + "loss": 0.0033, + "step": 94 + }, + { + "epoch": 0.96, + "grad_norm": 0.7982791662216187, + "learning_rate": 2e-05, + "loss": 0.0208, + "step": 96 + }, + { + "epoch": 0.98, + "grad_norm": 0.01828967221081257, + "learning_rate": 2e-05, + "loss": 0.0008, + "step": 98 + }, + { + "epoch": 1.0, + "grad_norm": 0.028920019045472145, + "learning_rate": 2e-05, + "loss": 0.001, + "step": 100 + }, + { + "epoch": 1.0, + "step": 100, + "total_flos": 2069634366832640.0, + "train_loss": 0.08332296743988991, + "train_runtime": 107.3131, + "train_samples_per_second": 3.727, + "train_steps_per_second": 0.932 + } + ], + "logging_steps": 2, + "max_steps": 100, + "num_input_tokens_seen": 0, + "num_train_epochs": 1, + "save_steps": 500, + "stateful_callbacks": { + "TrainerControl": { + "args": { + "should_epoch_stop": false, + "should_evaluate": false, + "should_log": false, + "should_save": false, + "should_training_stop": false + }, + "attributes": {} + } + }, + "total_flos": 2069634366832640.0, + "train_batch_size": 1, + "trial_name": null, + "trial_params": null +} diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/2_client_model_round10.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/2_client_model_round10.pth new file mode 100644 index 0000000000000000000000000000000000000000..9a271f25c4383219ef6301579acddd1223dcff11 --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/2_client_model_round10.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da9148465a8f4cd95eb0270b16e665c42629158f33ddfd085cf012707d1ef16b +size 395787774 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/2_client_model_round12.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/2_client_model_round12.pth new file mode 100644 index 0000000000000000000000000000000000000000..3530805c3bdb4dd77592d57d585a00b0924b78e5 --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/2_client_model_round12.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f056a7a7306d28976e4fde5cb1b618208f0e76c65bd6947194700673afa3716f +size 395787774 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/2_client_model_round15.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/2_client_model_round15.pth new file mode 100644 index 0000000000000000000000000000000000000000..2e6d375758bb85f5f38b4f17a0fad67832282bb3 --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/2_client_model_round15.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1cb3dcfd9ac4a31a6062da06d6c2a79b842c37d02bcd61f707a6b3cf697d7bd5 +size 395787774 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/2_client_model_round17.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/2_client_model_round17.pth new file mode 100644 index 0000000000000000000000000000000000000000..9d17fe4ec9e32559e8fe4bcaa91ea196c4e14020 --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/2_client_model_round17.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1a32667855f860745db53d430e6027c2efab2aba52ede199dfdbe120ec036ae +size 395787774 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/2_client_model_round2.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/2_client_model_round2.pth new file mode 100644 index 0000000000000000000000000000000000000000..81037052396d4b46279c77f62e341109cf1e6660 --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/2_client_model_round2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f17d877d7edb557a631aa8a8e9d7bbb5fe31cd8b8ea72023e5dd5c53d78cb51 +size 395786922 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/2_client_model_round20.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/2_client_model_round20.pth new file mode 100644 index 0000000000000000000000000000000000000000..1db05d30ed8efd439995d048a71ae0516da55e5a --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/2_client_model_round20.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bea7e9f04931f33c56745ae1d45c38c1aded38837d8c0b8d3188a343789720f +size 395787774 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/2_client_model_round5.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/2_client_model_round5.pth new file mode 100644 index 0000000000000000000000000000000000000000..b6abcc2fd3ad3f8b2a2778db20224a686d27cbc3 --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/2_client_model_round5.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ce75e696ed202ce34673247f828b40b13467468cd3c20ad62920c876d2499b8 +size 395786922 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/2_client_model_round7.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/2_client_model_round7.pth new file mode 100644 index 0000000000000000000000000000000000000000..807394003f9678785464f37ade610ef8ffa1af64 --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/2_client_model_round7.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7816dd1bead642c814ff649d6f816a07e2a31ad800473f5f91e736dd8f6abb0f +size 395786922 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/2_trainer_state.json b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/2_trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..7e8b09b65af992dc1a11b5d55ab2a6acba58c95a --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/2_trainer_state.json @@ -0,0 +1,392 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 1.0, + "eval_steps": 500, + "global_step": 100, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.02, + "grad_norm": 2.0575942993164062, + "learning_rate": 2e-05, + "loss": 0.1776, + "step": 2 + }, + { + "epoch": 0.04, + "grad_norm": 4.511972904205322, + "learning_rate": 2e-05, + "loss": 1.2725, + "step": 4 + }, + { + "epoch": 0.06, + "grad_norm": 2.5023305416107178, + "learning_rate": 2e-05, + "loss": 0.8205, + "step": 6 + }, + { + "epoch": 0.08, + "grad_norm": 4.759030818939209, + "learning_rate": 2e-05, + "loss": 1.0588, + "step": 8 + }, + { + "epoch": 0.1, + "grad_norm": 5.180241107940674, + "learning_rate": 2e-05, + "loss": 0.5701, + "step": 10 + }, + { + "epoch": 0.12, + "grad_norm": 6.446163654327393, + "learning_rate": 2e-05, + "loss": 0.9541, + "step": 12 + }, + { + "epoch": 0.14, + "grad_norm": 0.8326573967933655, + "learning_rate": 2e-05, + "loss": 0.4677, + "step": 14 + }, + { + "epoch": 0.16, + "grad_norm": 5.085803508758545, + "learning_rate": 2e-05, + "loss": 0.7075, + "step": 16 + }, + { + "epoch": 0.18, + "grad_norm": 2.1354782581329346, + "learning_rate": 2e-05, + "loss": 0.4075, + "step": 18 + }, + { + "epoch": 0.2, + "grad_norm": 4.467723846435547, + "learning_rate": 2e-05, + "loss": 1.4546, + "step": 20 + }, + { + "epoch": 0.22, + "grad_norm": 0.7991389632225037, + "learning_rate": 2e-05, + "loss": 0.1716, + "step": 22 + }, + { + "epoch": 0.24, + "grad_norm": 8.154854774475098, + "learning_rate": 2e-05, + "loss": 0.6297, + "step": 24 + }, + { + "epoch": 0.26, + "grad_norm": 8.408839225769043, + "learning_rate": 2e-05, + "loss": 0.7795, + "step": 26 + }, + { + "epoch": 0.28, + "grad_norm": 5.934333324432373, + "learning_rate": 2e-05, + "loss": 0.3573, + "step": 28 + }, + { + "epoch": 0.3, + "grad_norm": 1.385451078414917, + "learning_rate": 2e-05, + "loss": 0.1851, + "step": 30 + }, + { + "epoch": 0.32, + "grad_norm": 5.4457573890686035, + "learning_rate": 2e-05, + "loss": 0.3923, + "step": 32 + }, + { + "epoch": 0.34, + "grad_norm": 3.9038946628570557, + "learning_rate": 2e-05, + "loss": 0.5699, + "step": 34 + }, + { + "epoch": 0.36, + "grad_norm": 2.6609935760498047, + "learning_rate": 2e-05, + "loss": 0.1604, + "step": 36 + }, + { + "epoch": 0.38, + "grad_norm": 4.058396339416504, + "learning_rate": 2e-05, + "loss": 1.0164, + "step": 38 + }, + { + "epoch": 0.4, + "grad_norm": 7.083247184753418, + "learning_rate": 2e-05, + "loss": 0.6453, + "step": 40 + }, + { + "epoch": 0.42, + "grad_norm": 2.5094070434570312, + "learning_rate": 2e-05, + "loss": 0.7037, + "step": 42 + }, + { + "epoch": 0.44, + "grad_norm": 3.413587808609009, + "learning_rate": 2e-05, + "loss": 0.2112, + "step": 44 + }, + { + "epoch": 0.46, + "grad_norm": 1.3233474493026733, + "learning_rate": 2e-05, + "loss": 0.4624, + "step": 46 + }, + { + "epoch": 0.48, + "grad_norm": 0.4725527763366699, + "learning_rate": 2e-05, + "loss": 0.429, + "step": 48 + }, + { + "epoch": 0.5, + "grad_norm": 1.5021445751190186, + "learning_rate": 2e-05, + "loss": 0.1492, + "step": 50 + }, + { + "epoch": 0.52, + "grad_norm": 7.261585235595703, + "learning_rate": 2e-05, + "loss": 0.8084, + "step": 52 + }, + { + "epoch": 0.54, + "grad_norm": 7.5004377365112305, + "learning_rate": 2e-05, + "loss": 0.585, + "step": 54 + }, + { + "epoch": 0.56, + "grad_norm": 9.127928733825684, + "learning_rate": 2e-05, + "loss": 0.7318, + "step": 56 + }, + { + "epoch": 0.58, + "grad_norm": 3.533341407775879, + "learning_rate": 2e-05, + "loss": 0.153, + "step": 58 + }, + { + "epoch": 0.6, + "grad_norm": 0.16624395549297333, + "learning_rate": 2e-05, + "loss": 0.1535, + "step": 60 + }, + { + "epoch": 0.62, + "grad_norm": 2.0703632831573486, + "learning_rate": 2e-05, + "loss": 0.7659, + "step": 62 + }, + { + "epoch": 0.64, + "grad_norm": 5.86838436126709, + "learning_rate": 2e-05, + "loss": 0.5777, + "step": 64 + }, + { + "epoch": 0.66, + "grad_norm": 2.4951283931732178, + "learning_rate": 2e-05, + "loss": 0.137, + "step": 66 + }, + { + "epoch": 0.68, + "grad_norm": 3.6449482440948486, + "learning_rate": 2e-05, + "loss": 0.3761, + "step": 68 + }, + { + "epoch": 0.7, + "grad_norm": 4.749931335449219, + "learning_rate": 2e-05, + "loss": 0.7073, + "step": 70 + }, + { + "epoch": 0.72, + "grad_norm": 0.8903286457061768, + "learning_rate": 2e-05, + "loss": 0.7262, + "step": 72 + }, + { + "epoch": 0.74, + "grad_norm": 0.5491483807563782, + "learning_rate": 2e-05, + "loss": 0.0311, + "step": 74 + }, + { + "epoch": 0.76, + "grad_norm": 0.6490838527679443, + "learning_rate": 2e-05, + "loss": 0.168, + "step": 76 + }, + { + "epoch": 0.78, + "grad_norm": 2.041003704071045, + "learning_rate": 2e-05, + "loss": 0.1247, + "step": 78 + }, + { + "epoch": 0.8, + "grad_norm": 16.038522720336914, + "learning_rate": 2e-05, + "loss": 1.7644, + "step": 80 + }, + { + "epoch": 0.82, + "grad_norm": 14.096282958984375, + "learning_rate": 2e-05, + "loss": 2.9032, + "step": 82 + }, + { + "epoch": 0.84, + "grad_norm": 0.6244635581970215, + "learning_rate": 2e-05, + "loss": 0.0249, + "step": 84 + }, + { + "epoch": 0.86, + "grad_norm": 5.987948417663574, + "learning_rate": 2e-05, + "loss": 0.5752, + "step": 86 + }, + { + "epoch": 0.88, + "grad_norm": 5.380762577056885, + "learning_rate": 2e-05, + "loss": 0.5555, + "step": 88 + }, + { + "epoch": 0.9, + "grad_norm": 5.882531642913818, + "learning_rate": 2e-05, + "loss": 1.6443, + "step": 90 + }, + { + "epoch": 0.92, + "grad_norm": 0.13828590512275696, + "learning_rate": 2e-05, + "loss": 0.2562, + "step": 92 + }, + { + "epoch": 0.94, + "grad_norm": 6.185029029846191, + "learning_rate": 2e-05, + "loss": 0.5181, + "step": 94 + }, + { + "epoch": 0.96, + "grad_norm": 3.6633758544921875, + "learning_rate": 2e-05, + "loss": 0.2768, + "step": 96 + }, + { + "epoch": 0.98, + "grad_norm": 10.242522239685059, + "learning_rate": 2e-05, + "loss": 1.9668, + "step": 98 + }, + { + "epoch": 1.0, + "grad_norm": 2.074227809906006, + "learning_rate": 2e-05, + "loss": 0.1758, + "step": 100 + }, + { + "epoch": 1.0, + "step": 100, + "total_flos": 4914533793529856.0, + "train_loss": 0.6292184376716614, + "train_runtime": 177.8526, + "train_samples_per_second": 2.249, + "train_steps_per_second": 0.562 + } + ], + "logging_steps": 2, + "max_steps": 100, + "num_input_tokens_seen": 0, + "num_train_epochs": 1, + "save_steps": 500, + "stateful_callbacks": { + "TrainerControl": { + "args": { + "should_epoch_stop": false, + "should_evaluate": false, + "should_log": false, + "should_save": false, + "should_training_stop": false + }, + "attributes": {} + } + }, + "total_flos": 4914533793529856.0, + "train_batch_size": 1, + "trial_name": null, + "trial_params": null +} diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/3_client_model_round10.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/3_client_model_round10.pth new file mode 100644 index 0000000000000000000000000000000000000000..c567dc78a4fada19e5e71937b9729c2554f24198 --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/3_client_model_round10.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1caed849bb9462392a855436bd239bff51df5a0a602ded2c64eee5b5fb3a80d +size 184221358 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/3_client_model_round12.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/3_client_model_round12.pth new file mode 100644 index 0000000000000000000000000000000000000000..55582adab194d5f752c9322948e076261ae7e815 --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/3_client_model_round12.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00879f5a55a113c84b67ee13645a3a39a68074762b9efe2023779ed5a48fdd93 +size 184221358 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/3_client_model_round15.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/3_client_model_round15.pth new file mode 100644 index 0000000000000000000000000000000000000000..9ff0827b397e7f73394b28142fd10ced492e3e70 --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/3_client_model_round15.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3dab260c08d06e7dfbe65867448b5575dac4f9f5dbee4f39a0eed137f16c14c +size 184221358 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/3_client_model_round17.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/3_client_model_round17.pth new file mode 100644 index 0000000000000000000000000000000000000000..cc893b6df7854d828b85fcecf23d5182a9ec19f0 --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/3_client_model_round17.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebab4b60f08b0096b0f6c1e817927c47708d879e863a55b8a74af0b5381fe52f +size 184221358 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/3_client_model_round2.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/3_client_model_round2.pth new file mode 100644 index 0000000000000000000000000000000000000000..3b9306dc8bcbaa39469c30d4e99cd236d89fbd72 --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/3_client_model_round2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41cdbf7fbf9f2eba9debe3b60422fad176d9bce7f11ae2c2286a9051a36cf3e0 +size 184220842 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/3_client_model_round20.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/3_client_model_round20.pth new file mode 100644 index 0000000000000000000000000000000000000000..c28f0a91bb75edca4e603f94c2b2385815ef922e --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/3_client_model_round20.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01c14c027726c94d05b77d01aa6098b1329d6420f1a2791995dbf57cacc6eee3 +size 184221358 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/3_client_model_round5.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/3_client_model_round5.pth new file mode 100644 index 0000000000000000000000000000000000000000..1682cf0a8def3751f9bd0da2bdb1e1bd860478e3 --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/3_client_model_round5.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfa2b8e7e3a327002d47889f93e0c211dd05aabbfc43d19c6c833be387c586f1 +size 184220842 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/3_client_model_round7.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/3_client_model_round7.pth new file mode 100644 index 0000000000000000000000000000000000000000..d6a2da8e28d9550872c8742666b6d646df37a726 --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/3_client_model_round7.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93c8f02b96fd7cabe7a2a0a74c6f835a0c7a5709c3048a6ae17e863f25fd1300 +size 184220842 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/3_trainer_state.json b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/3_trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..bcfc14b4ca578350ab1feaa5ec42894d4d984120 --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/3_trainer_state.json @@ -0,0 +1,392 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 1.0, + "eval_steps": 500, + "global_step": 100, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.02, + "grad_norm": 11.626480102539062, + "learning_rate": 2e-05, + "loss": 2.05, + "step": 2 + }, + { + "epoch": 0.04, + "grad_norm": 3.168531894683838, + "learning_rate": 2e-05, + "loss": 0.4739, + "step": 4 + }, + { + "epoch": 0.06, + "grad_norm": 8.85742473602295, + "learning_rate": 2e-05, + "loss": 1.2035, + "step": 6 + }, + { + "epoch": 0.08, + "grad_norm": 13.493270874023438, + "learning_rate": 2e-05, + "loss": 1.469, + "step": 8 + }, + { + "epoch": 0.1, + "grad_norm": 14.354758262634277, + "learning_rate": 2e-05, + "loss": 1.4982, + "step": 10 + }, + { + "epoch": 0.12, + "grad_norm": 9.80854320526123, + "learning_rate": 2e-05, + "loss": 1.6823, + "step": 12 + }, + { + "epoch": 0.14, + "grad_norm": 9.743561744689941, + "learning_rate": 2e-05, + "loss": 1.0911, + "step": 14 + }, + { + "epoch": 0.16, + "grad_norm": 8.771895408630371, + "learning_rate": 2e-05, + "loss": 0.8212, + "step": 16 + }, + { + "epoch": 0.18, + "grad_norm": 9.498795509338379, + "learning_rate": 2e-05, + "loss": 0.5289, + "step": 18 + }, + { + "epoch": 0.2, + "grad_norm": 3.34366774559021, + "learning_rate": 2e-05, + "loss": 0.8355, + "step": 20 + }, + { + "epoch": 0.22, + "grad_norm": 7.088817119598389, + "learning_rate": 2e-05, + "loss": 0.7599, + "step": 22 + }, + { + "epoch": 0.24, + "grad_norm": 5.744113922119141, + "learning_rate": 2e-05, + "loss": 0.9473, + "step": 24 + }, + { + "epoch": 0.26, + "grad_norm": 2.3298373222351074, + "learning_rate": 2e-05, + "loss": 0.434, + "step": 26 + }, + { + "epoch": 0.28, + "grad_norm": 7.713898181915283, + "learning_rate": 2e-05, + "loss": 0.429, + "step": 28 + }, + { + "epoch": 0.3, + "grad_norm": 9.572039604187012, + "learning_rate": 2e-05, + "loss": 0.9164, + "step": 30 + }, + { + "epoch": 0.32, + "grad_norm": 22.07094383239746, + "learning_rate": 2e-05, + "loss": 1.9406, + "step": 32 + }, + { + "epoch": 0.34, + "grad_norm": 3.5470852851867676, + "learning_rate": 2e-05, + "loss": 2.0393, + "step": 34 + }, + { + "epoch": 0.36, + "grad_norm": 13.401988983154297, + "learning_rate": 2e-05, + "loss": 2.3097, + "step": 36 + }, + { + "epoch": 0.38, + "grad_norm": 7.751951694488525, + "learning_rate": 2e-05, + "loss": 1.1857, + "step": 38 + }, + { + "epoch": 0.4, + "grad_norm": 5.891435623168945, + "learning_rate": 2e-05, + "loss": 1.2277, + "step": 40 + }, + { + "epoch": 0.42, + "grad_norm": 17.701826095581055, + "learning_rate": 2e-05, + "loss": 1.5125, + "step": 42 + }, + { + "epoch": 0.44, + "grad_norm": 14.625367164611816, + "learning_rate": 2e-05, + "loss": 1.5429, + "step": 44 + }, + { + "epoch": 0.46, + "grad_norm": 7.432581424713135, + "learning_rate": 2e-05, + "loss": 0.6927, + "step": 46 + }, + { + "epoch": 0.48, + "grad_norm": 5.332671642303467, + "learning_rate": 2e-05, + "loss": 0.518, + "step": 48 + }, + { + "epoch": 0.5, + "grad_norm": 6.91637659072876, + "learning_rate": 2e-05, + "loss": 1.067, + "step": 50 + }, + { + "epoch": 0.52, + "grad_norm": 8.855731964111328, + "learning_rate": 2e-05, + "loss": 2.106, + "step": 52 + }, + { + "epoch": 0.54, + "grad_norm": 1.1896896362304688, + "learning_rate": 2e-05, + "loss": 0.7944, + "step": 54 + }, + { + "epoch": 0.56, + "grad_norm": 2.625309467315674, + "learning_rate": 2e-05, + "loss": 0.7708, + "step": 56 + }, + { + "epoch": 0.58, + "grad_norm": 6.494451999664307, + "learning_rate": 2e-05, + "loss": 0.8268, + "step": 58 + }, + { + "epoch": 0.6, + "grad_norm": 8.12104606628418, + "learning_rate": 2e-05, + "loss": 1.4391, + "step": 60 + }, + { + "epoch": 0.62, + "grad_norm": 6.43969202041626, + "learning_rate": 2e-05, + "loss": 0.7089, + "step": 62 + }, + { + "epoch": 0.64, + "grad_norm": 6.886626243591309, + "learning_rate": 2e-05, + "loss": 0.7891, + "step": 64 + }, + { + "epoch": 0.66, + "grad_norm": 6.742187976837158, + "learning_rate": 2e-05, + "loss": 1.0454, + "step": 66 + }, + { + "epoch": 0.68, + "grad_norm": 5.596505641937256, + "learning_rate": 2e-05, + "loss": 1.119, + "step": 68 + }, + { + "epoch": 0.7, + "grad_norm": 6.840418815612793, + "learning_rate": 2e-05, + "loss": 1.1935, + "step": 70 + }, + { + "epoch": 0.72, + "grad_norm": 9.243856430053711, + "learning_rate": 2e-05, + "loss": 2.1952, + "step": 72 + }, + { + "epoch": 0.74, + "grad_norm": 7.282166957855225, + "learning_rate": 2e-05, + "loss": 1.2137, + "step": 74 + }, + { + "epoch": 0.76, + "grad_norm": 16.72466468811035, + "learning_rate": 2e-05, + "loss": 1.4145, + "step": 76 + }, + { + "epoch": 0.78, + "grad_norm": 7.7932353019714355, + "learning_rate": 2e-05, + "loss": 0.7947, + "step": 78 + }, + { + "epoch": 0.8, + "grad_norm": 10.55909538269043, + "learning_rate": 2e-05, + "loss": 0.9934, + "step": 80 + }, + { + "epoch": 0.82, + "grad_norm": 4.435039520263672, + "learning_rate": 2e-05, + "loss": 0.2408, + "step": 82 + }, + { + "epoch": 0.84, + "grad_norm": 5.173746585845947, + "learning_rate": 2e-05, + "loss": 0.4114, + "step": 84 + }, + { + "epoch": 0.86, + "grad_norm": 4.682281970977783, + "learning_rate": 2e-05, + "loss": 1.0906, + "step": 86 + }, + { + "epoch": 0.88, + "grad_norm": 4.184356689453125, + "learning_rate": 2e-05, + "loss": 0.9139, + "step": 88 + }, + { + "epoch": 0.9, + "grad_norm": 7.258085250854492, + "learning_rate": 2e-05, + "loss": 0.8793, + "step": 90 + }, + { + "epoch": 0.92, + "grad_norm": 9.776921272277832, + "learning_rate": 2e-05, + "loss": 0.5706, + "step": 92 + }, + { + "epoch": 0.94, + "grad_norm": 7.206700801849365, + "learning_rate": 2e-05, + "loss": 0.6475, + "step": 94 + }, + { + "epoch": 0.96, + "grad_norm": 5.574616432189941, + "learning_rate": 2e-05, + "loss": 0.3655, + "step": 96 + }, + { + "epoch": 0.98, + "grad_norm": 7.361481189727783, + "learning_rate": 2e-05, + "loss": 1.1062, + "step": 98 + }, + { + "epoch": 1.0, + "grad_norm": 8.203963279724121, + "learning_rate": 2e-05, + "loss": 1.1724, + "step": 100 + }, + { + "epoch": 1.0, + "step": 100, + "total_flos": 2097655350034432.0, + "train_loss": 1.0795783376693726, + "train_runtime": 105.8553, + "train_samples_per_second": 3.779, + "train_steps_per_second": 0.945 + } + ], + "logging_steps": 2, + "max_steps": 100, + "num_input_tokens_seen": 0, + "num_train_epochs": 1, + "save_steps": 500, + "stateful_callbacks": { + "TrainerControl": { + "args": { + "should_epoch_stop": false, + "should_evaluate": false, + "should_log": false, + "should_save": false, + "should_training_stop": false + }, + "attributes": {} + } + }, + "total_flos": 2097655350034432.0, + "train_batch_size": 1, + "trial_name": null, + "trial_params": null +} diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/4_client_model_round10.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/4_client_model_round10.pth new file mode 100644 index 0000000000000000000000000000000000000000..e4ad44f6a590935bf67ffdbd1867104245424688 --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/4_client_model_round10.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b4c70a43ea29ab4146dc52168d71be9bb1ee30fd66fa0570cc295895a400058 +size 395787774 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/4_client_model_round12.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/4_client_model_round12.pth new file mode 100644 index 0000000000000000000000000000000000000000..b034537246941454db196c8ea3e408f1421975d4 --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/4_client_model_round12.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c4121df5da69f25e22324b1fae947d957965cc89060aee94c232c217c13d5a2 +size 395787774 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/4_client_model_round15.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/4_client_model_round15.pth new file mode 100644 index 0000000000000000000000000000000000000000..0c380a8b06a30922d111008f928a66afeb3ab7d2 --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/4_client_model_round15.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:652fc3cbea3aa91a5eabdf26ed9e3ba0956d061c573c80656d394a6d472a5abd +size 395787774 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/4_client_model_round17.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/4_client_model_round17.pth new file mode 100644 index 0000000000000000000000000000000000000000..25344b374b39f88de02c3e008b23fb62226c0f4d --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/4_client_model_round17.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:241cf639f7184d9cad2c59c2a8bc8b97e853f9d9e1148f88a8e53c2529d3694e +size 395787774 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/4_client_model_round2.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/4_client_model_round2.pth new file mode 100644 index 0000000000000000000000000000000000000000..2bbb45cd6d1e2dfd01c5fe64faac46f794345231 --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/4_client_model_round2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7cd7d4793d455ea44d08d57f35d9f72b764bac238dafe97e35fad001f9bfec4 +size 395786922 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/4_client_model_round20.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/4_client_model_round20.pth new file mode 100644 index 0000000000000000000000000000000000000000..9931f773485d208c424e3992848b58957f2065cc --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/4_client_model_round20.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7026d317cb2c5e167440fea75c22721176e3f611591e2ee55098b8e9d4093cd9 +size 395787774 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/4_client_model_round5.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/4_client_model_round5.pth new file mode 100644 index 0000000000000000000000000000000000000000..1c7f04199424ce1bdb3460687ddea0d19d4fd199 --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/4_client_model_round5.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13abd74b11414572dfa4c1f4ca4fa0fb3c8e377ebc34367b8e3be387ab0e4f1e +size 395786922 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/4_client_model_round7.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/4_client_model_round7.pth new file mode 100644 index 0000000000000000000000000000000000000000..550f04f526586e5763b3599deda8d908765853ba --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/4_client_model_round7.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0134d8b32899bce233064517b4351b730008c7edb2aa48715e4246e6929ccbce +size 395786922 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/4_trainer_state.json b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/4_trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..3e2d0c0707f7a5aa810f56c4da98591010f0fc1f --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/4_trainer_state.json @@ -0,0 +1,392 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 1.0, + "eval_steps": 500, + "global_step": 100, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.02, + "grad_norm": 2.4937663078308105, + "learning_rate": 2e-05, + "loss": 0.3758, + "step": 2 + }, + { + "epoch": 0.04, + "grad_norm": 4.081711769104004, + "learning_rate": 2e-05, + "loss": 0.9716, + "step": 4 + }, + { + "epoch": 0.06, + "grad_norm": 1.1032688617706299, + "learning_rate": 2e-05, + "loss": 0.3824, + "step": 6 + }, + { + "epoch": 0.08, + "grad_norm": 1.991381287574768, + "learning_rate": 2e-05, + "loss": 0.6662, + "step": 8 + }, + { + "epoch": 0.1, + "grad_norm": 2.109754800796509, + "learning_rate": 2e-05, + "loss": 0.4761, + "step": 10 + }, + { + "epoch": 0.12, + "grad_norm": 2.8071582317352295, + "learning_rate": 2e-05, + "loss": 0.1944, + "step": 12 + }, + { + "epoch": 0.14, + "grad_norm": 4.594367504119873, + "learning_rate": 2e-05, + "loss": 0.6261, + "step": 14 + }, + { + "epoch": 0.16, + "grad_norm": 7.886587619781494, + "learning_rate": 2e-05, + "loss": 2.027, + "step": 16 + }, + { + "epoch": 0.18, + "grad_norm": 3.827627182006836, + "learning_rate": 2e-05, + "loss": 0.4236, + "step": 18 + }, + { + "epoch": 0.2, + "grad_norm": 6.038527011871338, + "learning_rate": 2e-05, + "loss": 0.4733, + "step": 20 + }, + { + "epoch": 0.22, + "grad_norm": 4.899626731872559, + "learning_rate": 2e-05, + "loss": 1.6886, + "step": 22 + }, + { + "epoch": 0.24, + "grad_norm": 2.1262969970703125, + "learning_rate": 2e-05, + "loss": 0.9716, + "step": 24 + }, + { + "epoch": 0.26, + "grad_norm": 3.1155662536621094, + "learning_rate": 2e-05, + "loss": 0.4385, + "step": 26 + }, + { + "epoch": 0.28, + "grad_norm": 5.111391067504883, + "learning_rate": 2e-05, + "loss": 1.064, + "step": 28 + }, + { + "epoch": 0.3, + "grad_norm": 4.286339282989502, + "learning_rate": 2e-05, + "loss": 0.8837, + "step": 30 + }, + { + "epoch": 0.32, + "grad_norm": 6.784238815307617, + "learning_rate": 2e-05, + "loss": 0.726, + "step": 32 + }, + { + "epoch": 0.34, + "grad_norm": 2.1785695552825928, + "learning_rate": 2e-05, + "loss": 0.4619, + "step": 34 + }, + { + "epoch": 0.36, + "grad_norm": 4.427624225616455, + "learning_rate": 2e-05, + "loss": 1.1757, + "step": 36 + }, + { + "epoch": 0.38, + "grad_norm": 3.2761521339416504, + "learning_rate": 2e-05, + "loss": 0.58, + "step": 38 + }, + { + "epoch": 0.4, + "grad_norm": 6.908085346221924, + "learning_rate": 2e-05, + "loss": 1.2319, + "step": 40 + }, + { + "epoch": 0.42, + "grad_norm": 3.5153822898864746, + "learning_rate": 2e-05, + "loss": 0.8656, + "step": 42 + }, + { + "epoch": 0.44, + "grad_norm": 4.410258769989014, + "learning_rate": 2e-05, + "loss": 0.6735, + "step": 44 + }, + { + "epoch": 0.46, + "grad_norm": 5.0626139640808105, + "learning_rate": 2e-05, + "loss": 0.9364, + "step": 46 + }, + { + "epoch": 0.48, + "grad_norm": 4.839291095733643, + "learning_rate": 2e-05, + "loss": 0.8002, + "step": 48 + }, + { + "epoch": 0.5, + "grad_norm": 2.034221887588501, + "learning_rate": 2e-05, + "loss": 0.455, + "step": 50 + }, + { + "epoch": 0.52, + "grad_norm": 4.509211540222168, + "learning_rate": 2e-05, + "loss": 1.578, + "step": 52 + }, + { + "epoch": 0.54, + "grad_norm": 4.306380748748779, + "learning_rate": 2e-05, + "loss": 0.7601, + "step": 54 + }, + { + "epoch": 0.56, + "grad_norm": 2.2897300720214844, + "learning_rate": 2e-05, + "loss": 0.2315, + "step": 56 + }, + { + "epoch": 0.58, + "grad_norm": 4.265103340148926, + "learning_rate": 2e-05, + "loss": 0.9205, + "step": 58 + }, + { + "epoch": 0.6, + "grad_norm": 3.1104488372802734, + "learning_rate": 2e-05, + "loss": 0.7684, + "step": 60 + }, + { + "epoch": 0.62, + "grad_norm": 3.652125597000122, + "learning_rate": 2e-05, + "loss": 0.6189, + "step": 62 + }, + { + "epoch": 0.64, + "grad_norm": 3.872218370437622, + "learning_rate": 2e-05, + "loss": 1.1104, + "step": 64 + }, + { + "epoch": 0.66, + "grad_norm": 6.816725730895996, + "learning_rate": 2e-05, + "loss": 0.9861, + "step": 66 + }, + { + "epoch": 0.68, + "grad_norm": 2.1225953102111816, + "learning_rate": 2e-05, + "loss": 0.735, + "step": 68 + }, + { + "epoch": 0.7, + "grad_norm": 7.632792949676514, + "learning_rate": 2e-05, + "loss": 0.9318, + "step": 70 + }, + { + "epoch": 0.72, + "grad_norm": 3.294650077819824, + "learning_rate": 2e-05, + "loss": 0.6072, + "step": 72 + }, + { + "epoch": 0.74, + "grad_norm": 0.8899891376495361, + "learning_rate": 2e-05, + "loss": 0.5501, + "step": 74 + }, + { + "epoch": 0.76, + "grad_norm": 3.8096601963043213, + "learning_rate": 2e-05, + "loss": 1.4906, + "step": 76 + }, + { + "epoch": 0.78, + "grad_norm": 4.652364730834961, + "learning_rate": 2e-05, + "loss": 0.7314, + "step": 78 + }, + { + "epoch": 0.8, + "grad_norm": 3.764209032058716, + "learning_rate": 2e-05, + "loss": 0.477, + "step": 80 + }, + { + "epoch": 0.82, + "grad_norm": 3.7325081825256348, + "learning_rate": 2e-05, + "loss": 0.5399, + "step": 82 + }, + { + "epoch": 0.84, + "grad_norm": 5.481297016143799, + "learning_rate": 2e-05, + "loss": 0.6222, + "step": 84 + }, + { + "epoch": 0.86, + "grad_norm": 2.3769960403442383, + "learning_rate": 2e-05, + "loss": 0.3539, + "step": 86 + }, + { + "epoch": 0.88, + "grad_norm": 3.286647081375122, + "learning_rate": 2e-05, + "loss": 0.5527, + "step": 88 + }, + { + "epoch": 0.9, + "grad_norm": 4.621764183044434, + "learning_rate": 2e-05, + "loss": 0.8604, + "step": 90 + }, + { + "epoch": 0.92, + "grad_norm": 6.542860984802246, + "learning_rate": 2e-05, + "loss": 0.7941, + "step": 92 + }, + { + "epoch": 0.94, + "grad_norm": 5.715937614440918, + "learning_rate": 2e-05, + "loss": 0.8467, + "step": 94 + }, + { + "epoch": 0.96, + "grad_norm": 2.689699411392212, + "learning_rate": 2e-05, + "loss": 0.6135, + "step": 96 + }, + { + "epoch": 0.98, + "grad_norm": 3.2868945598602295, + "learning_rate": 2e-05, + "loss": 0.2993, + "step": 98 + }, + { + "epoch": 1.0, + "grad_norm": 9.829119682312012, + "learning_rate": 2e-05, + "loss": 1.0146, + "step": 100 + }, + { + "epoch": 1.0, + "step": 100, + "total_flos": 5694661670731776.0, + "train_loss": 0.7712589836120606, + "train_runtime": 175.8339, + "train_samples_per_second": 2.275, + "train_steps_per_second": 0.569 + } + ], + "logging_steps": 2, + "max_steps": 100, + "num_input_tokens_seen": 0, + "num_train_epochs": 1, + "save_steps": 500, + "stateful_callbacks": { + "TrainerControl": { + "args": { + "should_epoch_stop": false, + "should_evaluate": false, + "should_log": false, + "should_save": false, + "should_training_stop": false + }, + "attributes": {} + } + }, + "total_flos": 5694661670731776.0, + "train_batch_size": 1, + "trial_name": null, + "trial_params": null +} diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/5_client_model_round10.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/5_client_model_round10.pth new file mode 100644 index 0000000000000000000000000000000000000000..a70d8808b153d7f7c378f9e8add24fd29eded3e2 --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/5_client_model_round10.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3161bd2d6d5a248b0baee1ee5cbe9a242b2262e52f646cbe17844aa0b55fca59 +size 395787774 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/5_client_model_round12.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/5_client_model_round12.pth new file mode 100644 index 0000000000000000000000000000000000000000..d34e3a4a1fef39bed2c3767bc28b94b333926c3f --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/5_client_model_round12.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22579505abed738cdb0fb5b0ef1fc9b48dd37c42c195aa2f2d3d60ec5c1845b8 +size 395787774 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/5_client_model_round15.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/5_client_model_round15.pth new file mode 100644 index 0000000000000000000000000000000000000000..140c0ca510540fb4e7efbb491b527350ce4a231e --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/5_client_model_round15.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22bb6c6c52adb579423077b76f895b24bf560602c5a6faa57e73c62fc78e12d5 +size 395787774 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/5_client_model_round17.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/5_client_model_round17.pth new file mode 100644 index 0000000000000000000000000000000000000000..f4ac010bd91a9cb055b50946f9c173ba6ec8ca66 --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/5_client_model_round17.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16f49b37b753ee72a6598e3ae68b9aeed992ac61fde5a802b001ec539fbff10a +size 395787774 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/5_client_model_round2.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/5_client_model_round2.pth new file mode 100644 index 0000000000000000000000000000000000000000..56a1de892e5fe432ce700610d8b3f275b1691e77 --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/5_client_model_round2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:659b0e8a4fe54c54110db837608c59fff7e4e2307d5013e2e0838c49a23016c7 +size 395786922 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/5_client_model_round20.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/5_client_model_round20.pth new file mode 100644 index 0000000000000000000000000000000000000000..92c42d5566211751452fd704d2774c359f8dd3b9 --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/5_client_model_round20.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b51b0b72734c99dbcf28665ab376a2d1f7e4229301e3da8483c8a7a11817891 +size 395787774 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/5_client_model_round5.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/5_client_model_round5.pth new file mode 100644 index 0000000000000000000000000000000000000000..45fc805188325abdd6c90c4b658ab93b644d1eed --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/5_client_model_round5.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bb40142315c96623fb95d183cba2384b6732311c59e0619b9706defb70d3287 +size 395786922 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/5_client_model_round7.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/5_client_model_round7.pth new file mode 100644 index 0000000000000000000000000000000000000000..310033561c863e1a8c8833a6bfa810cd7d34ec9b --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/5_client_model_round7.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2767ac5737d5388cfd774784cef2ac6fa80b70a02ed3976a33702cc021beafe1 +size 395786922 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/5_trainer_state.json b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/5_trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..fd0d5498bb926ab20e5b6d7dff39c3db53854b42 --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/5_trainer_state.json @@ -0,0 +1,392 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 1.0, + "eval_steps": 500, + "global_step": 100, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.02, + "grad_norm": 2.2397685050964355, + "learning_rate": 2e-05, + "loss": 2.292, + "step": 2 + }, + { + "epoch": 0.04, + "grad_norm": 5.843800067901611, + "learning_rate": 2e-05, + "loss": 1.1023, + "step": 4 + }, + { + "epoch": 0.06, + "grad_norm": 6.766488552093506, + "learning_rate": 2e-05, + "loss": 1.7336, + "step": 6 + }, + { + "epoch": 0.08, + "grad_norm": 4.335782051086426, + "learning_rate": 2e-05, + "loss": 0.6455, + "step": 8 + }, + { + "epoch": 0.1, + "grad_norm": 1.1837608814239502, + "learning_rate": 2e-05, + "loss": 0.423, + "step": 10 + }, + { + "epoch": 0.12, + "grad_norm": 8.192780494689941, + "learning_rate": 2e-05, + "loss": 1.0187, + "step": 12 + }, + { + "epoch": 0.14, + "grad_norm": 0.3664920926094055, + "learning_rate": 2e-05, + "loss": 0.3417, + "step": 14 + }, + { + "epoch": 0.16, + "grad_norm": 4.228869438171387, + "learning_rate": 2e-05, + "loss": 0.5203, + "step": 16 + }, + { + "epoch": 0.18, + "grad_norm": 5.254748821258545, + "learning_rate": 2e-05, + "loss": 1.6189, + "step": 18 + }, + { + "epoch": 0.2, + "grad_norm": 3.801438570022583, + "learning_rate": 2e-05, + "loss": 1.9009, + "step": 20 + }, + { + "epoch": 0.22, + "grad_norm": 7.5742692947387695, + "learning_rate": 2e-05, + "loss": 3.729, + "step": 22 + }, + { + "epoch": 0.24, + "grad_norm": 6.694967269897461, + "learning_rate": 2e-05, + "loss": 1.0309, + "step": 24 + }, + { + "epoch": 0.26, + "grad_norm": 5.33902645111084, + "learning_rate": 2e-05, + "loss": 1.0557, + "step": 26 + }, + { + "epoch": 0.28, + "grad_norm": 6.450504302978516, + "learning_rate": 2e-05, + "loss": 2.9573, + "step": 28 + }, + { + "epoch": 0.3, + "grad_norm": 0.5461809635162354, + "learning_rate": 2e-05, + "loss": 0.4397, + "step": 30 + }, + { + "epoch": 0.32, + "grad_norm": 1.7676559686660767, + "learning_rate": 2e-05, + "loss": 0.3504, + "step": 32 + }, + { + "epoch": 0.34, + "grad_norm": 1.6258739233016968, + "learning_rate": 2e-05, + "loss": 0.2323, + "step": 34 + }, + { + "epoch": 0.36, + "grad_norm": 6.4592485427856445, + "learning_rate": 2e-05, + "loss": 1.3458, + "step": 36 + }, + { + "epoch": 0.38, + "grad_norm": 4.838278770446777, + "learning_rate": 2e-05, + "loss": 1.1061, + "step": 38 + }, + { + "epoch": 0.4, + "grad_norm": 4.729245662689209, + "learning_rate": 2e-05, + "loss": 0.5425, + "step": 40 + }, + { + "epoch": 0.42, + "grad_norm": 6.380265712738037, + "learning_rate": 2e-05, + "loss": 1.0131, + "step": 42 + }, + { + "epoch": 0.44, + "grad_norm": 4.9066081047058105, + "learning_rate": 2e-05, + "loss": 0.694, + "step": 44 + }, + { + "epoch": 0.46, + "grad_norm": 3.9361062049865723, + "learning_rate": 2e-05, + "loss": 0.905, + "step": 46 + }, + { + "epoch": 0.48, + "grad_norm": 8.402027130126953, + "learning_rate": 2e-05, + "loss": 3.4478, + "step": 48 + }, + { + "epoch": 0.5, + "grad_norm": 12.549633979797363, + "learning_rate": 2e-05, + "loss": 4.6732, + "step": 50 + }, + { + "epoch": 0.52, + "grad_norm": 6.691660404205322, + "learning_rate": 2e-05, + "loss": 2.3466, + "step": 52 + }, + { + "epoch": 0.54, + "grad_norm": 2.8352389335632324, + "learning_rate": 2e-05, + "loss": 0.4344, + "step": 54 + }, + { + "epoch": 0.56, + "grad_norm": 13.197033882141113, + "learning_rate": 2e-05, + "loss": 1.5281, + "step": 56 + }, + { + "epoch": 0.58, + "grad_norm": 8.325194358825684, + "learning_rate": 2e-05, + "loss": 3.1061, + "step": 58 + }, + { + "epoch": 0.6, + "grad_norm": 1.6547410488128662, + "learning_rate": 2e-05, + "loss": 0.2293, + "step": 60 + }, + { + "epoch": 0.62, + "grad_norm": 3.7957839965820312, + "learning_rate": 2e-05, + "loss": 1.207, + "step": 62 + }, + { + "epoch": 0.64, + "grad_norm": 8.382137298583984, + "learning_rate": 2e-05, + "loss": 1.7802, + "step": 64 + }, + { + "epoch": 0.66, + "grad_norm": 3.426908493041992, + "learning_rate": 2e-05, + "loss": 0.6213, + "step": 66 + }, + { + "epoch": 0.68, + "grad_norm": 3.5080995559692383, + "learning_rate": 2e-05, + "loss": 0.8321, + "step": 68 + }, + { + "epoch": 0.7, + "grad_norm": 6.940305233001709, + "learning_rate": 2e-05, + "loss": 3.2279, + "step": 70 + }, + { + "epoch": 0.72, + "grad_norm": 2.6670947074890137, + "learning_rate": 2e-05, + "loss": 2.6391, + "step": 72 + }, + { + "epoch": 0.74, + "grad_norm": 0.31503769755363464, + "learning_rate": 2e-05, + "loss": 0.425, + "step": 74 + }, + { + "epoch": 0.76, + "grad_norm": 8.10043716430664, + "learning_rate": 2e-05, + "loss": 1.127, + "step": 76 + }, + { + "epoch": 0.78, + "grad_norm": 5.141766548156738, + "learning_rate": 2e-05, + "loss": 1.7443, + "step": 78 + }, + { + "epoch": 0.8, + "grad_norm": 6.595918655395508, + "learning_rate": 2e-05, + "loss": 0.9471, + "step": 80 + }, + { + "epoch": 0.82, + "grad_norm": 4.664250373840332, + "learning_rate": 2e-05, + "loss": 0.8069, + "step": 82 + }, + { + "epoch": 0.84, + "grad_norm": 3.9759442806243896, + "learning_rate": 2e-05, + "loss": 0.7474, + "step": 84 + }, + { + "epoch": 0.86, + "grad_norm": 2.457324504852295, + "learning_rate": 2e-05, + "loss": 0.3291, + "step": 86 + }, + { + "epoch": 0.88, + "grad_norm": 7.61952543258667, + "learning_rate": 2e-05, + "loss": 0.97, + "step": 88 + }, + { + "epoch": 0.9, + "grad_norm": 5.216441631317139, + "learning_rate": 2e-05, + "loss": 0.4906, + "step": 90 + }, + { + "epoch": 0.92, + "grad_norm": 11.298141479492188, + "learning_rate": 2e-05, + "loss": 1.4305, + "step": 92 + }, + { + "epoch": 0.94, + "grad_norm": 5.80995512008667, + "learning_rate": 2e-05, + "loss": 0.6481, + "step": 94 + }, + { + "epoch": 0.96, + "grad_norm": 10.62026596069336, + "learning_rate": 2e-05, + "loss": 4.9962, + "step": 96 + }, + { + "epoch": 0.98, + "grad_norm": 0.4833526015281677, + "learning_rate": 2e-05, + "loss": 2.6791, + "step": 98 + }, + { + "epoch": 1.0, + "grad_norm": 7.135585784912109, + "learning_rate": 2e-05, + "loss": 1.5141, + "step": 100 + }, + { + "epoch": 1.0, + "step": 100, + "total_flos": 4901658932805632.0, + "train_loss": 1.4385453033447266, + "train_runtime": 175.0121, + "train_samples_per_second": 2.286, + "train_steps_per_second": 0.571 + } + ], + "logging_steps": 2, + "max_steps": 100, + "num_input_tokens_seen": 0, + "num_train_epochs": 1, + "save_steps": 500, + "stateful_callbacks": { + "TrainerControl": { + "args": { + "should_epoch_stop": false, + "should_evaluate": false, + "should_log": false, + "should_save": false, + "should_training_stop": false + }, + "attributes": {} + } + }, + "total_flos": 4901658932805632.0, + "train_batch_size": 1, + "trial_name": null, + "trial_params": null +} diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/6_client_model_round10.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/6_client_model_round10.pth new file mode 100644 index 0000000000000000000000000000000000000000..6eca793a9da0754c6c4a7d9da597d9ff510db41e --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/6_client_model_round10.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a960721481263eb42927b2a6d9b3d8a06e0e37266c882007aaccd9d144f995c8 +size 395787774 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/6_client_model_round12.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/6_client_model_round12.pth new file mode 100644 index 0000000000000000000000000000000000000000..c44377bb4aba47620f0754a97cc04f977869de55 --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/6_client_model_round12.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af80c30ddcdcc7d8c7fc4af328b1a8096f9cd89c9e5c3ff39abb389d3a2d5680 +size 395787774 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/6_client_model_round15.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/6_client_model_round15.pth new file mode 100644 index 0000000000000000000000000000000000000000..221fcf5af1a3b7a271d75d7cf9cbed144a752127 --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/6_client_model_round15.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb10dfc82b254b37c9e063955ab915ad8c0e730023b98208a216a0c5a33f575f +size 395787774 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/6_client_model_round17.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/6_client_model_round17.pth new file mode 100644 index 0000000000000000000000000000000000000000..5b9af9fe3c920f6d1a825faffbc967c31da37efe --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/6_client_model_round17.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ac2285f4a4ee77ba01c552f2c4f99f23f410d8cd612f0043bacbc2515ce85b1 +size 395787774 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/6_client_model_round2.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/6_client_model_round2.pth new file mode 100644 index 0000000000000000000000000000000000000000..777da98c44cafad7a89b7a934d5270b37ec9b8b3 --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/6_client_model_round2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac71c11e24662cc1eb98f6e478852d37f1f35829aca02c8086ef2e2d2cf3c67d +size 395786922 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/6_client_model_round20.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/6_client_model_round20.pth new file mode 100644 index 0000000000000000000000000000000000000000..0ebba6d3f69cf9fd657fd16f67b11197682cad33 --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/6_client_model_round20.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:735c072caccdc1aa13be72110f491a1036ba437d7adb0c2a149980d4abf16801 +size 395787774 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/6_client_model_round5.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/6_client_model_round5.pth new file mode 100644 index 0000000000000000000000000000000000000000..47d62457af324c5dfb1b24654c161fe4825abffc --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/6_client_model_round5.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0cbb35c1c1f5aec45e9750707653552c0e25bed42b12ea7f87a9ec96765637f0 +size 395786922 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/6_client_model_round7.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/6_client_model_round7.pth new file mode 100644 index 0000000000000000000000000000000000000000..20d7dfc831b8c742e2c58f08190ed1f83dac05d0 --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/6_client_model_round7.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cdaeeef50ad48af2df84cef632102e2bc0f1d297fb0a11bd76526d94c82c144 +size 395786922 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/6_trainer_state.json b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/6_trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..5ee8c0dd5d5e3cd4771ca29bf63ca02dcccd9f3e --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/6_trainer_state.json @@ -0,0 +1,392 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 1.0, + "eval_steps": 500, + "global_step": 100, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.02, + "grad_norm": 6.307224750518799, + "learning_rate": 2e-05, + "loss": 1.115, + "step": 2 + }, + { + "epoch": 0.04, + "grad_norm": 7.356971740722656, + "learning_rate": 2e-05, + "loss": 0.9842, + "step": 4 + }, + { + "epoch": 0.06, + "grad_norm": 7.117051124572754, + "learning_rate": 2e-05, + "loss": 1.0228, + "step": 6 + }, + { + "epoch": 0.08, + "grad_norm": 2.492586135864258, + "learning_rate": 2e-05, + "loss": 0.8445, + "step": 8 + }, + { + "epoch": 0.1, + "grad_norm": 3.558971881866455, + "learning_rate": 2e-05, + "loss": 1.0108, + "step": 10 + }, + { + "epoch": 0.12, + "grad_norm": 1.3240742683410645, + "learning_rate": 2e-05, + "loss": 0.1641, + "step": 12 + }, + { + "epoch": 0.14, + "grad_norm": 5.103693008422852, + "learning_rate": 2e-05, + "loss": 0.7909, + "step": 14 + }, + { + "epoch": 0.16, + "grad_norm": 9.77467155456543, + "learning_rate": 2e-05, + "loss": 1.3086, + "step": 16 + }, + { + "epoch": 0.18, + "grad_norm": 7.322193145751953, + "learning_rate": 2e-05, + "loss": 1.9225, + "step": 18 + }, + { + "epoch": 0.2, + "grad_norm": 4.450613498687744, + "learning_rate": 2e-05, + "loss": 0.7064, + "step": 20 + }, + { + "epoch": 0.22, + "grad_norm": 4.778391361236572, + "learning_rate": 2e-05, + "loss": 0.6936, + "step": 22 + }, + { + "epoch": 0.24, + "grad_norm": 1.8592512607574463, + "learning_rate": 2e-05, + "loss": 0.5933, + "step": 24 + }, + { + "epoch": 0.26, + "grad_norm": 2.2050492763519287, + "learning_rate": 2e-05, + "loss": 0.7646, + "step": 26 + }, + { + "epoch": 0.28, + "grad_norm": 6.088590621948242, + "learning_rate": 2e-05, + "loss": 0.7946, + "step": 28 + }, + { + "epoch": 0.3, + "grad_norm": 7.113315105438232, + "learning_rate": 2e-05, + "loss": 1.4209, + "step": 30 + }, + { + "epoch": 0.32, + "grad_norm": 5.586048126220703, + "learning_rate": 2e-05, + "loss": 0.6265, + "step": 32 + }, + { + "epoch": 0.34, + "grad_norm": 2.8644750118255615, + "learning_rate": 2e-05, + "loss": 0.8747, + "step": 34 + }, + { + "epoch": 0.36, + "grad_norm": 3.1383635997772217, + "learning_rate": 2e-05, + "loss": 1.0125, + "step": 36 + }, + { + "epoch": 0.38, + "grad_norm": 2.7918667793273926, + "learning_rate": 2e-05, + "loss": 0.7816, + "step": 38 + }, + { + "epoch": 0.4, + "grad_norm": 2.3736815452575684, + "learning_rate": 2e-05, + "loss": 0.9258, + "step": 40 + }, + { + "epoch": 0.42, + "grad_norm": 3.0738043785095215, + "learning_rate": 2e-05, + "loss": 1.4477, + "step": 42 + }, + { + "epoch": 0.44, + "grad_norm": 4.376534461975098, + "learning_rate": 2e-05, + "loss": 0.5316, + "step": 44 + }, + { + "epoch": 0.46, + "grad_norm": 6.213242053985596, + "learning_rate": 2e-05, + "loss": 0.6979, + "step": 46 + }, + { + "epoch": 0.48, + "grad_norm": 4.48752498626709, + "learning_rate": 2e-05, + "loss": 0.7646, + "step": 48 + }, + { + "epoch": 0.5, + "grad_norm": 4.239739894866943, + "learning_rate": 2e-05, + "loss": 0.8866, + "step": 50 + }, + { + "epoch": 0.52, + "grad_norm": 1.9763928651809692, + "learning_rate": 2e-05, + "loss": 0.7327, + "step": 52 + }, + { + "epoch": 0.54, + "grad_norm": 4.0658416748046875, + "learning_rate": 2e-05, + "loss": 0.5961, + "step": 54 + }, + { + "epoch": 0.56, + "grad_norm": 4.59559965133667, + "learning_rate": 2e-05, + "loss": 1.6361, + "step": 56 + }, + { + "epoch": 0.58, + "grad_norm": 6.586665153503418, + "learning_rate": 2e-05, + "loss": 0.9268, + "step": 58 + }, + { + "epoch": 0.6, + "grad_norm": 4.163469314575195, + "learning_rate": 2e-05, + "loss": 1.2884, + "step": 60 + }, + { + "epoch": 0.62, + "grad_norm": 3.8198468685150146, + "learning_rate": 2e-05, + "loss": 0.6896, + "step": 62 + }, + { + "epoch": 0.64, + "grad_norm": 2.4655003547668457, + "learning_rate": 2e-05, + "loss": 0.843, + "step": 64 + }, + { + "epoch": 0.66, + "grad_norm": 2.3874995708465576, + "learning_rate": 2e-05, + "loss": 1.0933, + "step": 66 + }, + { + "epoch": 0.68, + "grad_norm": 5.565808296203613, + "learning_rate": 2e-05, + "loss": 0.916, + "step": 68 + }, + { + "epoch": 0.7, + "grad_norm": 3.9089648723602295, + "learning_rate": 2e-05, + "loss": 1.1177, + "step": 70 + }, + { + "epoch": 0.72, + "grad_norm": 2.1101279258728027, + "learning_rate": 2e-05, + "loss": 0.6678, + "step": 72 + }, + { + "epoch": 0.74, + "grad_norm": 10.827539443969727, + "learning_rate": 2e-05, + "loss": 1.4038, + "step": 74 + }, + { + "epoch": 0.76, + "grad_norm": 4.807355880737305, + "learning_rate": 2e-05, + "loss": 1.1112, + "step": 76 + }, + { + "epoch": 0.78, + "grad_norm": 2.5121877193450928, + "learning_rate": 2e-05, + "loss": 0.4111, + "step": 78 + }, + { + "epoch": 0.8, + "grad_norm": 4.019862651824951, + "learning_rate": 2e-05, + "loss": 0.4452, + "step": 80 + }, + { + "epoch": 0.82, + "grad_norm": 2.7739064693450928, + "learning_rate": 2e-05, + "loss": 0.7933, + "step": 82 + }, + { + "epoch": 0.84, + "grad_norm": 3.277104616165161, + "learning_rate": 2e-05, + "loss": 1.0657, + "step": 84 + }, + { + "epoch": 0.86, + "grad_norm": 3.6848294734954834, + "learning_rate": 2e-05, + "loss": 0.3286, + "step": 86 + }, + { + "epoch": 0.88, + "grad_norm": 2.36714768409729, + "learning_rate": 2e-05, + "loss": 0.7441, + "step": 88 + }, + { + "epoch": 0.9, + "grad_norm": 8.45163631439209, + "learning_rate": 2e-05, + "loss": 0.5177, + "step": 90 + }, + { + "epoch": 0.92, + "grad_norm": 2.2458860874176025, + "learning_rate": 2e-05, + "loss": 2.1702, + "step": 92 + }, + { + "epoch": 0.94, + "grad_norm": 3.1149096488952637, + "learning_rate": 2e-05, + "loss": 0.5806, + "step": 94 + }, + { + "epoch": 0.96, + "grad_norm": 10.000772476196289, + "learning_rate": 2e-05, + "loss": 0.811, + "step": 96 + }, + { + "epoch": 0.98, + "grad_norm": 7.507187366485596, + "learning_rate": 2e-05, + "loss": 1.3029, + "step": 98 + }, + { + "epoch": 1.0, + "grad_norm": 7.103931427001953, + "learning_rate": 2e-05, + "loss": 1.9712, + "step": 100 + }, + { + "epoch": 1.0, + "step": 100, + "total_flos": 9847400269086720.0, + "train_loss": 0.9370071792602539, + "train_runtime": 203.2202, + "train_samples_per_second": 1.968, + "train_steps_per_second": 0.492 + } + ], + "logging_steps": 2, + "max_steps": 100, + "num_input_tokens_seen": 0, + "num_train_epochs": 1, + "save_steps": 500, + "stateful_callbacks": { + "TrainerControl": { + "args": { + "should_epoch_stop": false, + "should_evaluate": false, + "should_log": false, + "should_save": false, + "should_training_stop": false + }, + "attributes": {} + } + }, + "total_flos": 9847400269086720.0, + "train_batch_size": 1, + "trial_name": null, + "trial_params": null +} diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/7_client_model_round10.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/7_client_model_round10.pth new file mode 100644 index 0000000000000000000000000000000000000000..0dbae05aa4dbf81bbc5673806e16a7ea177acb0a --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/7_client_model_round10.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f0c02774f5f5dee73bdf97f7adcd59162bb8939b28c1b9ee285ec8ea545451e +size 395787774 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/7_client_model_round12.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/7_client_model_round12.pth new file mode 100644 index 0000000000000000000000000000000000000000..ffc01ee292ccd49125387720d2cad9cdfe017653 --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/7_client_model_round12.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b8d4c92fa77704563763c35199d7dcaa6d88d0361e22eb24f856e393fe32e96 +size 395787774 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/7_client_model_round15.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/7_client_model_round15.pth new file mode 100644 index 0000000000000000000000000000000000000000..c0c78c96b0a74cf0642f08db0bc862da1e978c79 --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/7_client_model_round15.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b7179833cffca777f4d652205188c0ac37a5ec1d1a8c08595cc6bbf59f1efbe +size 395787774 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/7_client_model_round17.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/7_client_model_round17.pth new file mode 100644 index 0000000000000000000000000000000000000000..f9a4816f3406c150de13902f0f0e824af0181838 --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/7_client_model_round17.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad993243cb92006917d8a87c36f089c4650c9e43a099fa0b1c251a6648015884 +size 395787774 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/7_client_model_round2.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/7_client_model_round2.pth new file mode 100644 index 0000000000000000000000000000000000000000..ea7d49927d837d5a36b32a48eccb1e853aafddd4 --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/7_client_model_round2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0383397bf45729fc92c589ee53836d747c7bade8f57914d762bc832bd9c2dfd5 +size 395786922 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/7_client_model_round20.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/7_client_model_round20.pth new file mode 100644 index 0000000000000000000000000000000000000000..93419a3c834abbd7d798d11f59af952982b3a9cb --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/7_client_model_round20.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20ce4191f5379bcea498d9ac70c674d6724b33124d0dc9bdf411347529b2a93a +size 395787774 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/7_client_model_round5.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/7_client_model_round5.pth new file mode 100644 index 0000000000000000000000000000000000000000..345efcc5f0f2521aafc732ce699020a07efaaf8e --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/7_client_model_round5.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ef1fafb0b5dfea4ce0e8cdc5ba1b7148bec82ebfec84dec229d1a806802be3b +size 395786922 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/7_client_model_round7.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/7_client_model_round7.pth new file mode 100644 index 0000000000000000000000000000000000000000..bdfd6bf1c032c616fd17074e5f5327bd23dc5ebb --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/7_client_model_round7.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1dfa559cc92f973d9436ba8d3c63e41da2c75835e7ec0eacff25fe59a8c55cfa +size 395786922 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/7_trainer_state.json b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/7_trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..eab79297242cc2e1bd72864e5ee6062a1b6d2afe --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/7_trainer_state.json @@ -0,0 +1,392 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 1.0, + "eval_steps": 500, + "global_step": 100, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.02, + "grad_norm": 2.075194835662842, + "learning_rate": 2e-05, + "loss": 0.2355, + "step": 2 + }, + { + "epoch": 0.04, + "grad_norm": 7.024394989013672, + "learning_rate": 2e-05, + "loss": 0.7892, + "step": 4 + }, + { + "epoch": 0.06, + "grad_norm": 4.45875883102417, + "learning_rate": 2e-05, + "loss": 0.3564, + "step": 6 + }, + { + "epoch": 0.08, + "grad_norm": 3.9380457401275635, + "learning_rate": 2e-05, + "loss": 0.6826, + "step": 8 + }, + { + "epoch": 0.1, + "grad_norm": 4.519494533538818, + "learning_rate": 2e-05, + "loss": 1.1893, + "step": 10 + }, + { + "epoch": 0.12, + "grad_norm": 0.3247454762458801, + "learning_rate": 2e-05, + "loss": 0.0948, + "step": 12 + }, + { + "epoch": 0.14, + "grad_norm": 0.7168244123458862, + "learning_rate": 2e-05, + "loss": 0.0878, + "step": 14 + }, + { + "epoch": 0.16, + "grad_norm": 3.0584566593170166, + "learning_rate": 2e-05, + "loss": 0.7045, + "step": 16 + }, + { + "epoch": 0.18, + "grad_norm": 4.258686542510986, + "learning_rate": 2e-05, + "loss": 0.3559, + "step": 18 + }, + { + "epoch": 0.2, + "grad_norm": 4.993036270141602, + "learning_rate": 2e-05, + "loss": 0.339, + "step": 20 + }, + { + "epoch": 0.22, + "grad_norm": 0.9501545429229736, + "learning_rate": 2e-05, + "loss": 0.2888, + "step": 22 + }, + { + "epoch": 0.24, + "grad_norm": 5.39394998550415, + "learning_rate": 2e-05, + "loss": 0.5399, + "step": 24 + }, + { + "epoch": 0.26, + "grad_norm": 2.806152582168579, + "learning_rate": 2e-05, + "loss": 0.1803, + "step": 26 + }, + { + "epoch": 0.28, + "grad_norm": 2.9089674949645996, + "learning_rate": 2e-05, + "loss": 0.4021, + "step": 28 + }, + { + "epoch": 0.3, + "grad_norm": 0.8899468779563904, + "learning_rate": 2e-05, + "loss": 1.0888, + "step": 30 + }, + { + "epoch": 0.32, + "grad_norm": 2.5916614532470703, + "learning_rate": 2e-05, + "loss": 0.6287, + "step": 32 + }, + { + "epoch": 0.34, + "grad_norm": 4.793196201324463, + "learning_rate": 2e-05, + "loss": 0.2232, + "step": 34 + }, + { + "epoch": 0.36, + "grad_norm": 5.91644811630249, + "learning_rate": 2e-05, + "loss": 1.0159, + "step": 36 + }, + { + "epoch": 0.38, + "grad_norm": 0.886712908744812, + "learning_rate": 2e-05, + "loss": 0.1432, + "step": 38 + }, + { + "epoch": 0.4, + "grad_norm": 10.200862884521484, + "learning_rate": 2e-05, + "loss": 1.5581, + "step": 40 + }, + { + "epoch": 0.42, + "grad_norm": 0.6580986380577087, + "learning_rate": 2e-05, + "loss": 0.7196, + "step": 42 + }, + { + "epoch": 0.44, + "grad_norm": 4.799409866333008, + "learning_rate": 2e-05, + "loss": 0.2863, + "step": 44 + }, + { + "epoch": 0.46, + "grad_norm": 3.3804738521575928, + "learning_rate": 2e-05, + "loss": 0.6672, + "step": 46 + }, + { + "epoch": 0.48, + "grad_norm": 0.5281198024749756, + "learning_rate": 2e-05, + "loss": 0.0268, + "step": 48 + }, + { + "epoch": 0.5, + "grad_norm": 0.2971135079860687, + "learning_rate": 2e-05, + "loss": 1.136, + "step": 50 + }, + { + "epoch": 0.52, + "grad_norm": 3.925748586654663, + "learning_rate": 2e-05, + "loss": 1.2607, + "step": 52 + }, + { + "epoch": 0.54, + "grad_norm": 0.07698030769824982, + "learning_rate": 2e-05, + "loss": 0.8335, + "step": 54 + }, + { + "epoch": 0.56, + "grad_norm": 0.6261088252067566, + "learning_rate": 2e-05, + "loss": 0.0457, + "step": 56 + }, + { + "epoch": 0.58, + "grad_norm": 0.6530467867851257, + "learning_rate": 2e-05, + "loss": 0.3342, + "step": 58 + }, + { + "epoch": 0.6, + "grad_norm": 11.174809455871582, + "learning_rate": 2e-05, + "loss": 2.2703, + "step": 60 + }, + { + "epoch": 0.62, + "grad_norm": 0.7203944325447083, + "learning_rate": 2e-05, + "loss": 0.1156, + "step": 62 + }, + { + "epoch": 0.64, + "grad_norm": 5.600475788116455, + "learning_rate": 2e-05, + "loss": 0.9326, + "step": 64 + }, + { + "epoch": 0.66, + "grad_norm": 1.8899449110031128, + "learning_rate": 2e-05, + "loss": 0.2164, + "step": 66 + }, + { + "epoch": 0.68, + "grad_norm": 2.4691033363342285, + "learning_rate": 2e-05, + "loss": 0.2476, + "step": 68 + }, + { + "epoch": 0.7, + "grad_norm": 6.158054351806641, + "learning_rate": 2e-05, + "loss": 0.8985, + "step": 70 + }, + { + "epoch": 0.72, + "grad_norm": 4.086432933807373, + "learning_rate": 2e-05, + "loss": 0.6389, + "step": 72 + }, + { + "epoch": 0.74, + "grad_norm": 5.535611152648926, + "learning_rate": 2e-05, + "loss": 0.8095, + "step": 74 + }, + { + "epoch": 0.76, + "grad_norm": 1.199110507965088, + "learning_rate": 2e-05, + "loss": 0.7349, + "step": 76 + }, + { + "epoch": 0.78, + "grad_norm": 1.6551374197006226, + "learning_rate": 2e-05, + "loss": 0.6597, + "step": 78 + }, + { + "epoch": 0.8, + "grad_norm": 8.437272071838379, + "learning_rate": 2e-05, + "loss": 1.8802, + "step": 80 + }, + { + "epoch": 0.82, + "grad_norm": 2.3758037090301514, + "learning_rate": 2e-05, + "loss": 0.2584, + "step": 82 + }, + { + "epoch": 0.84, + "grad_norm": 3.262869358062744, + "learning_rate": 2e-05, + "loss": 0.3643, + "step": 84 + }, + { + "epoch": 0.86, + "grad_norm": 3.8833999633789062, + "learning_rate": 2e-05, + "loss": 1.4019, + "step": 86 + }, + { + "epoch": 0.88, + "grad_norm": 7.607229709625244, + "learning_rate": 2e-05, + "loss": 1.242, + "step": 88 + }, + { + "epoch": 0.9, + "grad_norm": 2.9136269092559814, + "learning_rate": 2e-05, + "loss": 1.145, + "step": 90 + }, + { + "epoch": 0.92, + "grad_norm": 0.8148103356361389, + "learning_rate": 2e-05, + "loss": 0.2827, + "step": 92 + }, + { + "epoch": 0.94, + "grad_norm": 2.1555514335632324, + "learning_rate": 2e-05, + "loss": 0.2034, + "step": 94 + }, + { + "epoch": 0.96, + "grad_norm": 0.28481525182724, + "learning_rate": 2e-05, + "loss": 0.2578, + "step": 96 + }, + { + "epoch": 0.98, + "grad_norm": 2.7964327335357666, + "learning_rate": 2e-05, + "loss": 0.3366, + "step": 98 + }, + { + "epoch": 1.0, + "grad_norm": 4.562732219696045, + "learning_rate": 2e-05, + "loss": 0.3768, + "step": 100 + }, + { + "epoch": 1.0, + "step": 100, + "total_flos": 5158236269314048.0, + "train_loss": 0.6297415280342102, + "train_runtime": 176.8315, + "train_samples_per_second": 2.262, + "train_steps_per_second": 0.566 + } + ], + "logging_steps": 2, + "max_steps": 100, + "num_input_tokens_seen": 0, + "num_train_epochs": 1, + "save_steps": 500, + "stateful_callbacks": { + "TrainerControl": { + "args": { + "should_epoch_stop": false, + "should_evaluate": false, + "should_log": false, + "should_save": false, + "should_training_stop": false + }, + "attributes": {} + } + }, + "total_flos": 5158236269314048.0, + "train_batch_size": 1, + "trial_name": null, + "trial_params": null +} diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/8_client_model_round10.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/8_client_model_round10.pth new file mode 100644 index 0000000000000000000000000000000000000000..5f7fd3cddb24af9c263a51736b1f0a946e41a720 --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/8_client_model_round10.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:934c0095c5882d5474db44973d866edc1133621afecf3313a77eb3e9255fdad6 +size 395787774 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/8_client_model_round12.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/8_client_model_round12.pth new file mode 100644 index 0000000000000000000000000000000000000000..49eb3714997ff8aade1773225ecb12286c79f7a8 --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/8_client_model_round12.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba7e5848862fd42a6eaf5010de537b8280cc984b25a5f119e7b4f85f6284d5c3 +size 395787774 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/8_client_model_round15.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/8_client_model_round15.pth new file mode 100644 index 0000000000000000000000000000000000000000..06d37857cd66f6faa5e6cae0f93c2df57d65b391 --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/8_client_model_round15.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b9229bba1a8f4a807efd4ce5fb6fbd8c00fae517f67ef6392cea0cc60c8a1f9 +size 395787774 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/8_client_model_round17.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/8_client_model_round17.pth new file mode 100644 index 0000000000000000000000000000000000000000..6160567cf662fc83d55a92eab03d22dff6c43984 --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/8_client_model_round17.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f7612aae3872b4e58b054db5064329b52aaed8cab0d3c30897543ada1af1fa2 +size 395787774 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/8_client_model_round2.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/8_client_model_round2.pth new file mode 100644 index 0000000000000000000000000000000000000000..f7dee50088ea63f1e5587c94a2c7bec1c7c5d908 --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/8_client_model_round2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78a3bdab4880f300e6a13ad0860485255d76aa6fd73adfe5c7fd9fcba536a59c +size 395786922 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/8_client_model_round20.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/8_client_model_round20.pth new file mode 100644 index 0000000000000000000000000000000000000000..1f4ba6adbc59dd393fe19aca0072e0fc99a80e18 --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/8_client_model_round20.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1d034fce7a2b4bc47afa15e48d0fcdf214a64df5f2a669c0ee2763131b998a3 +size 395787774 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/8_client_model_round5.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/8_client_model_round5.pth new file mode 100644 index 0000000000000000000000000000000000000000..467c3b5e82932df85631608b73a01b2803a4e5ad --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/8_client_model_round5.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:754ffb94594a35013a54e9629add0d47c127d4e19df79ced8feef4ac289a7c21 +size 395786922 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/8_client_model_round7.pth b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/8_client_model_round7.pth new file mode 100644 index 0000000000000000000000000000000000000000..6d691ee7fcb6a4b960673e8bc1172f65b2f28d59 --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/8_client_model_round7.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7483c227341b694212723920c3de94e37bfac540fdaab3cd067085367237423 +size 395786922 diff --git a/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/8_trainer_state.json b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/8_trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..3251513e76566d3ec09d0f7e12ef467f29b26b4f --- /dev/null +++ b/client_states_fedMulti05pqfullfreeze_homoAgg_pca_bs4_saveoptim_lr2e-5_5e-5_sc315_4tasks_5rounds_fixitr100_T0125_decay099/8_trainer_state.json @@ -0,0 +1,392 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 1.0, + "eval_steps": 500, + "global_step": 100, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.02, + "grad_norm": 0.08565213531255722, + "learning_rate": 2e-05, + "loss": 0.7344, + "step": 2 + }, + { + "epoch": 0.04, + "grad_norm": 0.06497110426425934, + "learning_rate": 2e-05, + "loss": 0.1216, + "step": 4 + }, + { + "epoch": 0.06, + "grad_norm": 0.1544884890317917, + "learning_rate": 2e-05, + "loss": 0.101, + "step": 6 + }, + { + "epoch": 0.08, + "grad_norm": 2.355877637863159, + "learning_rate": 2e-05, + "loss": 0.428, + "step": 8 + }, + { + "epoch": 0.1, + "grad_norm": 0.06318658590316772, + "learning_rate": 2e-05, + "loss": 0.004, + "step": 10 + }, + { + "epoch": 0.12, + "grad_norm": 2.7905097007751465, + "learning_rate": 2e-05, + "loss": 0.1847, + "step": 12 + }, + { + "epoch": 0.14, + "grad_norm": 0.10775388032197952, + "learning_rate": 2e-05, + "loss": 0.4969, + "step": 14 + }, + { + "epoch": 0.16, + "grad_norm": 9.429287910461426, + "learning_rate": 2e-05, + "loss": 1.1262, + "step": 16 + }, + { + "epoch": 0.18, + "grad_norm": 2.2753570079803467, + "learning_rate": 2e-05, + "loss": 0.2309, + "step": 18 + }, + { + "epoch": 0.2, + "grad_norm": 6.7658185958862305, + "learning_rate": 2e-05, + "loss": 4.0641, + "step": 20 + }, + { + "epoch": 0.22, + "grad_norm": 4.763914108276367, + "learning_rate": 2e-05, + "loss": 0.6948, + "step": 22 + }, + { + "epoch": 0.24, + "grad_norm": 1.2038241624832153, + "learning_rate": 2e-05, + "loss": 0.5692, + "step": 24 + }, + { + "epoch": 0.26, + "grad_norm": 1.3842836618423462, + "learning_rate": 2e-05, + "loss": 0.1697, + "step": 26 + }, + { + "epoch": 0.28, + "grad_norm": 2.252963066101074, + "learning_rate": 2e-05, + "loss": 0.1263, + "step": 28 + }, + { + "epoch": 0.3, + "grad_norm": 4.557061195373535, + "learning_rate": 2e-05, + "loss": 0.2119, + "step": 30 + }, + { + "epoch": 0.32, + "grad_norm": 0.14750222861766815, + "learning_rate": 2e-05, + "loss": 0.011, + "step": 32 + }, + { + "epoch": 0.34, + "grad_norm": 4.016882419586182, + "learning_rate": 2e-05, + "loss": 1.6461, + "step": 34 + }, + { + "epoch": 0.36, + "grad_norm": 1.9945074319839478, + "learning_rate": 2e-05, + "loss": 0.6854, + "step": 36 + }, + { + "epoch": 0.38, + "grad_norm": 5.750539302825928, + "learning_rate": 2e-05, + "loss": 1.0438, + "step": 38 + }, + { + "epoch": 0.4, + "grad_norm": 2.6533830165863037, + "learning_rate": 2e-05, + "loss": 1.012, + "step": 40 + }, + { + "epoch": 0.42, + "grad_norm": 8.021306037902832, + "learning_rate": 2e-05, + "loss": 0.956, + "step": 42 + }, + { + "epoch": 0.44, + "grad_norm": 0.0037975588347762823, + "learning_rate": 2e-05, + "loss": 0.1428, + "step": 44 + }, + { + "epoch": 0.46, + "grad_norm": 4.191558837890625, + "learning_rate": 2e-05, + "loss": 0.7227, + "step": 46 + }, + { + "epoch": 0.48, + "grad_norm": 5.117783546447754, + "learning_rate": 2e-05, + "loss": 0.8492, + "step": 48 + }, + { + "epoch": 0.5, + "grad_norm": 0.8057326078414917, + "learning_rate": 2e-05, + "loss": 0.4933, + "step": 50 + }, + { + "epoch": 0.52, + "grad_norm": 0.07272912561893463, + "learning_rate": 2e-05, + "loss": 0.4327, + "step": 52 + }, + { + "epoch": 0.54, + "grad_norm": 0.5037710666656494, + "learning_rate": 2e-05, + "loss": 0.8718, + "step": 54 + }, + { + "epoch": 0.56, + "grad_norm": 2.6512057781219482, + "learning_rate": 2e-05, + "loss": 0.809, + "step": 56 + }, + { + "epoch": 0.58, + "grad_norm": 1.944377064704895, + "learning_rate": 2e-05, + "loss": 0.1457, + "step": 58 + }, + { + "epoch": 0.6, + "grad_norm": 0.08046957105398178, + "learning_rate": 2e-05, + "loss": 0.0219, + "step": 60 + }, + { + "epoch": 0.62, + "grad_norm": 5.218014240264893, + "learning_rate": 2e-05, + "loss": 0.3664, + "step": 62 + }, + { + "epoch": 0.64, + "grad_norm": 8.094252586364746, + "learning_rate": 2e-05, + "loss": 1.349, + "step": 64 + }, + { + "epoch": 0.66, + "grad_norm": 3.5652830600738525, + "learning_rate": 2e-05, + "loss": 0.2475, + "step": 66 + }, + { + "epoch": 0.68, + "grad_norm": 0.16974720358848572, + "learning_rate": 2e-05, + "loss": 0.0263, + "step": 68 + }, + { + "epoch": 0.7, + "grad_norm": 0.28704845905303955, + "learning_rate": 2e-05, + "loss": 0.0293, + "step": 70 + }, + { + "epoch": 0.72, + "grad_norm": 4.832737922668457, + "learning_rate": 2e-05, + "loss": 0.3632, + "step": 72 + }, + { + "epoch": 0.74, + "grad_norm": 0.6874464154243469, + "learning_rate": 2e-05, + "loss": 0.0381, + "step": 74 + }, + { + "epoch": 0.76, + "grad_norm": 0.7270686030387878, + "learning_rate": 2e-05, + "loss": 0.0589, + "step": 76 + }, + { + "epoch": 0.78, + "grad_norm": 0.2944982349872589, + "learning_rate": 2e-05, + "loss": 0.2251, + "step": 78 + }, + { + "epoch": 0.8, + "grad_norm": 0.3541363775730133, + "learning_rate": 2e-05, + "loss": 0.1346, + "step": 80 + }, + { + "epoch": 0.82, + "grad_norm": 7.80084228515625, + "learning_rate": 2e-05, + "loss": 0.9932, + "step": 82 + }, + { + "epoch": 0.84, + "grad_norm": 0.5896197557449341, + "learning_rate": 2e-05, + "loss": 0.0312, + "step": 84 + }, + { + "epoch": 0.86, + "grad_norm": 0.227444127202034, + "learning_rate": 2e-05, + "loss": 0.0156, + "step": 86 + }, + { + "epoch": 0.88, + "grad_norm": 3.0514039993286133, + "learning_rate": 2e-05, + "loss": 0.1752, + "step": 88 + }, + { + "epoch": 0.9, + "grad_norm": 2.489921808242798, + "learning_rate": 2e-05, + "loss": 0.5978, + "step": 90 + }, + { + "epoch": 0.92, + "grad_norm": 9.141898155212402, + "learning_rate": 2e-05, + "loss": 1.3444, + "step": 92 + }, + { + "epoch": 0.94, + "grad_norm": 0.2494216114282608, + "learning_rate": 2e-05, + "loss": 0.0128, + "step": 94 + }, + { + "epoch": 0.96, + "grad_norm": 0.3338507115840912, + "learning_rate": 2e-05, + "loss": 0.1223, + "step": 96 + }, + { + "epoch": 0.98, + "grad_norm": 0.6613537669181824, + "learning_rate": 2e-05, + "loss": 0.0278, + "step": 98 + }, + { + "epoch": 1.0, + "grad_norm": 0.263392835855484, + "learning_rate": 2e-05, + "loss": 0.0347, + "step": 100 + }, + { + "epoch": 1.0, + "step": 100, + "total_flos": 5020151544020992.0, + "train_loss": 0.5060164135694504, + "train_runtime": 178.2381, + "train_samples_per_second": 2.244, + "train_steps_per_second": 0.561 + } + ], + "logging_steps": 2, + "max_steps": 100, + "num_input_tokens_seen": 0, + "num_train_epochs": 1, + "save_steps": 500, + "stateful_callbacks": { + "TrainerControl": { + "args": { + "should_epoch_stop": false, + "should_evaluate": false, + "should_log": false, + "should_save": false, + "should_training_stop": false + }, + "attributes": {} + } + }, + "total_flos": 5020151544020992.0, + "train_batch_size": 1, + "trial_name": null, + "trial_params": null +}