Jeremiah Zhou
		
	committed on
		
		
					Commit 
							
							·
						
						52163ed
	
1
								Parent(s):
							
							30c5adb
								
End of training
Browse files
    	
        all_results.json
    ADDED
    
    | @@ -0,0 +1,14 @@ | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            {
         | 
| 2 | 
            +
                "epoch": 3.0,
         | 
| 3 | 
            +
                "eval_loss": 0.5405848622322083,
         | 
| 4 | 
            +
                "eval_matthews_correlation": 0.5880094937717885,
         | 
| 5 | 
            +
                "eval_runtime": 5.0883,
         | 
| 6 | 
            +
                "eval_samples": 1043,
         | 
| 7 | 
            +
                "eval_samples_per_second": 204.979,
         | 
| 8 | 
            +
                "eval_steps_per_second": 25.745,
         | 
| 9 | 
            +
                "train_loss": 0.31582939565478274,
         | 
| 10 | 
            +
                "train_runtime": 345.3367,
         | 
| 11 | 
            +
                "train_samples": 8551,
         | 
| 12 | 
            +
                "train_samples_per_second": 74.284,
         | 
| 13 | 
            +
                "train_steps_per_second": 2.328
         | 
| 14 | 
            +
            }
         | 
    	
        eval_results.json
    ADDED
    
    | @@ -0,0 +1,9 @@ | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            {
         | 
| 2 | 
            +
                "epoch": 3.0,
         | 
| 3 | 
            +
                "eval_loss": 0.5405848622322083,
         | 
| 4 | 
            +
                "eval_matthews_correlation": 0.5880094937717885,
         | 
| 5 | 
            +
                "eval_runtime": 5.0883,
         | 
| 6 | 
            +
                "eval_samples": 1043,
         | 
| 7 | 
            +
                "eval_samples_per_second": 204.979,
         | 
| 8 | 
            +
                "eval_steps_per_second": 25.745
         | 
| 9 | 
            +
            }
         | 
    	
        runs/Jun21_21-11-15_pikachu/events.out.tfevents.1655817742.pikachu.3270481.2
    ADDED
    
    | @@ -0,0 +1,3 @@ | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:0e0efc5f3050ce0ee3718c306aade21a40878b6826de5596cc7095f6f9a7f2b6
         | 
| 3 | 
            +
            size 375
         | 
    	
        train_results.json
    ADDED
    
    | @@ -0,0 +1,8 @@ | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            {
         | 
| 2 | 
            +
                "epoch": 3.0,
         | 
| 3 | 
            +
                "train_loss": 0.31582939565478274,
         | 
| 4 | 
            +
                "train_runtime": 345.3367,
         | 
| 5 | 
            +
                "train_samples": 8551,
         | 
| 6 | 
            +
                "train_samples_per_second": 74.284,
         | 
| 7 | 
            +
                "train_steps_per_second": 2.328
         | 
| 8 | 
            +
            }
         | 
    	
        trainer_state.json
    ADDED
    
    | @@ -0,0 +1,58 @@ | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            {
         | 
| 2 | 
            +
              "best_metric": 0.5880094937717885,
         | 
| 3 | 
            +
              "best_model_checkpoint": "./fine-tune/bert-base-uncased/cola/checkpoint-804",
         | 
| 4 | 
            +
              "epoch": 3.0,
         | 
| 5 | 
            +
              "global_step": 804,
         | 
| 6 | 
            +
              "is_hyper_param_search": false,
         | 
| 7 | 
            +
              "is_local_process_zero": true,
         | 
| 8 | 
            +
              "is_world_process_zero": true,
         | 
| 9 | 
            +
              "log_history": [
         | 
| 10 | 
            +
                {
         | 
| 11 | 
            +
                  "epoch": 1.0,
         | 
| 12 | 
            +
                  "eval_loss": 0.45977166295051575,
         | 
| 13 | 
            +
                  "eval_matthews_correlation": 0.5134946392219878,
         | 
| 14 | 
            +
                  "eval_runtime": 5.9561,
         | 
| 15 | 
            +
                  "eval_samples_per_second": 175.115,
         | 
| 16 | 
            +
                  "eval_steps_per_second": 21.994,
         | 
| 17 | 
            +
                  "step": 268
         | 
| 18 | 
            +
                },
         | 
| 19 | 
            +
                {
         | 
| 20 | 
            +
                  "epoch": 1.87,
         | 
| 21 | 
            +
                  "learning_rate": 7.5621890547263685e-06,
         | 
| 22 | 
            +
                  "loss": 0.393,
         | 
| 23 | 
            +
                  "step": 500
         | 
| 24 | 
            +
                },
         | 
| 25 | 
            +
                {
         | 
| 26 | 
            +
                  "epoch": 2.0,
         | 
| 27 | 
            +
                  "eval_loss": 0.4875448942184448,
         | 
| 28 | 
            +
                  "eval_matthews_correlation": 0.5573424050983508,
         | 
| 29 | 
            +
                  "eval_runtime": 2.8786,
         | 
| 30 | 
            +
                  "eval_samples_per_second": 362.324,
         | 
| 31 | 
            +
                  "eval_steps_per_second": 45.508,
         | 
| 32 | 
            +
                  "step": 536
         | 
| 33 | 
            +
                },
         | 
| 34 | 
            +
                {
         | 
| 35 | 
            +
                  "epoch": 3.0,
         | 
| 36 | 
            +
                  "eval_loss": 0.5405848622322083,
         | 
| 37 | 
            +
                  "eval_matthews_correlation": 0.5880094937717885,
         | 
| 38 | 
            +
                  "eval_runtime": 5.5175,
         | 
| 39 | 
            +
                  "eval_samples_per_second": 189.036,
         | 
| 40 | 
            +
                  "eval_steps_per_second": 23.743,
         | 
| 41 | 
            +
                  "step": 804
         | 
| 42 | 
            +
                },
         | 
| 43 | 
            +
                {
         | 
| 44 | 
            +
                  "epoch": 3.0,
         | 
| 45 | 
            +
                  "step": 804,
         | 
| 46 | 
            +
                  "total_flos": 1687396975787520.0,
         | 
| 47 | 
            +
                  "train_loss": 0.31582939565478274,
         | 
| 48 | 
            +
                  "train_runtime": 345.3367,
         | 
| 49 | 
            +
                  "train_samples_per_second": 74.284,
         | 
| 50 | 
            +
                  "train_steps_per_second": 2.328
         | 
| 51 | 
            +
                }
         | 
| 52 | 
            +
              ],
         | 
| 53 | 
            +
              "max_steps": 804,
         | 
| 54 | 
            +
              "num_train_epochs": 3,
         | 
| 55 | 
            +
              "total_flos": 1687396975787520.0,
         | 
| 56 | 
            +
              "trial_name": null,
         | 
| 57 | 
            +
              "trial_params": null
         | 
| 58 | 
            +
            }
         |