jnmrr committed on Aug 14

Commit

d5038e0

verified ·

1 Parent(s): 3a530fe

Upload RT-DETRv2 voucher classifier

Browse files

Files changed (44) hide show

README.md +15 -15
checkpoint-3520/config.json +129 -0
checkpoint-3520/model.safetensors +3 -0
checkpoint-3520/optimizer.pt +3 -0
checkpoint-3520/preprocessor_config.json +26 -0
checkpoint-3520/rng_state.pth +3 -0
checkpoint-3520/scheduler.pt +3 -0
checkpoint-3520/trainer_state.json +482 -0
checkpoint-3520/training_args.bin +3 -0
checkpoint-3740/config.json +129 -0
checkpoint-3740/model.safetensors +3 -0
checkpoint-3740/optimizer.pt +3 -0
checkpoint-3740/preprocessor_config.json +26 -0
checkpoint-3740/rng_state.pth +3 -0
checkpoint-3740/scheduler.pt +3 -0
checkpoint-3740/trainer_state.json +510 -0
checkpoint-3740/training_args.bin +3 -0
checkpoint-3960/config.json +129 -0
checkpoint-3960/model.safetensors +3 -0
checkpoint-3960/optimizer.pt +3 -0
checkpoint-3960/preprocessor_config.json +26 -0
checkpoint-3960/rng_state.pth +3 -0
checkpoint-3960/scheduler.pt +3 -0
checkpoint-3960/trainer_state.json +538 -0
checkpoint-3960/training_args.bin +3 -0
checkpoint-4180/config.json +129 -0
checkpoint-4180/model.safetensors +3 -0
checkpoint-4180/optimizer.pt +3 -0
checkpoint-4180/preprocessor_config.json +26 -0
checkpoint-4180/rng_state.pth +3 -0
checkpoint-4180/scheduler.pt +3 -0
checkpoint-4180/trainer_state.json +566 -0
checkpoint-4180/training_args.bin +3 -0
checkpoint-4235/config.json +129 -0
checkpoint-4235/model.safetensors +3 -0
checkpoint-4235/optimizer.pt +3 -0
checkpoint-4235/preprocessor_config.json +26 -0
checkpoint-4235/rng_state.pth +3 -0
checkpoint-4235/scheduler.pt +3 -0
checkpoint-4235/trainer_state.json +573 -0
checkpoint-4235/training_args.bin +3 -0
config.json +1 -1
model.safetensors +1 -1
training_args.bin +2 -2

README.md CHANGED Viewed

@@ -44,11 +44,11 @@ This model is a fine-tuned version of [PekingU/rtdetr_v2_r101vd](https://hugging
 **Training Configuration:**
-- **Image Size**: 800x800
-- **Batch Size**: 24
-- **Learning Rate**: 1.5e-05
 - **Weight Decay**: 0.0001
-- **Epochs**: 50
 - **Validation Split**: 0.0
 **Data Processing:**
@@ -104,26 +104,26 @@ This model is a fine-tuned version of [PekingU/rtdetr_v2_r101vd](https://hugging
 **Model Configuration:**
 - **Base model**: PekingU/rtdetr_v2_r101vd
 - **Architecture**: rtdetr_v2_r101vd
-- **Input resolution**: 800×800 pixels
-- **Training epochs**: 50
-- **Batch size**: 24
 **Training Hardware:**
-- **GPU**: NVIDIA A100-SXM4-40GB
-- **VRAM**: 39.6 GB
-- **RAM**: 83.5 GB
-- **GPU configuration**: A100 optimized
-**Training Time**: 1.18 hours
 **Training Summary:**
-- **Final training loss**: 196.0164
-- **Final learning rate**: 6.00e-08
 ### MLflow Tracking
-- **MLflow Run ID**: fe7bd26bd1b344c292d9b485139be46c
 - **MLflow Experiment**: RT-DETRv2_Voucher_Classification

 **Training Configuration:**
+- **Image Size**: 832x832
+- **Batch Size**: 28
+- **Learning Rate**: 1.4e-05
 - **Weight Decay**: 0.0001
+- **Epochs**: 55
 - **Validation Split**: 0.0
 **Data Processing:**
 **Model Configuration:**
 - **Base model**: PekingU/rtdetr_v2_r101vd
 - **Architecture**: rtdetr_v2_r101vd
+- **Input resolution**: 832×832 pixels
+- **Training epochs**: 55
+- **Batch size**: 28
 **Training Hardware:**
+- **GPU**: NVIDIA L40S
+- **VRAM**: 44.4 GB
+- **RAM**: 62.8 GB
+- **GPU configuration**: L40S optimized
+**Training Time**: 1.36 hours
 **Training Summary:**
+- **Final training loss**: 120.5679
+- **Final learning rate**: 6.88e-09
 ### MLflow Tracking
+- **MLflow Run ID**: f6bc3ebbbaa44f88bf184d07d93356ff
 - **MLflow Experiment**: RT-DETRv2_Voucher_Classification

checkpoint-3520/config.json ADDED Viewed

	@@ -0,0 +1,129 @@

+{
+  "activation_dropout": 0.0,
+  "activation_function": "silu",
+  "anchor_image_size": null,
+  "architectures": [
+    "RTDetrV2ForObjectDetection"
+  ],
+  "attention_dropout": 0.0,
+  "auxiliary_loss": true,
+  "backbone": null,
+  "backbone_config": {
+    "depths": [
+      3,
+      4,
+      23,
+      3
+    ],
+    "downsample_in_bottleneck": false,
+    "downsample_in_first_stage": false,
+    "embedding_size": 64,
+    "hidden_act": "relu",
+    "hidden_sizes": [
+      256,
+      512,
+      1024,
+      2048
+    ],
+    "layer_type": "bottleneck",
+    "model_type": "rt_detr_resnet",
+    "num_channels": 3,
+    "out_features": [
+      "stage2",
+      "stage3",
+      "stage4"
+    ],
+    "out_indices": [
+      2,
+      3,
+      4
+    ],
+    "stage_names": [
+      "stem",
+      "stage1",
+      "stage2",
+      "stage3",
+      "stage4"
+    ],
+    "torch_dtype": "float32"
+  },
+  "backbone_kwargs": null,
+  "batch_norm_eps": 1e-05,
+  "box_noise_scale": 1.0,
+  "d_model": 256,
+  "decoder_activation_function": "relu",
+  "decoder_attention_heads": 8,
+  "decoder_ffn_dim": 1024,
+  "decoder_in_channels": [
+    384,
+    384,
+    384
+  ],
+  "decoder_layers": 6,
+  "decoder_method": "default",
+  "decoder_n_levels": 3,
+  "decoder_n_points": 4,
+  "decoder_offset_scale": 0.5,
+  "disable_custom_kernels": true,
+  "dropout": 0.0,
+  "encode_proj_layers": [
+    2
+  ],
+  "encoder_activation_function": "gelu",
+  "encoder_attention_heads": 8,
+  "encoder_ffn_dim": 2048,
+  "encoder_hidden_dim": 384,
+  "encoder_in_channels": [
+    512,
+    1024,
+    2048
+  ],
+  "encoder_layers": 1,
+  "eos_coefficient": 0.0001,
+  "eval_size": null,
+  "feat_strides": [
+    8,
+    16,
+    32
+  ],
+  "focal_loss_alpha": 0.75,
+  "focal_loss_gamma": 2.0,
+  "freeze_backbone_batch_norms": true,
+  "hidden_expansion": 1.0,
+  "id2label": {
+    "0": "LABEL_0",
+    "1": "LABEL_1",
+    "2": "LABEL_2"
+  },
+  "initializer_bias_prior_prob": null,
+  "initializer_range": 0.01,
+  "is_encoder_decoder": true,
+  "label2id": {
+    "LABEL_0": 0,
+    "LABEL_1": 1,
+    "LABEL_2": 2
+  },
+  "label_noise_ratio": 0.5,
+  "layer_norm_eps": 1e-05,
+  "learn_initial_query": false,
+  "matcher_alpha": 0.25,
+  "matcher_bbox_cost": 5.0,
+  "matcher_class_cost": 2.0,
+  "matcher_gamma": 2.0,
+  "matcher_giou_cost": 2.0,
+  "model_type": "rt_detr_v2",
+  "normalize_before": false,
+  "num_denoising": 100,
+  "num_feature_levels": 3,
+  "num_queries": 300,
+  "positional_encoding_temperature": 10000,
+  "torch_dtype": "float32",
+  "transformers_version": "4.55.2",
+  "use_focal_loss": true,
+  "use_pretrained_backbone": false,
+  "use_timm_backbone": false,
+  "weight_loss_bbox": 5.0,
+  "weight_loss_giou": 2.0,
+  "weight_loss_vfl": 1.0,
+  "with_box_refine": true
+}

checkpoint-3520/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b2657b101f238e879c5f5c203f9376a3578df04ea7474324a53b19093b806f48
+size 306699044

checkpoint-3520/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:433457ca3308317df40d36d8b025ac71ae26460ca55e09f798a6958e52f2893e
+size 611580898

checkpoint-3520/preprocessor_config.json ADDED Viewed

	@@ -0,0 +1,26 @@

+{
+  "do_convert_annotations": true,
+  "do_normalize": false,
+  "do_pad": false,
+  "do_rescale": true,
+  "do_resize": true,
+  "format": "coco_detection",
+  "image_mean": [
+    0.485,
+    0.456,
+    0.406
+  ],
+  "image_processor_type": "RTDetrImageProcessor",
+  "image_std": [
+    0.229,
+    0.224,
+    0.225
+  ],
+  "pad_size": null,
+  "resample": 2,
+  "rescale_factor": 0.00392156862745098,
+  "size": {
+    "height": 640,
+    "width": 640
+  }
+}

checkpoint-3520/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:26d8dbc68d586ebc03d440b6f91bc263da03830b540faac657b2b67604441fdb
+size 14645

checkpoint-3520/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:36b280336c7f89ab668467fe9fe6ee1aa85c169847bd40455524a9bf18eea5dc
+size 1465

checkpoint-3520/trainer_state.json ADDED Viewed

	@@ -0,0 +1,482 @@

+{
+  "best_global_step": null,
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 45.714285714285715,
+  "eval_steps": 500,
+  "global_step": 3520,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.7142857142857143,
+      "grad_norm": 4405.81884765625,
+      "learning_rate": 3.436363636363636e-07,
+      "loss": 1357.5645,
+      "step": 55
+    },
+    {
+      "epoch": 1.4285714285714286,
+      "grad_norm": 5894.37841796875,
+      "learning_rate": 6.936363636363637e-07,
+      "loss": 1290.9688,
+      "step": 110
+    },
+    {
+      "epoch": 2.142857142857143,
+      "grad_norm": 3667.852294921875,
+      "learning_rate": 1.0436363636363635e-06,
+      "loss": 1140.9515,
+      "step": 165
+    },
+    {
+      "epoch": 2.857142857142857,
+      "grad_norm": 3578.294677734375,
+      "learning_rate": 1.3936363636363637e-06,
+      "loss": 942.618,
+      "step": 220
+    },
+    {
+      "epoch": 3.571428571428571,
+      "grad_norm": 2097.637939453125,
+      "learning_rate": 1.7436363636363636e-06,
+      "loss": 721.2856,
+      "step": 275
+    },
+    {
+      "epoch": 4.285714285714286,
+      "grad_norm": 1840.612548828125,
+      "learning_rate": 2.0936363636363636e-06,
+      "loss": 525.8542,
+      "step": 330
+    },
+    {
+      "epoch": 5.0,
+      "grad_norm": 1230.875,
+      "learning_rate": 2.4436363636363636e-06,
+      "loss": 397.7722,
+      "step": 385
+    },
+    {
+      "epoch": 5.714285714285714,
+      "grad_norm": 1280.699951171875,
+      "learning_rate": 2.7936363636363637e-06,
+      "loss": 313.8322,
+      "step": 440
+    },
+    {
+      "epoch": 6.428571428571429,
+      "grad_norm": 4265.28759765625,
+      "learning_rate": 3.1436363636363637e-06,
+      "loss": 254.1449,
+      "step": 495
+    },
+    {
+      "epoch": 7.142857142857143,
+      "grad_norm": 967.1757202148438,
+      "learning_rate": 3.4936363636363633e-06,
+      "loss": 218.4529,
+      "step": 550
+    },
+    {
+      "epoch": 7.857142857142857,
+      "grad_norm": 765.2302856445312,
+      "learning_rate": 3.843636363636364e-06,
+      "loss": 197.915,
+      "step": 605
+    },
+    {
+      "epoch": 8.571428571428571,
+      "grad_norm": 700.331787109375,
+      "learning_rate": 4.193636363636364e-06,
+      "loss": 170.9019,
+      "step": 660
+    },
+    {
+      "epoch": 9.285714285714286,
+      "grad_norm": 613.8758544921875,
+      "learning_rate": 4.543636363636363e-06,
+      "loss": 154.6195,
+      "step": 715
+    },
+    {
+      "epoch": 10.0,
+      "grad_norm": 3405.25732421875,
+      "learning_rate": 4.893636363636364e-06,
+      "loss": 136.8394,
+      "step": 770
+    },
+    {
+      "epoch": 10.714285714285714,
+      "grad_norm": 1219.8994140625,
+      "learning_rate": 5.243636363636364e-06,
+      "loss": 116.0246,
+      "step": 825
+    },
+    {
+      "epoch": 11.428571428571429,
+      "grad_norm": 306.2723083496094,
+      "learning_rate": 5.593636363636363e-06,
+      "loss": 104.2055,
+      "step": 880
+    },
+    {
+      "epoch": 12.142857142857142,
+      "grad_norm": 288.2547302246094,
+      "learning_rate": 5.943636363636364e-06,
+      "loss": 88.9812,
+      "step": 935
+    },
+    {
+      "epoch": 12.857142857142858,
+      "grad_norm": 1016.5924682617188,
+      "learning_rate": 6.293636363636363e-06,
+      "loss": 79.9017,
+      "step": 990
+    },
+    {
+      "epoch": 13.571428571428571,
+      "grad_norm": 239.49191284179688,
+      "learning_rate": 6.643636363636363e-06,
+      "loss": 73.6932,
+      "step": 1045
+    },
+    {
+      "epoch": 14.285714285714286,
+      "grad_norm": 193.92002868652344,
+      "learning_rate": 6.993636363636364e-06,
+      "loss": 62.2018,
+      "step": 1100
+    },
+    {
+      "epoch": 15.0,
+      "grad_norm": 179.0568084716797,
+      "learning_rate": 7.343636363636363e-06,
+      "loss": 54.0213,
+      "step": 1155
+    },
+    {
+      "epoch": 15.714285714285714,
+      "grad_norm": 166.02944946289062,
+      "learning_rate": 7.693636363636364e-06,
+      "loss": 48.1955,
+      "step": 1210
+    },
+    {
+      "epoch": 16.428571428571427,
+      "grad_norm": 126.53916931152344,
+      "learning_rate": 8.043636363636364e-06,
+      "loss": 43.5431,
+      "step": 1265
+    },
+    {
+      "epoch": 17.142857142857142,
+      "grad_norm": 145.61166381835938,
+      "learning_rate": 8.393636363636363e-06,
+      "loss": 41.4399,
+      "step": 1320
+    },
+    {
+      "epoch": 17.857142857142858,
+      "grad_norm": 122.2297134399414,
+      "learning_rate": 8.743636363636363e-06,
+      "loss": 35.2278,
+      "step": 1375
+    },
+    {
+      "epoch": 18.571428571428573,
+      "grad_norm": 117.88919067382812,
+      "learning_rate": 9.093636363636363e-06,
+      "loss": 31.2827,
+      "step": 1430
+    },
+    {
+      "epoch": 19.285714285714285,
+      "grad_norm": 88.52986907958984,
+      "learning_rate": 9.443636363636364e-06,
+      "loss": 28.8076,
+      "step": 1485
+    },
+    {
+      "epoch": 20.0,
+      "grad_norm": 88.49090576171875,
+      "learning_rate": 9.793636363636364e-06,
+      "loss": 28.232,
+      "step": 1540
+    },
+    {
+      "epoch": 20.714285714285715,
+      "grad_norm": 114.45001983642578,
+      "learning_rate": 1.0143636363636363e-05,
+      "loss": 26.0885,
+      "step": 1595
+    },
+    {
+      "epoch": 21.428571428571427,
+      "grad_norm": 74.16987609863281,
+      "learning_rate": 1.0493636363636363e-05,
+      "loss": 24.2689,
+      "step": 1650
+    },
+    {
+      "epoch": 22.142857142857142,
+      "grad_norm": 82.25133514404297,
+      "learning_rate": 1.0843636363636363e-05,
+      "loss": 22.6963,
+      "step": 1705
+    },
+    {
+      "epoch": 22.857142857142858,
+      "grad_norm": 74.76679229736328,
+      "learning_rate": 1.1193636363636363e-05,
+      "loss": 21.3257,
+      "step": 1760
+    },
+    {
+      "epoch": 23.571428571428573,
+      "grad_norm": 68.91163635253906,
+      "learning_rate": 1.1543636363636365e-05,
+      "loss": 20.2199,
+      "step": 1815
+    },
+    {
+      "epoch": 24.285714285714285,
+      "grad_norm": 59.86214828491211,
+      "learning_rate": 1.1893636363636363e-05,
+      "loss": 19.3769,
+      "step": 1870
+    },
+    {
+      "epoch": 25.0,
+      "grad_norm": 76.9339370727539,
+      "learning_rate": 1.2243636363636363e-05,
+      "loss": 18.0471,
+      "step": 1925
+    },
+    {
+      "epoch": 25.714285714285715,
+      "grad_norm": 66.16152954101562,
+      "learning_rate": 1.2593636363636363e-05,
+      "loss": 17.496,
+      "step": 1980
+    },
+    {
+      "epoch": 26.428571428571427,
+      "grad_norm": 58.77778244018555,
+      "learning_rate": 1.2943636363636363e-05,
+      "loss": 16.9468,
+      "step": 2035
+    },
+    {
+      "epoch": 27.142857142857142,
+      "grad_norm": 71.95783233642578,
+      "learning_rate": 1.3293636363636363e-05,
+      "loss": 16.3026,
+      "step": 2090
+    },
+    {
+      "epoch": 27.857142857142858,
+      "grad_norm": 131.7191619873047,
+      "learning_rate": 1.3643636363636363e-05,
+      "loss": 16.008,
+      "step": 2145
+    },
+    {
+      "epoch": 28.571428571428573,
+      "grad_norm": 81.78388977050781,
+      "learning_rate": 1.3993636363636363e-05,
+      "loss": 15.4616,
+      "step": 2200
+    },
+    {
+      "epoch": 29.285714285714285,
+      "grad_norm": 60.10112380981445,
+      "learning_rate": 1.3628501228501228e-05,
+      "loss": 15.195,
+      "step": 2255
+    },
+    {
+      "epoch": 30.0,
+      "grad_norm": 77.59001922607422,
+      "learning_rate": 1.325012285012285e-05,
+      "loss": 14.7557,
+      "step": 2310
+    },
+    {
+      "epoch": 30.714285714285715,
+      "grad_norm": 77.3856201171875,
+      "learning_rate": 1.287174447174447e-05,
+      "loss": 14.2851,
+      "step": 2365
+    },
+    {
+      "epoch": 31.428571428571427,
+      "grad_norm": 73.75492095947266,
+      "learning_rate": 1.2493366093366094e-05,
+      "loss": 13.867,
+      "step": 2420
+    },
+    {
+      "epoch": 32.142857142857146,
+      "grad_norm": 78.76831817626953,
+      "learning_rate": 1.2114987714987713e-05,
+      "loss": 13.6677,
+      "step": 2475
+    },
+    {
+      "epoch": 32.857142857142854,
+      "grad_norm": 92.99346160888672,
+      "learning_rate": 1.1736609336609336e-05,
+      "loss": 13.1851,
+      "step": 2530
+    },
+    {
+      "epoch": 33.57142857142857,
+      "grad_norm": 97.57978820800781,
+      "learning_rate": 1.1358230958230958e-05,
+      "loss": 13.5215,
+      "step": 2585
+    },
+    {
+      "epoch": 34.285714285714285,
+      "grad_norm": 63.118141174316406,
+      "learning_rate": 1.0979852579852579e-05,
+      "loss": 12.8525,
+      "step": 2640
+    },
+    {
+      "epoch": 35.0,
+      "grad_norm": 63.68766403198242,
+      "learning_rate": 1.06014742014742e-05,
+      "loss": 12.441,
+      "step": 2695
+    },
+    {
+      "epoch": 35.714285714285715,
+      "grad_norm": 70.33533477783203,
+      "learning_rate": 1.0223095823095823e-05,
+      "loss": 12.2331,
+      "step": 2750
+    },
+    {
+      "epoch": 36.42857142857143,
+      "grad_norm": 64.16197967529297,
+      "learning_rate": 9.844717444717445e-06,
+      "loss": 11.7547,
+      "step": 2805
+    },
+    {
+      "epoch": 37.142857142857146,
+      "grad_norm": 85.83612823486328,
+      "learning_rate": 9.466339066339066e-06,
+      "loss": 11.8633,
+      "step": 2860
+    },
+    {
+      "epoch": 37.857142857142854,
+      "grad_norm": 89.40387725830078,
+      "learning_rate": 9.087960687960689e-06,
+      "loss": 11.5795,
+      "step": 2915
+    },
+    {
+      "epoch": 38.57142857142857,
+      "grad_norm": 76.38651275634766,
+      "learning_rate": 8.709582309582309e-06,
+      "loss": 11.334,
+      "step": 2970
+    },
+    {
+      "epoch": 39.285714285714285,
+      "grad_norm": 110.11483764648438,
+      "learning_rate": 8.331203931203932e-06,
+      "loss": 10.805,
+      "step": 3025
+    },
+    {
+      "epoch": 40.0,
+      "grad_norm": 60.31315612792969,
+      "learning_rate": 7.952825552825553e-06,
+      "loss": 10.9056,
+      "step": 3080
+    },
+    {
+      "epoch": 40.714285714285715,
+      "grad_norm": 107.96589660644531,
+      "learning_rate": 7.574447174447175e-06,
+      "loss": 10.5828,
+      "step": 3135
+    },
+    {
+      "epoch": 41.42857142857143,
+      "grad_norm": 74.8004379272461,
+      "learning_rate": 7.1960687960687955e-06,
+      "loss": 10.2818,
+      "step": 3190
+    },
+    {
+      "epoch": 42.142857142857146,
+      "grad_norm": 54.093475341796875,
+      "learning_rate": 6.817690417690418e-06,
+      "loss": 10.0785,
+      "step": 3245
+    },
+    {
+      "epoch": 42.857142857142854,
+      "grad_norm": 115.28564453125,
+      "learning_rate": 6.439312039312039e-06,
+      "loss": 9.8794,
+      "step": 3300
+    },
+    {
+      "epoch": 43.57142857142857,
+      "grad_norm": 52.57551956176758,
+      "learning_rate": 6.06093366093366e-06,
+      "loss": 9.7072,
+      "step": 3355
+    },
+    {
+      "epoch": 44.285714285714285,
+      "grad_norm": 51.994075775146484,
+      "learning_rate": 5.682555282555282e-06,
+      "loss": 9.6015,
+      "step": 3410
+    },
+    {
+      "epoch": 45.0,
+      "grad_norm": 73.08104705810547,
+      "learning_rate": 5.304176904176904e-06,
+      "loss": 9.305,
+      "step": 3465
+    },
+    {
+      "epoch": 45.714285714285715,
+      "grad_norm": 75.5807876586914,
+      "learning_rate": 4.925798525798525e-06,
+      "loss": 9.2281,
+      "step": 3520
+    }
+  ],
+  "logging_steps": 55,
+  "max_steps": 4235,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 55,
+  "save_steps": 220,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 5.541350580943258e+19,
+  "train_batch_size": 28,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-3520/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:99e55f6c266fb80fff7a194cd0925963d93d119d60f4443cb609bfd824b16fd5
+size 5841

checkpoint-3740/config.json ADDED Viewed

	@@ -0,0 +1,129 @@

+{
+  "activation_dropout": 0.0,
+  "activation_function": "silu",
+  "anchor_image_size": null,
+  "architectures": [
+    "RTDetrV2ForObjectDetection"
+  ],
+  "attention_dropout": 0.0,
+  "auxiliary_loss": true,
+  "backbone": null,
+  "backbone_config": {
+    "depths": [
+      3,
+      4,
+      23,
+      3
+    ],
+    "downsample_in_bottleneck": false,
+    "downsample_in_first_stage": false,
+    "embedding_size": 64,
+    "hidden_act": "relu",
+    "hidden_sizes": [
+      256,
+      512,
+      1024,
+      2048
+    ],
+    "layer_type": "bottleneck",
+    "model_type": "rt_detr_resnet",
+    "num_channels": 3,
+    "out_features": [
+      "stage2",
+      "stage3",
+      "stage4"
+    ],
+    "out_indices": [
+      2,
+      3,
+      4
+    ],
+    "stage_names": [
+      "stem",
+      "stage1",
+      "stage2",
+      "stage3",
+      "stage4"
+    ],
+    "torch_dtype": "float32"
+  },
+  "backbone_kwargs": null,
+  "batch_norm_eps": 1e-05,
+  "box_noise_scale": 1.0,
+  "d_model": 256,
+  "decoder_activation_function": "relu",
+  "decoder_attention_heads": 8,
+  "decoder_ffn_dim": 1024,
+  "decoder_in_channels": [
+    384,
+    384,
+    384
+  ],
+  "decoder_layers": 6,
+  "decoder_method": "default",
+  "decoder_n_levels": 3,
+  "decoder_n_points": 4,
+  "decoder_offset_scale": 0.5,
+  "disable_custom_kernels": true,
+  "dropout": 0.0,
+  "encode_proj_layers": [
+    2
+  ],
+  "encoder_activation_function": "gelu",
+  "encoder_attention_heads": 8,
+  "encoder_ffn_dim": 2048,
+  "encoder_hidden_dim": 384,
+  "encoder_in_channels": [
+    512,
+    1024,
+    2048
+  ],
+  "encoder_layers": 1,
+  "eos_coefficient": 0.0001,
+  "eval_size": null,
+  "feat_strides": [
+    8,
+    16,
+    32
+  ],
+  "focal_loss_alpha": 0.75,
+  "focal_loss_gamma": 2.0,
+  "freeze_backbone_batch_norms": true,
+  "hidden_expansion": 1.0,
+  "id2label": {
+    "0": "LABEL_0",
+    "1": "LABEL_1",
+    "2": "LABEL_2"
+  },
+  "initializer_bias_prior_prob": null,
+  "initializer_range": 0.01,
+  "is_encoder_decoder": true,
+  "label2id": {
+    "LABEL_0": 0,
+    "LABEL_1": 1,
+    "LABEL_2": 2
+  },
+  "label_noise_ratio": 0.5,
+  "layer_norm_eps": 1e-05,
+  "learn_initial_query": false,
+  "matcher_alpha": 0.25,
+  "matcher_bbox_cost": 5.0,
+  "matcher_class_cost": 2.0,
+  "matcher_gamma": 2.0,
+  "matcher_giou_cost": 2.0,
+  "model_type": "rt_detr_v2",
+  "normalize_before": false,
+  "num_denoising": 100,
+  "num_feature_levels": 3,
+  "num_queries": 300,
+  "positional_encoding_temperature": 10000,
+  "torch_dtype": "float32",
+  "transformers_version": "4.55.2",
+  "use_focal_loss": true,
+  "use_pretrained_backbone": false,
+  "use_timm_backbone": false,
+  "weight_loss_bbox": 5.0,
+  "weight_loss_giou": 2.0,
+  "weight_loss_vfl": 1.0,
+  "with_box_refine": true
+}

checkpoint-3740/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4a2115dbeecbf83273dba36b4193b8f3570757801340eaeb7c866bfbffb09037
+size 306699044

checkpoint-3740/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9f365a587dc2edb4b370686f19f37461e6aafc04d8a63d69d08c1fac32defe3f
+size 611580898

checkpoint-3740/preprocessor_config.json ADDED Viewed

	@@ -0,0 +1,26 @@

+{
+  "do_convert_annotations": true,
+  "do_normalize": false,
+  "do_pad": false,
+  "do_rescale": true,
+  "do_resize": true,
+  "format": "coco_detection",
+  "image_mean": [
+    0.485,
+    0.456,
+    0.406
+  ],
+  "image_processor_type": "RTDetrImageProcessor",
+  "image_std": [
+    0.229,
+    0.224,
+    0.225
+  ],
+  "pad_size": null,
+  "resample": 2,
+  "rescale_factor": 0.00392156862745098,
+  "size": {
+    "height": 640,
+    "width": 640
+  }
+}

checkpoint-3740/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b6316449de2d4e20c95cd8aa4a3ea3cbf53eb2fa90c64079ff35a7c512a4b676
+size 14645

checkpoint-3740/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6406f311d941e8c7c17e04f9170710735679be7f5cfce6463778674b141d08ce
+size 1465

checkpoint-3740/trainer_state.json ADDED Viewed

	@@ -0,0 +1,510 @@

+{
+  "best_global_step": null,
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 48.57142857142857,
+  "eval_steps": 500,
+  "global_step": 3740,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.7142857142857143,
+      "grad_norm": 4405.81884765625,
+      "learning_rate": 3.436363636363636e-07,
+      "loss": 1357.5645,
+      "step": 55
+    },
+    {
+      "epoch": 1.4285714285714286,
+      "grad_norm": 5894.37841796875,
+      "learning_rate": 6.936363636363637e-07,
+      "loss": 1290.9688,
+      "step": 110
+    },
+    {
+      "epoch": 2.142857142857143,
+      "grad_norm": 3667.852294921875,
+      "learning_rate": 1.0436363636363635e-06,
+      "loss": 1140.9515,
+      "step": 165
+    },
+    {
+      "epoch": 2.857142857142857,
+      "grad_norm": 3578.294677734375,
+      "learning_rate": 1.3936363636363637e-06,
+      "loss": 942.618,
+      "step": 220
+    },
+    {
+      "epoch": 3.571428571428571,
+      "grad_norm": 2097.637939453125,
+      "learning_rate": 1.7436363636363636e-06,
+      "loss": 721.2856,
+      "step": 275
+    },
+    {
+      "epoch": 4.285714285714286,
+      "grad_norm": 1840.612548828125,
+      "learning_rate": 2.0936363636363636e-06,
+      "loss": 525.8542,
+      "step": 330
+    },
+    {
+      "epoch": 5.0,
+      "grad_norm": 1230.875,
+      "learning_rate": 2.4436363636363636e-06,
+      "loss": 397.7722,
+      "step": 385
+    },
+    {
+      "epoch": 5.714285714285714,
+      "grad_norm": 1280.699951171875,
+      "learning_rate": 2.7936363636363637e-06,
+      "loss": 313.8322,
+      "step": 440
+    },
+    {
+      "epoch": 6.428571428571429,
+      "grad_norm": 4265.28759765625,
+      "learning_rate": 3.1436363636363637e-06,
+      "loss": 254.1449,
+      "step": 495
+    },
+    {
+      "epoch": 7.142857142857143,
+      "grad_norm": 967.1757202148438,
+      "learning_rate": 3.4936363636363633e-06,
+      "loss": 218.4529,
+      "step": 550
+    },
+    {
+      "epoch": 7.857142857142857,
+      "grad_norm": 765.2302856445312,
+      "learning_rate": 3.843636363636364e-06,
+      "loss": 197.915,
+      "step": 605
+    },
+    {
+      "epoch": 8.571428571428571,
+      "grad_norm": 700.331787109375,
+      "learning_rate": 4.193636363636364e-06,
+      "loss": 170.9019,
+      "step": 660
+    },
+    {
+      "epoch": 9.285714285714286,
+      "grad_norm": 613.8758544921875,
+      "learning_rate": 4.543636363636363e-06,
+      "loss": 154.6195,
+      "step": 715
+    },
+    {
+      "epoch": 10.0,
+      "grad_norm": 3405.25732421875,
+      "learning_rate": 4.893636363636364e-06,
+      "loss": 136.8394,
+      "step": 770
+    },
+    {
+      "epoch": 10.714285714285714,
+      "grad_norm": 1219.8994140625,
+      "learning_rate": 5.243636363636364e-06,
+      "loss": 116.0246,
+      "step": 825
+    },
+    {
+      "epoch": 11.428571428571429,
+      "grad_norm": 306.2723083496094,
+      "learning_rate": 5.593636363636363e-06,
+      "loss": 104.2055,
+      "step": 880
+    },
+    {
+      "epoch": 12.142857142857142,
+      "grad_norm": 288.2547302246094,
+      "learning_rate": 5.943636363636364e-06,
+      "loss": 88.9812,
+      "step": 935
+    },
+    {
+      "epoch": 12.857142857142858,
+      "grad_norm": 1016.5924682617188,
+      "learning_rate": 6.293636363636363e-06,
+      "loss": 79.9017,
+      "step": 990
+    },
+    {
+      "epoch": 13.571428571428571,
+      "grad_norm": 239.49191284179688,
+      "learning_rate": 6.643636363636363e-06,
+      "loss": 73.6932,
+      "step": 1045
+    },
+    {
+      "epoch": 14.285714285714286,
+      "grad_norm": 193.92002868652344,
+      "learning_rate": 6.993636363636364e-06,
+      "loss": 62.2018,
+      "step": 1100
+    },
+    {
+      "epoch": 15.0,
+      "grad_norm": 179.0568084716797,
+      "learning_rate": 7.343636363636363e-06,
+      "loss": 54.0213,
+      "step": 1155
+    },
+    {
+      "epoch": 15.714285714285714,
+      "grad_norm": 166.02944946289062,
+      "learning_rate": 7.693636363636364e-06,
+      "loss": 48.1955,
+      "step": 1210
+    },
+    {
+      "epoch": 16.428571428571427,
+      "grad_norm": 126.53916931152344,
+      "learning_rate": 8.043636363636364e-06,
+      "loss": 43.5431,
+      "step": 1265
+    },
+    {
+      "epoch": 17.142857142857142,
+      "grad_norm": 145.61166381835938,
+      "learning_rate": 8.393636363636363e-06,
+      "loss": 41.4399,
+      "step": 1320
+    },
+    {
+      "epoch": 17.857142857142858,
+      "grad_norm": 122.2297134399414,
+      "learning_rate": 8.743636363636363e-06,
+      "loss": 35.2278,
+      "step": 1375
+    },
+    {
+      "epoch": 18.571428571428573,
+      "grad_norm": 117.88919067382812,
+      "learning_rate": 9.093636363636363e-06,
+      "loss": 31.2827,
+      "step": 1430
+    },
+    {
+      "epoch": 19.285714285714285,
+      "grad_norm": 88.52986907958984,
+      "learning_rate": 9.443636363636364e-06,
+      "loss": 28.8076,
+      "step": 1485
+    },
+    {
+      "epoch": 20.0,
+      "grad_norm": 88.49090576171875,
+      "learning_rate": 9.793636363636364e-06,
+      "loss": 28.232,
+      "step": 1540
+    },
+    {
+      "epoch": 20.714285714285715,
+      "grad_norm": 114.45001983642578,
+      "learning_rate": 1.0143636363636363e-05,
+      "loss": 26.0885,
+      "step": 1595
+    },
+    {
+      "epoch": 21.428571428571427,
+      "grad_norm": 74.16987609863281,
+      "learning_rate": 1.0493636363636363e-05,
+      "loss": 24.2689,
+      "step": 1650
+    },
+    {
+      "epoch": 22.142857142857142,
+      "grad_norm": 82.25133514404297,
+      "learning_rate": 1.0843636363636363e-05,
+      "loss": 22.6963,
+      "step": 1705
+    },
+    {
+      "epoch": 22.857142857142858,
+      "grad_norm": 74.76679229736328,
+      "learning_rate": 1.1193636363636363e-05,
+      "loss": 21.3257,
+      "step": 1760
+    },
+    {
+      "epoch": 23.571428571428573,
+      "grad_norm": 68.91163635253906,
+      "learning_rate": 1.1543636363636365e-05,
+      "loss": 20.2199,
+      "step": 1815
+    },
+    {
+      "epoch": 24.285714285714285,
+      "grad_norm": 59.86214828491211,
+      "learning_rate": 1.1893636363636363e-05,
+      "loss": 19.3769,
+      "step": 1870
+    },
+    {
+      "epoch": 25.0,
+      "grad_norm": 76.9339370727539,
+      "learning_rate": 1.2243636363636363e-05,
+      "loss": 18.0471,
+      "step": 1925
+    },
+    {
+      "epoch": 25.714285714285715,
+      "grad_norm": 66.16152954101562,
+      "learning_rate": 1.2593636363636363e-05,
+      "loss": 17.496,
+      "step": 1980
+    },
+    {
+      "epoch": 26.428571428571427,
+      "grad_norm": 58.77778244018555,
+      "learning_rate": 1.2943636363636363e-05,
+      "loss": 16.9468,
+      "step": 2035
+    },
+    {
+      "epoch": 27.142857142857142,
+      "grad_norm": 71.95783233642578,
+      "learning_rate": 1.3293636363636363e-05,
+      "loss": 16.3026,
+      "step": 2090
+    },
+    {
+      "epoch": 27.857142857142858,
+      "grad_norm": 131.7191619873047,
+      "learning_rate": 1.3643636363636363e-05,
+      "loss": 16.008,
+      "step": 2145
+    },
+    {
+      "epoch": 28.571428571428573,
+      "grad_norm": 81.78388977050781,
+      "learning_rate": 1.3993636363636363e-05,
+      "loss": 15.4616,
+      "step": 2200
+    },
+    {
+      "epoch": 29.285714285714285,
+      "grad_norm": 60.10112380981445,
+      "learning_rate": 1.3628501228501228e-05,
+      "loss": 15.195,
+      "step": 2255
+    },
+    {
+      "epoch": 30.0,
+      "grad_norm": 77.59001922607422,
+      "learning_rate": 1.325012285012285e-05,
+      "loss": 14.7557,
+      "step": 2310
+    },
+    {
+      "epoch": 30.714285714285715,
+      "grad_norm": 77.3856201171875,
+      "learning_rate": 1.287174447174447e-05,
+      "loss": 14.2851,
+      "step": 2365
+    },
+    {
+      "epoch": 31.428571428571427,
+      "grad_norm": 73.75492095947266,
+      "learning_rate": 1.2493366093366094e-05,
+      "loss": 13.867,
+      "step": 2420
+    },
+    {
+      "epoch": 32.142857142857146,
+      "grad_norm": 78.76831817626953,
+      "learning_rate": 1.2114987714987713e-05,
+      "loss": 13.6677,
+      "step": 2475
+    },
+    {
+      "epoch": 32.857142857142854,
+      "grad_norm": 92.99346160888672,
+      "learning_rate": 1.1736609336609336e-05,
+      "loss": 13.1851,
+      "step": 2530
+    },
+    {
+      "epoch": 33.57142857142857,
+      "grad_norm": 97.57978820800781,
+      "learning_rate": 1.1358230958230958e-05,
+      "loss": 13.5215,
+      "step": 2585
+    },
+    {
+      "epoch": 34.285714285714285,
+      "grad_norm": 63.118141174316406,
+      "learning_rate": 1.0979852579852579e-05,
+      "loss": 12.8525,
+      "step": 2640
+    },
+    {
+      "epoch": 35.0,
+      "grad_norm": 63.68766403198242,
+      "learning_rate": 1.06014742014742e-05,
+      "loss": 12.441,
+      "step": 2695
+    },
+    {
+      "epoch": 35.714285714285715,
+      "grad_norm": 70.33533477783203,
+      "learning_rate": 1.0223095823095823e-05,
+      "loss": 12.2331,
+      "step": 2750
+    },
+    {
+      "epoch": 36.42857142857143,
+      "grad_norm": 64.16197967529297,
+      "learning_rate": 9.844717444717445e-06,
+      "loss": 11.7547,
+      "step": 2805
+    },
+    {
+      "epoch": 37.142857142857146,
+      "grad_norm": 85.83612823486328,
+      "learning_rate": 9.466339066339066e-06,
+      "loss": 11.8633,
+      "step": 2860
+    },
+    {
+      "epoch": 37.857142857142854,
+      "grad_norm": 89.40387725830078,
+      "learning_rate": 9.087960687960689e-06,
+      "loss": 11.5795,
+      "step": 2915
+    },
+    {
+      "epoch": 38.57142857142857,
+      "grad_norm": 76.38651275634766,
+      "learning_rate": 8.709582309582309e-06,
+      "loss": 11.334,
+      "step": 2970
+    },
+    {
+      "epoch": 39.285714285714285,
+      "grad_norm": 110.11483764648438,
+      "learning_rate": 8.331203931203932e-06,
+      "loss": 10.805,
+      "step": 3025
+    },
+    {
+      "epoch": 40.0,
+      "grad_norm": 60.31315612792969,
+      "learning_rate": 7.952825552825553e-06,
+      "loss": 10.9056,
+      "step": 3080
+    },
+    {
+      "epoch": 40.714285714285715,
+      "grad_norm": 107.96589660644531,
+      "learning_rate": 7.574447174447175e-06,
+      "loss": 10.5828,
+      "step": 3135
+    },
+    {
+      "epoch": 41.42857142857143,
+      "grad_norm": 74.8004379272461,
+      "learning_rate": 7.1960687960687955e-06,
+      "loss": 10.2818,
+      "step": 3190
+    },
+    {
+      "epoch": 42.142857142857146,
+      "grad_norm": 54.093475341796875,
+      "learning_rate": 6.817690417690418e-06,
+      "loss": 10.0785,
+      "step": 3245
+    },
+    {
+      "epoch": 42.857142857142854,
+      "grad_norm": 115.28564453125,
+      "learning_rate": 6.439312039312039e-06,
+      "loss": 9.8794,
+      "step": 3300
+    },
+    {
+      "epoch": 43.57142857142857,
+      "grad_norm": 52.57551956176758,
+      "learning_rate": 6.06093366093366e-06,
+      "loss": 9.7072,
+      "step": 3355
+    },
+    {
+      "epoch": 44.285714285714285,
+      "grad_norm": 51.994075775146484,
+      "learning_rate": 5.682555282555282e-06,
+      "loss": 9.6015,
+      "step": 3410
+    },
+    {
+      "epoch": 45.0,
+      "grad_norm": 73.08104705810547,
+      "learning_rate": 5.304176904176904e-06,
+      "loss": 9.305,
+      "step": 3465
+    },
+    {
+      "epoch": 45.714285714285715,
+      "grad_norm": 75.5807876586914,
+      "learning_rate": 4.925798525798525e-06,
+      "loss": 9.2281,
+      "step": 3520
+    },
+    {
+      "epoch": 46.42857142857143,
+      "grad_norm": 53.319637298583984,
+      "learning_rate": 4.547420147420147e-06,
+      "loss": 8.996,
+      "step": 3575
+    },
+    {
+      "epoch": 47.142857142857146,
+      "grad_norm": 72.28289794921875,
+      "learning_rate": 4.1690417690417685e-06,
+      "loss": 9.0072,
+      "step": 3630
+    },
+    {
+      "epoch": 47.857142857142854,
+      "grad_norm": 66.79710388183594,
+      "learning_rate": 3.7906633906633902e-06,
+      "loss": 8.7311,
+      "step": 3685
+    },
+    {
+      "epoch": 48.57142857142857,
+      "grad_norm": 83.55674743652344,
+      "learning_rate": 3.4122850122850124e-06,
+      "loss": 8.5959,
+      "step": 3740
+    }
+  ],
+  "logging_steps": 55,
+  "max_steps": 4235,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 55,
+  "save_steps": 220,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 5.8876427477621146e+19,
+  "train_batch_size": 28,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-3740/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:99e55f6c266fb80fff7a194cd0925963d93d119d60f4443cb609bfd824b16fd5
+size 5841

checkpoint-3960/config.json ADDED Viewed

	@@ -0,0 +1,129 @@

+{
+  "activation_dropout": 0.0,
+  "activation_function": "silu",
+  "anchor_image_size": null,
+  "architectures": [
+    "RTDetrV2ForObjectDetection"
+  ],
+  "attention_dropout": 0.0,
+  "auxiliary_loss": true,
+  "backbone": null,
+  "backbone_config": {
+    "depths": [
+      3,
+      4,
+      23,
+      3
+    ],
+    "downsample_in_bottleneck": false,
+    "downsample_in_first_stage": false,
+    "embedding_size": 64,
+    "hidden_act": "relu",
+    "hidden_sizes": [
+      256,
+      512,
+      1024,
+      2048
+    ],
+    "layer_type": "bottleneck",
+    "model_type": "rt_detr_resnet",
+    "num_channels": 3,
+    "out_features": [
+      "stage2",
+      "stage3",
+      "stage4"
+    ],
+    "out_indices": [
+      2,
+      3,
+      4
+    ],
+    "stage_names": [
+      "stem",
+      "stage1",
+      "stage2",
+      "stage3",
+      "stage4"
+    ],
+    "torch_dtype": "float32"
+  },
+  "backbone_kwargs": null,
+  "batch_norm_eps": 1e-05,
+  "box_noise_scale": 1.0,
+  "d_model": 256,
+  "decoder_activation_function": "relu",
+  "decoder_attention_heads": 8,
+  "decoder_ffn_dim": 1024,
+  "decoder_in_channels": [
+    384,
+    384,
+    384
+  ],
+  "decoder_layers": 6,
+  "decoder_method": "default",
+  "decoder_n_levels": 3,
+  "decoder_n_points": 4,
+  "decoder_offset_scale": 0.5,
+  "disable_custom_kernels": true,
+  "dropout": 0.0,
+  "encode_proj_layers": [
+    2
+  ],
+  "encoder_activation_function": "gelu",
+  "encoder_attention_heads": 8,
+  "encoder_ffn_dim": 2048,
+  "encoder_hidden_dim": 384,
+  "encoder_in_channels": [
+    512,
+    1024,
+    2048
+  ],
+  "encoder_layers": 1,
+  "eos_coefficient": 0.0001,
+  "eval_size": null,
+  "feat_strides": [
+    8,
+    16,
+    32
+  ],
+  "focal_loss_alpha": 0.75,
+  "focal_loss_gamma": 2.0,
+  "freeze_backbone_batch_norms": true,
+  "hidden_expansion": 1.0,
+  "id2label": {
+    "0": "LABEL_0",
+    "1": "LABEL_1",
+    "2": "LABEL_2"
+  },
+  "initializer_bias_prior_prob": null,
+  "initializer_range": 0.01,
+  "is_encoder_decoder": true,
+  "label2id": {
+    "LABEL_0": 0,
+    "LABEL_1": 1,
+    "LABEL_2": 2
+  },
+  "label_noise_ratio": 0.5,
+  "layer_norm_eps": 1e-05,
+  "learn_initial_query": false,
+  "matcher_alpha": 0.25,
+  "matcher_bbox_cost": 5.0,
+  "matcher_class_cost": 2.0,
+  "matcher_gamma": 2.0,
+  "matcher_giou_cost": 2.0,
+  "model_type": "rt_detr_v2",
+  "normalize_before": false,
+  "num_denoising": 100,
+  "num_feature_levels": 3,
+  "num_queries": 300,
+  "positional_encoding_temperature": 10000,
+  "torch_dtype": "float32",
+  "transformers_version": "4.55.2",
+  "use_focal_loss": true,
+  "use_pretrained_backbone": false,
+  "use_timm_backbone": false,
+  "weight_loss_bbox": 5.0,
+  "weight_loss_giou": 2.0,
+  "weight_loss_vfl": 1.0,
+  "with_box_refine": true
+}

checkpoint-3960/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a0da8aa9a9dbf156ff61271506250c72336d8a6bd77ebdb2f058032615c467db
+size 306699044

checkpoint-3960/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:627c9c79f2991c364b1cd821ca8ca24dca3b10481c0b54ce39491f788f5e4659
+size 611580898

checkpoint-3960/preprocessor_config.json ADDED Viewed

	@@ -0,0 +1,26 @@

+{
+  "do_convert_annotations": true,
+  "do_normalize": false,
+  "do_pad": false,
+  "do_rescale": true,
+  "do_resize": true,
+  "format": "coco_detection",
+  "image_mean": [
+    0.485,
+    0.456,
+    0.406
+  ],
+  "image_processor_type": "RTDetrImageProcessor",
+  "image_std": [
+    0.229,
+    0.224,
+    0.225
+  ],
+  "pad_size": null,
+  "resample": 2,
+  "rescale_factor": 0.00392156862745098,
+  "size": {
+    "height": 640,
+    "width": 640
+  }
+}

checkpoint-3960/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ff0ae4594f12a938934516f599b96c8fa1d052ac793f26e44ed839202dd42016
+size 14645

checkpoint-3960/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d866a08f2c164179018beb811aecb078e91850415968e1005b6ef3bd8128de66
+size 1465

checkpoint-3960/trainer_state.json ADDED Viewed

	@@ -0,0 +1,538 @@

+{
+  "best_global_step": null,
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 51.42857142857143,
+  "eval_steps": 500,
+  "global_step": 3960,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.7142857142857143,
+      "grad_norm": 4405.81884765625,
+      "learning_rate": 3.436363636363636e-07,
+      "loss": 1357.5645,
+      "step": 55
+    },
+    {
+      "epoch": 1.4285714285714286,
+      "grad_norm": 5894.37841796875,
+      "learning_rate": 6.936363636363637e-07,
+      "loss": 1290.9688,
+      "step": 110
+    },
+    {
+      "epoch": 2.142857142857143,
+      "grad_norm": 3667.852294921875,
+      "learning_rate": 1.0436363636363635e-06,
+      "loss": 1140.9515,
+      "step": 165
+    },
+    {
+      "epoch": 2.857142857142857,
+      "grad_norm": 3578.294677734375,
+      "learning_rate": 1.3936363636363637e-06,
+      "loss": 942.618,
+      "step": 220
+    },
+    {
+      "epoch": 3.571428571428571,
+      "grad_norm": 2097.637939453125,
+      "learning_rate": 1.7436363636363636e-06,
+      "loss": 721.2856,
+      "step": 275
+    },
+    {
+      "epoch": 4.285714285714286,
+      "grad_norm": 1840.612548828125,
+      "learning_rate": 2.0936363636363636e-06,
+      "loss": 525.8542,
+      "step": 330
+    },
+    {
+      "epoch": 5.0,
+      "grad_norm": 1230.875,
+      "learning_rate": 2.4436363636363636e-06,
+      "loss": 397.7722,
+      "step": 385
+    },
+    {
+      "epoch": 5.714285714285714,
+      "grad_norm": 1280.699951171875,
+      "learning_rate": 2.7936363636363637e-06,
+      "loss": 313.8322,
+      "step": 440
+    },
+    {
+      "epoch": 6.428571428571429,
+      "grad_norm": 4265.28759765625,
+      "learning_rate": 3.1436363636363637e-06,
+      "loss": 254.1449,
+      "step": 495
+    },
+    {
+      "epoch": 7.142857142857143,
+      "grad_norm": 967.1757202148438,
+      "learning_rate": 3.4936363636363633e-06,
+      "loss": 218.4529,
+      "step": 550
+    },
+    {
+      "epoch": 7.857142857142857,
+      "grad_norm": 765.2302856445312,
+      "learning_rate": 3.843636363636364e-06,
+      "loss": 197.915,
+      "step": 605
+    },
+    {
+      "epoch": 8.571428571428571,
+      "grad_norm": 700.331787109375,
+      "learning_rate": 4.193636363636364e-06,
+      "loss": 170.9019,
+      "step": 660
+    },
+    {
+      "epoch": 9.285714285714286,
+      "grad_norm": 613.8758544921875,
+      "learning_rate": 4.543636363636363e-06,
+      "loss": 154.6195,
+      "step": 715
+    },
+    {
+      "epoch": 10.0,
+      "grad_norm": 3405.25732421875,
+      "learning_rate": 4.893636363636364e-06,
+      "loss": 136.8394,
+      "step": 770
+    },
+    {
+      "epoch": 10.714285714285714,
+      "grad_norm": 1219.8994140625,
+      "learning_rate": 5.243636363636364e-06,
+      "loss": 116.0246,
+      "step": 825
+    },
+    {
+      "epoch": 11.428571428571429,
+      "grad_norm": 306.2723083496094,
+      "learning_rate": 5.593636363636363e-06,
+      "loss": 104.2055,
+      "step": 880
+    },
+    {
+      "epoch": 12.142857142857142,
+      "grad_norm": 288.2547302246094,
+      "learning_rate": 5.943636363636364e-06,
+      "loss": 88.9812,
+      "step": 935
+    },
+    {
+      "epoch": 12.857142857142858,
+      "grad_norm": 1016.5924682617188,
+      "learning_rate": 6.293636363636363e-06,
+      "loss": 79.9017,
+      "step": 990
+    },
+    {
+      "epoch": 13.571428571428571,
+      "grad_norm": 239.49191284179688,
+      "learning_rate": 6.643636363636363e-06,
+      "loss": 73.6932,
+      "step": 1045
+    },
+    {
+      "epoch": 14.285714285714286,
+      "grad_norm": 193.92002868652344,
+      "learning_rate": 6.993636363636364e-06,
+      "loss": 62.2018,
+      "step": 1100
+    },
+    {
+      "epoch": 15.0,
+      "grad_norm": 179.0568084716797,
+      "learning_rate": 7.343636363636363e-06,
+      "loss": 54.0213,
+      "step": 1155
+    },
+    {
+      "epoch": 15.714285714285714,
+      "grad_norm": 166.02944946289062,
+      "learning_rate": 7.693636363636364e-06,
+      "loss": 48.1955,
+      "step": 1210
+    },
+    {
+      "epoch": 16.428571428571427,
+      "grad_norm": 126.53916931152344,
+      "learning_rate": 8.043636363636364e-06,
+      "loss": 43.5431,
+      "step": 1265
+    },
+    {
+      "epoch": 17.142857142857142,
+      "grad_norm": 145.61166381835938,
+      "learning_rate": 8.393636363636363e-06,
+      "loss": 41.4399,
+      "step": 1320
+    },
+    {
+      "epoch": 17.857142857142858,
+      "grad_norm": 122.2297134399414,
+      "learning_rate": 8.743636363636363e-06,
+      "loss": 35.2278,
+      "step": 1375
+    },
+    {
+      "epoch": 18.571428571428573,
+      "grad_norm": 117.88919067382812,
+      "learning_rate": 9.093636363636363e-06,
+      "loss": 31.2827,
+      "step": 1430
+    },
+    {
+      "epoch": 19.285714285714285,
+      "grad_norm": 88.52986907958984,
+      "learning_rate": 9.443636363636364e-06,
+      "loss": 28.8076,
+      "step": 1485
+    },
+    {
+      "epoch": 20.0,
+      "grad_norm": 88.49090576171875,
+      "learning_rate": 9.793636363636364e-06,
+      "loss": 28.232,
+      "step": 1540
+    },
+    {
+      "epoch": 20.714285714285715,
+      "grad_norm": 114.45001983642578,
+      "learning_rate": 1.0143636363636363e-05,
+      "loss": 26.0885,
+      "step": 1595
+    },
+    {
+      "epoch": 21.428571428571427,
+      "grad_norm": 74.16987609863281,
+      "learning_rate": 1.0493636363636363e-05,
+      "loss": 24.2689,
+      "step": 1650
+    },
+    {
+      "epoch": 22.142857142857142,
+      "grad_norm": 82.25133514404297,
+      "learning_rate": 1.0843636363636363e-05,
+      "loss": 22.6963,
+      "step": 1705
+    },
+    {
+      "epoch": 22.857142857142858,
+      "grad_norm": 74.76679229736328,
+      "learning_rate": 1.1193636363636363e-05,
+      "loss": 21.3257,
+      "step": 1760
+    },
+    {
+      "epoch": 23.571428571428573,
+      "grad_norm": 68.91163635253906,
+      "learning_rate": 1.1543636363636365e-05,
+      "loss": 20.2199,
+      "step": 1815
+    },
+    {
+      "epoch": 24.285714285714285,
+      "grad_norm": 59.86214828491211,
+      "learning_rate": 1.1893636363636363e-05,
+      "loss": 19.3769,
+      "step": 1870
+    },
+    {
+      "epoch": 25.0,
+      "grad_norm": 76.9339370727539,
+      "learning_rate": 1.2243636363636363e-05,
+      "loss": 18.0471,
+      "step": 1925
+    },
+    {
+      "epoch": 25.714285714285715,
+      "grad_norm": 66.16152954101562,
+      "learning_rate": 1.2593636363636363e-05,
+      "loss": 17.496,
+      "step": 1980
+    },
+    {
+      "epoch": 26.428571428571427,
+      "grad_norm": 58.77778244018555,
+      "learning_rate": 1.2943636363636363e-05,
+      "loss": 16.9468,
+      "step": 2035
+    },
+    {
+      "epoch": 27.142857142857142,
+      "grad_norm": 71.95783233642578,
+      "learning_rate": 1.3293636363636363e-05,
+      "loss": 16.3026,
+      "step": 2090
+    },
+    {
+      "epoch": 27.857142857142858,
+      "grad_norm": 131.7191619873047,
+      "learning_rate": 1.3643636363636363e-05,
+      "loss": 16.008,
+      "step": 2145
+    },
+    {
+      "epoch": 28.571428571428573,
+      "grad_norm": 81.78388977050781,
+      "learning_rate": 1.3993636363636363e-05,
+      "loss": 15.4616,
+      "step": 2200
+    },
+    {
+      "epoch": 29.285714285714285,
+      "grad_norm": 60.10112380981445,
+      "learning_rate": 1.3628501228501228e-05,
+      "loss": 15.195,
+      "step": 2255
+    },
+    {
+      "epoch": 30.0,
+      "grad_norm": 77.59001922607422,
+      "learning_rate": 1.325012285012285e-05,
+      "loss": 14.7557,
+      "step": 2310
+    },
+    {
+      "epoch": 30.714285714285715,
+      "grad_norm": 77.3856201171875,
+      "learning_rate": 1.287174447174447e-05,
+      "loss": 14.2851,
+      "step": 2365
+    },
+    {
+      "epoch": 31.428571428571427,
+      "grad_norm": 73.75492095947266,
+      "learning_rate": 1.2493366093366094e-05,
+      "loss": 13.867,
+      "step": 2420
+    },
+    {
+      "epoch": 32.142857142857146,
+      "grad_norm": 78.76831817626953,
+      "learning_rate": 1.2114987714987713e-05,
+      "loss": 13.6677,
+      "step": 2475
+    },
+    {
+      "epoch": 32.857142857142854,
+      "grad_norm": 92.99346160888672,
+      "learning_rate": 1.1736609336609336e-05,
+      "loss": 13.1851,
+      "step": 2530
+    },
+    {
+      "epoch": 33.57142857142857,
+      "grad_norm": 97.57978820800781,
+      "learning_rate": 1.1358230958230958e-05,
+      "loss": 13.5215,
+      "step": 2585
+    },
+    {
+      "epoch": 34.285714285714285,
+      "grad_norm": 63.118141174316406,
+      "learning_rate": 1.0979852579852579e-05,
+      "loss": 12.8525,
+      "step": 2640
+    },
+    {
+      "epoch": 35.0,
+      "grad_norm": 63.68766403198242,
+      "learning_rate": 1.06014742014742e-05,
+      "loss": 12.441,
+      "step": 2695
+    },
+    {
+      "epoch": 35.714285714285715,
+      "grad_norm": 70.33533477783203,
+      "learning_rate": 1.0223095823095823e-05,
+      "loss": 12.2331,
+      "step": 2750
+    },
+    {
+      "epoch": 36.42857142857143,
+      "grad_norm": 64.16197967529297,
+      "learning_rate": 9.844717444717445e-06,
+      "loss": 11.7547,
+      "step": 2805
+    },
+    {
+      "epoch": 37.142857142857146,
+      "grad_norm": 85.83612823486328,
+      "learning_rate": 9.466339066339066e-06,
+      "loss": 11.8633,
+      "step": 2860
+    },
+    {
+      "epoch": 37.857142857142854,
+      "grad_norm": 89.40387725830078,
+      "learning_rate": 9.087960687960689e-06,
+      "loss": 11.5795,
+      "step": 2915
+    },
+    {
+      "epoch": 38.57142857142857,
+      "grad_norm": 76.38651275634766,
+      "learning_rate": 8.709582309582309e-06,
+      "loss": 11.334,
+      "step": 2970
+    },
+    {
+      "epoch": 39.285714285714285,
+      "grad_norm": 110.11483764648438,
+      "learning_rate": 8.331203931203932e-06,
+      "loss": 10.805,
+      "step": 3025
+    },
+    {
+      "epoch": 40.0,
+      "grad_norm": 60.31315612792969,
+      "learning_rate": 7.952825552825553e-06,
+      "loss": 10.9056,
+      "step": 3080
+    },
+    {
+      "epoch": 40.714285714285715,
+      "grad_norm": 107.96589660644531,
+      "learning_rate": 7.574447174447175e-06,
+      "loss": 10.5828,
+      "step": 3135
+    },
+    {
+      "epoch": 41.42857142857143,
+      "grad_norm": 74.8004379272461,
+      "learning_rate": 7.1960687960687955e-06,
+      "loss": 10.2818,
+      "step": 3190
+    },
+    {
+      "epoch": 42.142857142857146,
+      "grad_norm": 54.093475341796875,
+      "learning_rate": 6.817690417690418e-06,
+      "loss": 10.0785,
+      "step": 3245
+    },
+    {
+      "epoch": 42.857142857142854,
+      "grad_norm": 115.28564453125,
+      "learning_rate": 6.439312039312039e-06,
+      "loss": 9.8794,
+      "step": 3300
+    },
+    {
+      "epoch": 43.57142857142857,
+      "grad_norm": 52.57551956176758,
+      "learning_rate": 6.06093366093366e-06,
+      "loss": 9.7072,
+      "step": 3355
+    },
+    {
+      "epoch": 44.285714285714285,
+      "grad_norm": 51.994075775146484,
+      "learning_rate": 5.682555282555282e-06,
+      "loss": 9.6015,
+      "step": 3410
+    },
+    {
+      "epoch": 45.0,
+      "grad_norm": 73.08104705810547,
+      "learning_rate": 5.304176904176904e-06,
+      "loss": 9.305,
+      "step": 3465
+    },
+    {
+      "epoch": 45.714285714285715,
+      "grad_norm": 75.5807876586914,
+      "learning_rate": 4.925798525798525e-06,
+      "loss": 9.2281,
+      "step": 3520
+    },
+    {
+      "epoch": 46.42857142857143,
+      "grad_norm": 53.319637298583984,
+      "learning_rate": 4.547420147420147e-06,
+      "loss": 8.996,
+      "step": 3575
+    },
+    {
+      "epoch": 47.142857142857146,
+      "grad_norm": 72.28289794921875,
+      "learning_rate": 4.1690417690417685e-06,
+      "loss": 9.0072,
+      "step": 3630
+    },
+    {
+      "epoch": 47.857142857142854,
+      "grad_norm": 66.79710388183594,
+      "learning_rate": 3.7906633906633902e-06,
+      "loss": 8.7311,
+      "step": 3685
+    },
+    {
+      "epoch": 48.57142857142857,
+      "grad_norm": 83.55674743652344,
+      "learning_rate": 3.4122850122850124e-06,
+      "loss": 8.5959,
+      "step": 3740
+    },
+    {
+      "epoch": 49.285714285714285,
+      "grad_norm": 78.8072738647461,
+      "learning_rate": 3.0339066339066337e-06,
+      "loss": 8.5462,
+      "step": 3795
+    },
+    {
+      "epoch": 50.0,
+      "grad_norm": 102.47228240966797,
+      "learning_rate": 2.6555282555282554e-06,
+      "loss": 8.2928,
+      "step": 3850
+    },
+    {
+      "epoch": 50.714285714285715,
+      "grad_norm": 93.27884674072266,
+      "learning_rate": 2.277149877149877e-06,
+      "loss": 8.1427,
+      "step": 3905
+    },
+    {
+      "epoch": 51.42857142857143,
+      "grad_norm": 137.4209747314453,
+      "learning_rate": 1.8987714987714987e-06,
+      "loss": 8.164,
+      "step": 3960
+    }
+  ],
+  "logging_steps": 55,
+  "max_steps": 4235,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 55,
+  "save_steps": 220,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 6.2339349145809715e+19,
+  "train_batch_size": 28,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-3960/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:99e55f6c266fb80fff7a194cd0925963d93d119d60f4443cb609bfd824b16fd5
+size 5841

checkpoint-4180/config.json ADDED Viewed

	@@ -0,0 +1,129 @@

+{
+  "activation_dropout": 0.0,
+  "activation_function": "silu",
+  "anchor_image_size": null,
+  "architectures": [
+    "RTDetrV2ForObjectDetection"
+  ],
+  "attention_dropout": 0.0,
+  "auxiliary_loss": true,
+  "backbone": null,
+  "backbone_config": {
+    "depths": [
+      3,
+      4,
+      23,
+      3
+    ],
+    "downsample_in_bottleneck": false,
+    "downsample_in_first_stage": false,
+    "embedding_size": 64,
+    "hidden_act": "relu",
+    "hidden_sizes": [
+      256,
+      512,
+      1024,
+      2048
+    ],
+    "layer_type": "bottleneck",
+    "model_type": "rt_detr_resnet",
+    "num_channels": 3,
+    "out_features": [
+      "stage2",
+      "stage3",
+      "stage4"
+    ],
+    "out_indices": [
+      2,
+      3,
+      4
+    ],
+    "stage_names": [
+      "stem",
+      "stage1",
+      "stage2",
+      "stage3",
+      "stage4"
+    ],
+    "torch_dtype": "float32"
+  },
+  "backbone_kwargs": null,
+  "batch_norm_eps": 1e-05,
+  "box_noise_scale": 1.0,
+  "d_model": 256,
+  "decoder_activation_function": "relu",
+  "decoder_attention_heads": 8,
+  "decoder_ffn_dim": 1024,
+  "decoder_in_channels": [
+    384,
+    384,
+    384
+  ],
+  "decoder_layers": 6,
+  "decoder_method": "default",
+  "decoder_n_levels": 3,
+  "decoder_n_points": 4,
+  "decoder_offset_scale": 0.5,
+  "disable_custom_kernels": true,
+  "dropout": 0.0,
+  "encode_proj_layers": [
+    2
+  ],
+  "encoder_activation_function": "gelu",
+  "encoder_attention_heads": 8,
+  "encoder_ffn_dim": 2048,
+  "encoder_hidden_dim": 384,
+  "encoder_in_channels": [
+    512,
+    1024,
+    2048
+  ],
+  "encoder_layers": 1,
+  "eos_coefficient": 0.0001,
+  "eval_size": null,
+  "feat_strides": [
+    8,
+    16,
+    32
+  ],
+  "focal_loss_alpha": 0.75,
+  "focal_loss_gamma": 2.0,
+  "freeze_backbone_batch_norms": true,
+  "hidden_expansion": 1.0,
+  "id2label": {
+    "0": "LABEL_0",
+    "1": "LABEL_1",
+    "2": "LABEL_2"
+  },
+  "initializer_bias_prior_prob": null,
+  "initializer_range": 0.01,
+  "is_encoder_decoder": true,
+  "label2id": {
+    "LABEL_0": 0,
+    "LABEL_1": 1,
+    "LABEL_2": 2
+  },
+  "label_noise_ratio": 0.5,
+  "layer_norm_eps": 1e-05,
+  "learn_initial_query": false,
+  "matcher_alpha": 0.25,
+  "matcher_bbox_cost": 5.0,
+  "matcher_class_cost": 2.0,
+  "matcher_gamma": 2.0,
+  "matcher_giou_cost": 2.0,
+  "model_type": "rt_detr_v2",
+  "normalize_before": false,
+  "num_denoising": 100,
+  "num_feature_levels": 3,
+  "num_queries": 300,
+  "positional_encoding_temperature": 10000,
+  "torch_dtype": "float32",
+  "transformers_version": "4.55.2",
+  "use_focal_loss": true,
+  "use_pretrained_backbone": false,
+  "use_timm_backbone": false,
+  "weight_loss_bbox": 5.0,
+  "weight_loss_giou": 2.0,
+  "weight_loss_vfl": 1.0,
+  "with_box_refine": true
+}

checkpoint-4180/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7a3708ff7eb478f4d78afc03d6682682b88855ad74bd90d61a1f44bd6cbd9031
+size 306699044

checkpoint-4180/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c37e9d87c40ec6bec2836994bbdc85c72273474444714cbc9174eedffff8cbce
+size 611580898

checkpoint-4180/preprocessor_config.json ADDED Viewed

	@@ -0,0 +1,26 @@

+{
+  "do_convert_annotations": true,
+  "do_normalize": false,
+  "do_pad": false,
+  "do_rescale": true,
+  "do_resize": true,
+  "format": "coco_detection",
+  "image_mean": [
+    0.485,
+    0.456,
+    0.406
+  ],
+  "image_processor_type": "RTDetrImageProcessor",
+  "image_std": [
+    0.229,
+    0.224,
+    0.225
+  ],
+  "pad_size": null,
+  "resample": 2,
+  "rescale_factor": 0.00392156862745098,
+  "size": {
+    "height": 640,
+    "width": 640
+  }
+}

checkpoint-4180/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:fa8987e65fa1b372b40e3601811f025fddf3af32827da76164d695e4a6697a78
+size 14645

checkpoint-4180/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f8a0d01e3953f2300825d40619ebf7431436db245ce8c643859c6c66bd4e6043
+size 1465

checkpoint-4180/trainer_state.json ADDED Viewed

	@@ -0,0 +1,566 @@

+{
+  "best_global_step": null,
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 54.285714285714285,
+  "eval_steps": 500,
+  "global_step": 4180,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.7142857142857143,
+      "grad_norm": 4405.81884765625,
+      "learning_rate": 3.436363636363636e-07,
+      "loss": 1357.5645,
+      "step": 55
+    },
+    {
+      "epoch": 1.4285714285714286,
+      "grad_norm": 5894.37841796875,
+      "learning_rate": 6.936363636363637e-07,
+      "loss": 1290.9688,
+      "step": 110
+    },
+    {
+      "epoch": 2.142857142857143,
+      "grad_norm": 3667.852294921875,
+      "learning_rate": 1.0436363636363635e-06,
+      "loss": 1140.9515,
+      "step": 165
+    },
+    {
+      "epoch": 2.857142857142857,
+      "grad_norm": 3578.294677734375,
+      "learning_rate": 1.3936363636363637e-06,
+      "loss": 942.618,
+      "step": 220
+    },
+    {
+      "epoch": 3.571428571428571,
+      "grad_norm": 2097.637939453125,
+      "learning_rate": 1.7436363636363636e-06,
+      "loss": 721.2856,
+      "step": 275
+    },
+    {
+      "epoch": 4.285714285714286,
+      "grad_norm": 1840.612548828125,
+      "learning_rate": 2.0936363636363636e-06,
+      "loss": 525.8542,
+      "step": 330
+    },
+    {
+      "epoch": 5.0,
+      "grad_norm": 1230.875,
+      "learning_rate": 2.4436363636363636e-06,
+      "loss": 397.7722,
+      "step": 385
+    },
+    {
+      "epoch": 5.714285714285714,
+      "grad_norm": 1280.699951171875,
+      "learning_rate": 2.7936363636363637e-06,
+      "loss": 313.8322,
+      "step": 440
+    },
+    {
+      "epoch": 6.428571428571429,
+      "grad_norm": 4265.28759765625,
+      "learning_rate": 3.1436363636363637e-06,
+      "loss": 254.1449,
+      "step": 495
+    },
+    {
+      "epoch": 7.142857142857143,
+      "grad_norm": 967.1757202148438,
+      "learning_rate": 3.4936363636363633e-06,
+      "loss": 218.4529,
+      "step": 550
+    },
+    {
+      "epoch": 7.857142857142857,
+      "grad_norm": 765.2302856445312,
+      "learning_rate": 3.843636363636364e-06,
+      "loss": 197.915,
+      "step": 605
+    },
+    {
+      "epoch": 8.571428571428571,
+      "grad_norm": 700.331787109375,
+      "learning_rate": 4.193636363636364e-06,
+      "loss": 170.9019,
+      "step": 660
+    },
+    {
+      "epoch": 9.285714285714286,
+      "grad_norm": 613.8758544921875,
+      "learning_rate": 4.543636363636363e-06,
+      "loss": 154.6195,
+      "step": 715
+    },
+    {
+      "epoch": 10.0,
+      "grad_norm": 3405.25732421875,
+      "learning_rate": 4.893636363636364e-06,
+      "loss": 136.8394,
+      "step": 770
+    },
+    {
+      "epoch": 10.714285714285714,
+      "grad_norm": 1219.8994140625,
+      "learning_rate": 5.243636363636364e-06,
+      "loss": 116.0246,
+      "step": 825
+    },
+    {
+      "epoch": 11.428571428571429,
+      "grad_norm": 306.2723083496094,
+      "learning_rate": 5.593636363636363e-06,
+      "loss": 104.2055,
+      "step": 880
+    },
+    {
+      "epoch": 12.142857142857142,
+      "grad_norm": 288.2547302246094,
+      "learning_rate": 5.943636363636364e-06,
+      "loss": 88.9812,
+      "step": 935
+    },
+    {
+      "epoch": 12.857142857142858,
+      "grad_norm": 1016.5924682617188,
+      "learning_rate": 6.293636363636363e-06,
+      "loss": 79.9017,
+      "step": 990
+    },
+    {
+      "epoch": 13.571428571428571,
+      "grad_norm": 239.49191284179688,
+      "learning_rate": 6.643636363636363e-06,
+      "loss": 73.6932,
+      "step": 1045
+    },
+    {
+      "epoch": 14.285714285714286,
+      "grad_norm": 193.92002868652344,
+      "learning_rate": 6.993636363636364e-06,
+      "loss": 62.2018,
+      "step": 1100
+    },
+    {
+      "epoch": 15.0,
+      "grad_norm": 179.0568084716797,
+      "learning_rate": 7.343636363636363e-06,
+      "loss": 54.0213,
+      "step": 1155
+    },
+    {
+      "epoch": 15.714285714285714,
+      "grad_norm": 166.02944946289062,
+      "learning_rate": 7.693636363636364e-06,
+      "loss": 48.1955,
+      "step": 1210
+    },
+    {
+      "epoch": 16.428571428571427,
+      "grad_norm": 126.53916931152344,
+      "learning_rate": 8.043636363636364e-06,
+      "loss": 43.5431,
+      "step": 1265
+    },
+    {
+      "epoch": 17.142857142857142,
+      "grad_norm": 145.61166381835938,
+      "learning_rate": 8.393636363636363e-06,
+      "loss": 41.4399,
+      "step": 1320
+    },
+    {
+      "epoch": 17.857142857142858,
+      "grad_norm": 122.2297134399414,
+      "learning_rate": 8.743636363636363e-06,
+      "loss": 35.2278,
+      "step": 1375
+    },
+    {
+      "epoch": 18.571428571428573,
+      "grad_norm": 117.88919067382812,
+      "learning_rate": 9.093636363636363e-06,
+      "loss": 31.2827,
+      "step": 1430
+    },
+    {
+      "epoch": 19.285714285714285,
+      "grad_norm": 88.52986907958984,
+      "learning_rate": 9.443636363636364e-06,
+      "loss": 28.8076,
+      "step": 1485
+    },
+    {
+      "epoch": 20.0,
+      "grad_norm": 88.49090576171875,
+      "learning_rate": 9.793636363636364e-06,
+      "loss": 28.232,
+      "step": 1540
+    },
+    {
+      "epoch": 20.714285714285715,
+      "grad_norm": 114.45001983642578,
+      "learning_rate": 1.0143636363636363e-05,
+      "loss": 26.0885,
+      "step": 1595
+    },
+    {
+      "epoch": 21.428571428571427,
+      "grad_norm": 74.16987609863281,
+      "learning_rate": 1.0493636363636363e-05,
+      "loss": 24.2689,
+      "step": 1650
+    },
+    {
+      "epoch": 22.142857142857142,
+      "grad_norm": 82.25133514404297,
+      "learning_rate": 1.0843636363636363e-05,
+      "loss": 22.6963,
+      "step": 1705
+    },
+    {
+      "epoch": 22.857142857142858,
+      "grad_norm": 74.76679229736328,
+      "learning_rate": 1.1193636363636363e-05,
+      "loss": 21.3257,
+      "step": 1760
+    },
+    {
+      "epoch": 23.571428571428573,
+      "grad_norm": 68.91163635253906,
+      "learning_rate": 1.1543636363636365e-05,
+      "loss": 20.2199,
+      "step": 1815
+    },
+    {
+      "epoch": 24.285714285714285,
+      "grad_norm": 59.86214828491211,
+      "learning_rate": 1.1893636363636363e-05,
+      "loss": 19.3769,
+      "step": 1870
+    },
+    {
+      "epoch": 25.0,
+      "grad_norm": 76.9339370727539,
+      "learning_rate": 1.2243636363636363e-05,
+      "loss": 18.0471,
+      "step": 1925
+    },
+    {
+      "epoch": 25.714285714285715,
+      "grad_norm": 66.16152954101562,
+      "learning_rate": 1.2593636363636363e-05,
+      "loss": 17.496,
+      "step": 1980
+    },
+    {
+      "epoch": 26.428571428571427,
+      "grad_norm": 58.77778244018555,
+      "learning_rate": 1.2943636363636363e-05,
+      "loss": 16.9468,
+      "step": 2035
+    },
+    {
+      "epoch": 27.142857142857142,
+      "grad_norm": 71.95783233642578,
+      "learning_rate": 1.3293636363636363e-05,
+      "loss": 16.3026,
+      "step": 2090
+    },
+    {
+      "epoch": 27.857142857142858,
+      "grad_norm": 131.7191619873047,
+      "learning_rate": 1.3643636363636363e-05,
+      "loss": 16.008,
+      "step": 2145
+    },
+    {
+      "epoch": 28.571428571428573,
+      "grad_norm": 81.78388977050781,
+      "learning_rate": 1.3993636363636363e-05,
+      "loss": 15.4616,
+      "step": 2200
+    },
+    {
+      "epoch": 29.285714285714285,
+      "grad_norm": 60.10112380981445,
+      "learning_rate": 1.3628501228501228e-05,
+      "loss": 15.195,
+      "step": 2255
+    },
+    {
+      "epoch": 30.0,
+      "grad_norm": 77.59001922607422,
+      "learning_rate": 1.325012285012285e-05,
+      "loss": 14.7557,
+      "step": 2310
+    },
+    {
+      "epoch": 30.714285714285715,
+      "grad_norm": 77.3856201171875,
+      "learning_rate": 1.287174447174447e-05,
+      "loss": 14.2851,
+      "step": 2365
+    },
+    {
+      "epoch": 31.428571428571427,
+      "grad_norm": 73.75492095947266,
+      "learning_rate": 1.2493366093366094e-05,
+      "loss": 13.867,
+      "step": 2420
+    },
+    {
+      "epoch": 32.142857142857146,
+      "grad_norm": 78.76831817626953,
+      "learning_rate": 1.2114987714987713e-05,
+      "loss": 13.6677,
+      "step": 2475
+    },
+    {
+      "epoch": 32.857142857142854,
+      "grad_norm": 92.99346160888672,
+      "learning_rate": 1.1736609336609336e-05,
+      "loss": 13.1851,
+      "step": 2530
+    },
+    {
+      "epoch": 33.57142857142857,
+      "grad_norm": 97.57978820800781,
+      "learning_rate": 1.1358230958230958e-05,
+      "loss": 13.5215,
+      "step": 2585
+    },
+    {
+      "epoch": 34.285714285714285,
+      "grad_norm": 63.118141174316406,
+      "learning_rate": 1.0979852579852579e-05,
+      "loss": 12.8525,
+      "step": 2640
+    },
+    {
+      "epoch": 35.0,
+      "grad_norm": 63.68766403198242,
+      "learning_rate": 1.06014742014742e-05,
+      "loss": 12.441,
+      "step": 2695
+    },
+    {
+      "epoch": 35.714285714285715,
+      "grad_norm": 70.33533477783203,
+      "learning_rate": 1.0223095823095823e-05,
+      "loss": 12.2331,
+      "step": 2750
+    },
+    {
+      "epoch": 36.42857142857143,
+      "grad_norm": 64.16197967529297,
+      "learning_rate": 9.844717444717445e-06,
+      "loss": 11.7547,
+      "step": 2805
+    },
+    {
+      "epoch": 37.142857142857146,
+      "grad_norm": 85.83612823486328,
+      "learning_rate": 9.466339066339066e-06,
+      "loss": 11.8633,
+      "step": 2860
+    },
+    {
+      "epoch": 37.857142857142854,
+      "grad_norm": 89.40387725830078,
+      "learning_rate": 9.087960687960689e-06,
+      "loss": 11.5795,
+      "step": 2915
+    },
+    {
+      "epoch": 38.57142857142857,
+      "grad_norm": 76.38651275634766,
+      "learning_rate": 8.709582309582309e-06,
+      "loss": 11.334,
+      "step": 2970
+    },
+    {
+      "epoch": 39.285714285714285,
+      "grad_norm": 110.11483764648438,
+      "learning_rate": 8.331203931203932e-06,
+      "loss": 10.805,
+      "step": 3025
+    },
+    {
+      "epoch": 40.0,
+      "grad_norm": 60.31315612792969,
+      "learning_rate": 7.952825552825553e-06,
+      "loss": 10.9056,
+      "step": 3080
+    },
+    {
+      "epoch": 40.714285714285715,
+      "grad_norm": 107.96589660644531,
+      "learning_rate": 7.574447174447175e-06,
+      "loss": 10.5828,
+      "step": 3135
+    },
+    {
+      "epoch": 41.42857142857143,
+      "grad_norm": 74.8004379272461,
+      "learning_rate": 7.1960687960687955e-06,
+      "loss": 10.2818,
+      "step": 3190
+    },
+    {
+      "epoch": 42.142857142857146,
+      "grad_norm": 54.093475341796875,
+      "learning_rate": 6.817690417690418e-06,
+      "loss": 10.0785,
+      "step": 3245
+    },
+    {
+      "epoch": 42.857142857142854,
+      "grad_norm": 115.28564453125,
+      "learning_rate": 6.439312039312039e-06,
+      "loss": 9.8794,
+      "step": 3300
+    },
+    {
+      "epoch": 43.57142857142857,
+      "grad_norm": 52.57551956176758,
+      "learning_rate": 6.06093366093366e-06,
+      "loss": 9.7072,
+      "step": 3355
+    },
+    {
+      "epoch": 44.285714285714285,
+      "grad_norm": 51.994075775146484,
+      "learning_rate": 5.682555282555282e-06,
+      "loss": 9.6015,
+      "step": 3410
+    },
+    {
+      "epoch": 45.0,
+      "grad_norm": 73.08104705810547,
+      "learning_rate": 5.304176904176904e-06,
+      "loss": 9.305,
+      "step": 3465
+    },
+    {
+      "epoch": 45.714285714285715,
+      "grad_norm": 75.5807876586914,
+      "learning_rate": 4.925798525798525e-06,
+      "loss": 9.2281,
+      "step": 3520
+    },
+    {
+      "epoch": 46.42857142857143,
+      "grad_norm": 53.319637298583984,
+      "learning_rate": 4.547420147420147e-06,
+      "loss": 8.996,
+      "step": 3575
+    },
+    {
+      "epoch": 47.142857142857146,
+      "grad_norm": 72.28289794921875,
+      "learning_rate": 4.1690417690417685e-06,
+      "loss": 9.0072,
+      "step": 3630
+    },
+    {
+      "epoch": 47.857142857142854,
+      "grad_norm": 66.79710388183594,
+      "learning_rate": 3.7906633906633902e-06,
+      "loss": 8.7311,
+      "step": 3685
+    },
+    {
+      "epoch": 48.57142857142857,
+      "grad_norm": 83.55674743652344,
+      "learning_rate": 3.4122850122850124e-06,
+      "loss": 8.5959,
+      "step": 3740
+    },
+    {
+      "epoch": 49.285714285714285,
+      "grad_norm": 78.8072738647461,
+      "learning_rate": 3.0339066339066337e-06,
+      "loss": 8.5462,
+      "step": 3795
+    },
+    {
+      "epoch": 50.0,
+      "grad_norm": 102.47228240966797,
+      "learning_rate": 2.6555282555282554e-06,
+      "loss": 8.2928,
+      "step": 3850
+    },
+    {
+      "epoch": 50.714285714285715,
+      "grad_norm": 93.27884674072266,
+      "learning_rate": 2.277149877149877e-06,
+      "loss": 8.1427,
+      "step": 3905
+    },
+    {
+      "epoch": 51.42857142857143,
+      "grad_norm": 137.4209747314453,
+      "learning_rate": 1.8987714987714987e-06,
+      "loss": 8.164,
+      "step": 3960
+    },
+    {
+      "epoch": 52.142857142857146,
+      "grad_norm": 38.38957214355469,
+      "learning_rate": 1.5203931203931202e-06,
+      "loss": 7.8464,
+      "step": 4015
+    },
+    {
+      "epoch": 52.857142857142854,
+      "grad_norm": 63.25676727294922,
+      "learning_rate": 1.1420147420147421e-06,
+      "loss": 7.8844,
+      "step": 4070
+    },
+    {
+      "epoch": 53.57142857142857,
+      "grad_norm": 46.60155487060547,
+      "learning_rate": 7.636363636363636e-07,
+      "loss": 7.5751,
+      "step": 4125
+    },
+    {
+      "epoch": 54.285714285714285,
+      "grad_norm": 56.5892448425293,
+      "learning_rate": 3.8525798525798526e-07,
+      "loss": 7.7376,
+      "step": 4180
+    }
+  ],
+  "logging_steps": 55,
+  "max_steps": 4235,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 55,
+  "save_steps": 220,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 6.5802270813998285e+19,
+  "train_batch_size": 28,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-4180/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:99e55f6c266fb80fff7a194cd0925963d93d119d60f4443cb609bfd824b16fd5
+size 5841

checkpoint-4235/config.json ADDED Viewed

	@@ -0,0 +1,129 @@

+{
+  "activation_dropout": 0.0,
+  "activation_function": "silu",
+  "anchor_image_size": null,
+  "architectures": [
+    "RTDetrV2ForObjectDetection"
+  ],
+  "attention_dropout": 0.0,
+  "auxiliary_loss": true,
+  "backbone": null,
+  "backbone_config": {
+    "depths": [
+      3,
+      4,
+      23,
+      3
+    ],
+    "downsample_in_bottleneck": false,
+    "downsample_in_first_stage": false,
+    "embedding_size": 64,
+    "hidden_act": "relu",
+    "hidden_sizes": [
+      256,
+      512,
+      1024,
+      2048
+    ],
+    "layer_type": "bottleneck",
+    "model_type": "rt_detr_resnet",
+    "num_channels": 3,
+    "out_features": [
+      "stage2",
+      "stage3",
+      "stage4"
+    ],
+    "out_indices": [
+      2,
+      3,
+      4
+    ],
+    "stage_names": [
+      "stem",
+      "stage1",
+      "stage2",
+      "stage3",
+      "stage4"
+    ],
+    "torch_dtype": "float32"
+  },
+  "backbone_kwargs": null,
+  "batch_norm_eps": 1e-05,
+  "box_noise_scale": 1.0,
+  "d_model": 256,
+  "decoder_activation_function": "relu",
+  "decoder_attention_heads": 8,
+  "decoder_ffn_dim": 1024,
+  "decoder_in_channels": [
+    384,
+    384,
+    384
+  ],
+  "decoder_layers": 6,
+  "decoder_method": "default",
+  "decoder_n_levels": 3,
+  "decoder_n_points": 4,
+  "decoder_offset_scale": 0.5,
+  "disable_custom_kernels": true,
+  "dropout": 0.0,
+  "encode_proj_layers": [
+    2
+  ],
+  "encoder_activation_function": "gelu",
+  "encoder_attention_heads": 8,
+  "encoder_ffn_dim": 2048,
+  "encoder_hidden_dim": 384,
+  "encoder_in_channels": [
+    512,
+    1024,
+    2048
+  ],
+  "encoder_layers": 1,
+  "eos_coefficient": 0.0001,
+  "eval_size": null,
+  "feat_strides": [
+    8,
+    16,
+    32
+  ],
+  "focal_loss_alpha": 0.75,
+  "focal_loss_gamma": 2.0,
+  "freeze_backbone_batch_norms": true,
+  "hidden_expansion": 1.0,
+  "id2label": {
+    "0": "LABEL_0",
+    "1": "LABEL_1",
+    "2": "LABEL_2"
+  },
+  "initializer_bias_prior_prob": null,
+  "initializer_range": 0.01,
+  "is_encoder_decoder": true,
+  "label2id": {
+    "LABEL_0": 0,
+    "LABEL_1": 1,
+    "LABEL_2": 2
+  },
+  "label_noise_ratio": 0.5,
+  "layer_norm_eps": 1e-05,
+  "learn_initial_query": false,
+  "matcher_alpha": 0.25,
+  "matcher_bbox_cost": 5.0,
+  "matcher_class_cost": 2.0,
+  "matcher_gamma": 2.0,
+  "matcher_giou_cost": 2.0,
+  "model_type": "rt_detr_v2",
+  "normalize_before": false,
+  "num_denoising": 100,
+  "num_feature_levels": 3,
+  "num_queries": 300,
+  "positional_encoding_temperature": 10000,
+  "torch_dtype": "float32",
+  "transformers_version": "4.55.2",
+  "use_focal_loss": true,
+  "use_pretrained_backbone": false,
+  "use_timm_backbone": false,
+  "weight_loss_bbox": 5.0,
+  "weight_loss_giou": 2.0,
+  "weight_loss_vfl": 1.0,
+  "with_box_refine": true
+}

checkpoint-4235/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a93c80de10ffd31fe782054b3e02c6be5b97bb74ab13990ee1c9c50346f43fba
+size 306699044

checkpoint-4235/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:97305cabfe1039400d2343d85b38ae0e37694a3e342a6319f2687d14ec72953e
+size 611580898

checkpoint-4235/preprocessor_config.json ADDED Viewed

	@@ -0,0 +1,26 @@

+{
+  "do_convert_annotations": true,
+  "do_normalize": false,
+  "do_pad": false,
+  "do_rescale": true,
+  "do_resize": true,
+  "format": "coco_detection",
+  "image_mean": [
+    0.485,
+    0.456,
+    0.406
+  ],
+  "image_processor_type": "RTDetrImageProcessor",
+  "image_std": [
+    0.229,
+    0.224,
+    0.225
+  ],
+  "pad_size": null,
+  "resample": 2,
+  "rescale_factor": 0.00392156862745098,
+  "size": {
+    "height": 640,
+    "width": 640
+  }
+}

checkpoint-4235/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:52710090d6cfecdf10ea9486a80f6062200f2525471ac4971080093c461ef84c
+size 14645

checkpoint-4235/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f961f56765e0678d862d847e28c6b1236181897dd1cc787bb5549277ecbd035c
+size 1465

checkpoint-4235/trainer_state.json ADDED Viewed

	@@ -0,0 +1,573 @@

+{
+  "best_global_step": null,
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 55.0,
+  "eval_steps": 500,
+  "global_step": 4235,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.7142857142857143,
+      "grad_norm": 4405.81884765625,
+      "learning_rate": 3.436363636363636e-07,
+      "loss": 1357.5645,
+      "step": 55
+    },
+    {
+      "epoch": 1.4285714285714286,
+      "grad_norm": 5894.37841796875,
+      "learning_rate": 6.936363636363637e-07,
+      "loss": 1290.9688,
+      "step": 110
+    },
+    {
+      "epoch": 2.142857142857143,
+      "grad_norm": 3667.852294921875,
+      "learning_rate": 1.0436363636363635e-06,
+      "loss": 1140.9515,
+      "step": 165
+    },
+    {
+      "epoch": 2.857142857142857,
+      "grad_norm": 3578.294677734375,
+      "learning_rate": 1.3936363636363637e-06,
+      "loss": 942.618,
+      "step": 220
+    },
+    {
+      "epoch": 3.571428571428571,
+      "grad_norm": 2097.637939453125,
+      "learning_rate": 1.7436363636363636e-06,
+      "loss": 721.2856,
+      "step": 275
+    },
+    {
+      "epoch": 4.285714285714286,
+      "grad_norm": 1840.612548828125,
+      "learning_rate": 2.0936363636363636e-06,
+      "loss": 525.8542,
+      "step": 330
+    },
+    {
+      "epoch": 5.0,
+      "grad_norm": 1230.875,
+      "learning_rate": 2.4436363636363636e-06,
+      "loss": 397.7722,
+      "step": 385
+    },
+    {
+      "epoch": 5.714285714285714,
+      "grad_norm": 1280.699951171875,
+      "learning_rate": 2.7936363636363637e-06,
+      "loss": 313.8322,
+      "step": 440
+    },
+    {
+      "epoch": 6.428571428571429,
+      "grad_norm": 4265.28759765625,
+      "learning_rate": 3.1436363636363637e-06,
+      "loss": 254.1449,
+      "step": 495
+    },
+    {
+      "epoch": 7.142857142857143,
+      "grad_norm": 967.1757202148438,
+      "learning_rate": 3.4936363636363633e-06,
+      "loss": 218.4529,
+      "step": 550
+    },
+    {
+      "epoch": 7.857142857142857,
+      "grad_norm": 765.2302856445312,
+      "learning_rate": 3.843636363636364e-06,
+      "loss": 197.915,
+      "step": 605
+    },
+    {
+      "epoch": 8.571428571428571,
+      "grad_norm": 700.331787109375,
+      "learning_rate": 4.193636363636364e-06,
+      "loss": 170.9019,
+      "step": 660
+    },
+    {
+      "epoch": 9.285714285714286,
+      "grad_norm": 613.8758544921875,
+      "learning_rate": 4.543636363636363e-06,
+      "loss": 154.6195,
+      "step": 715
+    },
+    {
+      "epoch": 10.0,
+      "grad_norm": 3405.25732421875,
+      "learning_rate": 4.893636363636364e-06,
+      "loss": 136.8394,
+      "step": 770
+    },
+    {
+      "epoch": 10.714285714285714,
+      "grad_norm": 1219.8994140625,
+      "learning_rate": 5.243636363636364e-06,
+      "loss": 116.0246,
+      "step": 825
+    },
+    {
+      "epoch": 11.428571428571429,
+      "grad_norm": 306.2723083496094,
+      "learning_rate": 5.593636363636363e-06,
+      "loss": 104.2055,
+      "step": 880
+    },
+    {
+      "epoch": 12.142857142857142,
+      "grad_norm": 288.2547302246094,
+      "learning_rate": 5.943636363636364e-06,
+      "loss": 88.9812,
+      "step": 935
+    },
+    {
+      "epoch": 12.857142857142858,
+      "grad_norm": 1016.5924682617188,
+      "learning_rate": 6.293636363636363e-06,
+      "loss": 79.9017,
+      "step": 990
+    },
+    {
+      "epoch": 13.571428571428571,
+      "grad_norm": 239.49191284179688,
+      "learning_rate": 6.643636363636363e-06,
+      "loss": 73.6932,
+      "step": 1045
+    },
+    {
+      "epoch": 14.285714285714286,
+      "grad_norm": 193.92002868652344,
+      "learning_rate": 6.993636363636364e-06,
+      "loss": 62.2018,
+      "step": 1100
+    },
+    {
+      "epoch": 15.0,
+      "grad_norm": 179.0568084716797,
+      "learning_rate": 7.343636363636363e-06,
+      "loss": 54.0213,
+      "step": 1155
+    },
+    {
+      "epoch": 15.714285714285714,
+      "grad_norm": 166.02944946289062,
+      "learning_rate": 7.693636363636364e-06,
+      "loss": 48.1955,
+      "step": 1210
+    },
+    {
+      "epoch": 16.428571428571427,
+      "grad_norm": 126.53916931152344,
+      "learning_rate": 8.043636363636364e-06,
+      "loss": 43.5431,
+      "step": 1265
+    },
+    {
+      "epoch": 17.142857142857142,
+      "grad_norm": 145.61166381835938,
+      "learning_rate": 8.393636363636363e-06,
+      "loss": 41.4399,
+      "step": 1320
+    },
+    {
+      "epoch": 17.857142857142858,
+      "grad_norm": 122.2297134399414,
+      "learning_rate": 8.743636363636363e-06,
+      "loss": 35.2278,
+      "step": 1375
+    },
+    {
+      "epoch": 18.571428571428573,
+      "grad_norm": 117.88919067382812,
+      "learning_rate": 9.093636363636363e-06,
+      "loss": 31.2827,
+      "step": 1430
+    },
+    {
+      "epoch": 19.285714285714285,
+      "grad_norm": 88.52986907958984,
+      "learning_rate": 9.443636363636364e-06,
+      "loss": 28.8076,
+      "step": 1485
+    },
+    {
+      "epoch": 20.0,
+      "grad_norm": 88.49090576171875,
+      "learning_rate": 9.793636363636364e-06,
+      "loss": 28.232,
+      "step": 1540
+    },
+    {
+      "epoch": 20.714285714285715,
+      "grad_norm": 114.45001983642578,
+      "learning_rate": 1.0143636363636363e-05,
+      "loss": 26.0885,
+      "step": 1595
+    },
+    {
+      "epoch": 21.428571428571427,
+      "grad_norm": 74.16987609863281,
+      "learning_rate": 1.0493636363636363e-05,
+      "loss": 24.2689,
+      "step": 1650
+    },
+    {
+      "epoch": 22.142857142857142,
+      "grad_norm": 82.25133514404297,
+      "learning_rate": 1.0843636363636363e-05,
+      "loss": 22.6963,
+      "step": 1705
+    },
+    {
+      "epoch": 22.857142857142858,
+      "grad_norm": 74.76679229736328,
+      "learning_rate": 1.1193636363636363e-05,
+      "loss": 21.3257,
+      "step": 1760
+    },
+    {
+      "epoch": 23.571428571428573,
+      "grad_norm": 68.91163635253906,
+      "learning_rate": 1.1543636363636365e-05,
+      "loss": 20.2199,
+      "step": 1815
+    },
+    {
+      "epoch": 24.285714285714285,
+      "grad_norm": 59.86214828491211,
+      "learning_rate": 1.1893636363636363e-05,
+      "loss": 19.3769,
+      "step": 1870
+    },
+    {
+      "epoch": 25.0,
+      "grad_norm": 76.9339370727539,
+      "learning_rate": 1.2243636363636363e-05,
+      "loss": 18.0471,
+      "step": 1925
+    },
+    {
+      "epoch": 25.714285714285715,
+      "grad_norm": 66.16152954101562,
+      "learning_rate": 1.2593636363636363e-05,
+      "loss": 17.496,
+      "step": 1980
+    },
+    {
+      "epoch": 26.428571428571427,
+      "grad_norm": 58.77778244018555,
+      "learning_rate": 1.2943636363636363e-05,
+      "loss": 16.9468,
+      "step": 2035
+    },
+    {
+      "epoch": 27.142857142857142,
+      "grad_norm": 71.95783233642578,
+      "learning_rate": 1.3293636363636363e-05,
+      "loss": 16.3026,
+      "step": 2090
+    },
+    {
+      "epoch": 27.857142857142858,
+      "grad_norm": 131.7191619873047,
+      "learning_rate": 1.3643636363636363e-05,
+      "loss": 16.008,
+      "step": 2145
+    },
+    {
+      "epoch": 28.571428571428573,
+      "grad_norm": 81.78388977050781,
+      "learning_rate": 1.3993636363636363e-05,
+      "loss": 15.4616,
+      "step": 2200
+    },
+    {
+      "epoch": 29.285714285714285,
+      "grad_norm": 60.10112380981445,
+      "learning_rate": 1.3628501228501228e-05,
+      "loss": 15.195,
+      "step": 2255
+    },
+    {
+      "epoch": 30.0,
+      "grad_norm": 77.59001922607422,
+      "learning_rate": 1.325012285012285e-05,
+      "loss": 14.7557,
+      "step": 2310
+    },
+    {
+      "epoch": 30.714285714285715,
+      "grad_norm": 77.3856201171875,
+      "learning_rate": 1.287174447174447e-05,
+      "loss": 14.2851,
+      "step": 2365
+    },
+    {
+      "epoch": 31.428571428571427,
+      "grad_norm": 73.75492095947266,
+      "learning_rate": 1.2493366093366094e-05,
+      "loss": 13.867,
+      "step": 2420
+    },
+    {
+      "epoch": 32.142857142857146,
+      "grad_norm": 78.76831817626953,
+      "learning_rate": 1.2114987714987713e-05,
+      "loss": 13.6677,
+      "step": 2475
+    },
+    {
+      "epoch": 32.857142857142854,
+      "grad_norm": 92.99346160888672,
+      "learning_rate": 1.1736609336609336e-05,
+      "loss": 13.1851,
+      "step": 2530
+    },
+    {
+      "epoch": 33.57142857142857,
+      "grad_norm": 97.57978820800781,
+      "learning_rate": 1.1358230958230958e-05,
+      "loss": 13.5215,
+      "step": 2585
+    },
+    {
+      "epoch": 34.285714285714285,
+      "grad_norm": 63.118141174316406,
+      "learning_rate": 1.0979852579852579e-05,
+      "loss": 12.8525,
+      "step": 2640
+    },
+    {
+      "epoch": 35.0,
+      "grad_norm": 63.68766403198242,
+      "learning_rate": 1.06014742014742e-05,
+      "loss": 12.441,
+      "step": 2695
+    },
+    {
+      "epoch": 35.714285714285715,
+      "grad_norm": 70.33533477783203,
+      "learning_rate": 1.0223095823095823e-05,
+      "loss": 12.2331,
+      "step": 2750
+    },
+    {
+      "epoch": 36.42857142857143,
+      "grad_norm": 64.16197967529297,
+      "learning_rate": 9.844717444717445e-06,
+      "loss": 11.7547,
+      "step": 2805
+    },
+    {
+      "epoch": 37.142857142857146,
+      "grad_norm": 85.83612823486328,
+      "learning_rate": 9.466339066339066e-06,
+      "loss": 11.8633,
+      "step": 2860
+    },
+    {
+      "epoch": 37.857142857142854,
+      "grad_norm": 89.40387725830078,
+      "learning_rate": 9.087960687960689e-06,
+      "loss": 11.5795,
+      "step": 2915
+    },
+    {
+      "epoch": 38.57142857142857,
+      "grad_norm": 76.38651275634766,
+      "learning_rate": 8.709582309582309e-06,
+      "loss": 11.334,
+      "step": 2970
+    },
+    {
+      "epoch": 39.285714285714285,
+      "grad_norm": 110.11483764648438,
+      "learning_rate": 8.331203931203932e-06,
+      "loss": 10.805,
+      "step": 3025
+    },
+    {
+      "epoch": 40.0,
+      "grad_norm": 60.31315612792969,
+      "learning_rate": 7.952825552825553e-06,
+      "loss": 10.9056,
+      "step": 3080
+    },
+    {
+      "epoch": 40.714285714285715,
+      "grad_norm": 107.96589660644531,
+      "learning_rate": 7.574447174447175e-06,
+      "loss": 10.5828,
+      "step": 3135
+    },
+    {
+      "epoch": 41.42857142857143,
+      "grad_norm": 74.8004379272461,
+      "learning_rate": 7.1960687960687955e-06,
+      "loss": 10.2818,
+      "step": 3190
+    },
+    {
+      "epoch": 42.142857142857146,
+      "grad_norm": 54.093475341796875,
+      "learning_rate": 6.817690417690418e-06,
+      "loss": 10.0785,
+      "step": 3245
+    },
+    {
+      "epoch": 42.857142857142854,
+      "grad_norm": 115.28564453125,
+      "learning_rate": 6.439312039312039e-06,
+      "loss": 9.8794,
+      "step": 3300
+    },
+    {
+      "epoch": 43.57142857142857,
+      "grad_norm": 52.57551956176758,
+      "learning_rate": 6.06093366093366e-06,
+      "loss": 9.7072,
+      "step": 3355
+    },
+    {
+      "epoch": 44.285714285714285,
+      "grad_norm": 51.994075775146484,
+      "learning_rate": 5.682555282555282e-06,
+      "loss": 9.6015,
+      "step": 3410
+    },
+    {
+      "epoch": 45.0,
+      "grad_norm": 73.08104705810547,
+      "learning_rate": 5.304176904176904e-06,
+      "loss": 9.305,
+      "step": 3465
+    },
+    {
+      "epoch": 45.714285714285715,
+      "grad_norm": 75.5807876586914,
+      "learning_rate": 4.925798525798525e-06,
+      "loss": 9.2281,
+      "step": 3520
+    },
+    {
+      "epoch": 46.42857142857143,
+      "grad_norm": 53.319637298583984,
+      "learning_rate": 4.547420147420147e-06,
+      "loss": 8.996,
+      "step": 3575
+    },
+    {
+      "epoch": 47.142857142857146,
+      "grad_norm": 72.28289794921875,
+      "learning_rate": 4.1690417690417685e-06,
+      "loss": 9.0072,
+      "step": 3630
+    },
+    {
+      "epoch": 47.857142857142854,
+      "grad_norm": 66.79710388183594,
+      "learning_rate": 3.7906633906633902e-06,
+      "loss": 8.7311,
+      "step": 3685
+    },
+    {
+      "epoch": 48.57142857142857,
+      "grad_norm": 83.55674743652344,
+      "learning_rate": 3.4122850122850124e-06,
+      "loss": 8.5959,
+      "step": 3740
+    },
+    {
+      "epoch": 49.285714285714285,
+      "grad_norm": 78.8072738647461,
+      "learning_rate": 3.0339066339066337e-06,
+      "loss": 8.5462,
+      "step": 3795
+    },
+    {
+      "epoch": 50.0,
+      "grad_norm": 102.47228240966797,
+      "learning_rate": 2.6555282555282554e-06,
+      "loss": 8.2928,
+      "step": 3850
+    },
+    {
+      "epoch": 50.714285714285715,
+      "grad_norm": 93.27884674072266,
+      "learning_rate": 2.277149877149877e-06,
+      "loss": 8.1427,
+      "step": 3905
+    },
+    {
+      "epoch": 51.42857142857143,
+      "grad_norm": 137.4209747314453,
+      "learning_rate": 1.8987714987714987e-06,
+      "loss": 8.164,
+      "step": 3960
+    },
+    {
+      "epoch": 52.142857142857146,
+      "grad_norm": 38.38957214355469,
+      "learning_rate": 1.5203931203931202e-06,
+      "loss": 7.8464,
+      "step": 4015
+    },
+    {
+      "epoch": 52.857142857142854,
+      "grad_norm": 63.25676727294922,
+      "learning_rate": 1.1420147420147421e-06,
+      "loss": 7.8844,
+      "step": 4070
+    },
+    {
+      "epoch": 53.57142857142857,
+      "grad_norm": 46.60155487060547,
+      "learning_rate": 7.636363636363636e-07,
+      "loss": 7.5751,
+      "step": 4125
+    },
+    {
+      "epoch": 54.285714285714285,
+      "grad_norm": 56.5892448425293,
+      "learning_rate": 3.8525798525798526e-07,
+      "loss": 7.7376,
+      "step": 4180
+    },
+    {
+      "epoch": 55.0,
+      "grad_norm": 87.8992919921875,
+      "learning_rate": 6.879606879606879e-09,
+      "loss": 7.5818,
+      "step": 4235
+    }
+  ],
+  "logging_steps": 55,
+  "max_steps": 4235,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 55,
+  "save_steps": 220,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": true
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 6.666743797117747e+19,
+  "train_batch_size": 28,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-4235/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:99e55f6c266fb80fff7a194cd0925963d93d119d60f4443cb609bfd824b16fd5
+size 5841

config.json CHANGED Viewed

@@ -118,7 +118,7 @@
   "num_queries": 300,
   "positional_encoding_temperature": 10000,
   "torch_dtype": "float32",
-  "transformers_version": "4.55.0",
   "use_focal_loss": true,
   "use_pretrained_backbone": false,
   "use_timm_backbone": false,

   "num_queries": 300,
   "positional_encoding_temperature": 10000,
   "torch_dtype": "float32",
+  "transformers_version": "4.55.2",
   "use_focal_loss": true,
   "use_pretrained_backbone": false,
   "use_timm_backbone": false,

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d3a52d4cd4386295eedbfb267bc679eca4b27864d745fff06694c0f9dbf823a6
 size 306699044

 version https://git-lfs.github.com/spec/v1
+oid sha256:a93c80de10ffd31fe782054b3e02c6be5b97bb74ab13990ee1c9c50346f43fba
 size 306699044

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a7b84367094b7487f77de50fba614a6c6667e9cf018b77ee5bfc158268fc5eaf
-size 5368

 version https://git-lfs.github.com/spec/v1
+oid sha256:99e55f6c266fb80fff7a194cd0925963d93d119d60f4443cb609bfd824b16fd5
+size 5841