jnmrr committed on
Commit
fbe6e50
·
verified ·
1 Parent(s): 3f85937

Upload RT-DETRv2 voucher classifier

Browse files
README.md CHANGED
@@ -74,6 +74,33 @@ This model is a fine-tuned version of [PekingU/rtdetr_v2_r101vd](https://hugging
74
 
75
  **Final Evaluation Results:**
76
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
77
  **Model Configuration:**
78
  - **Base model**: PekingU/rtdetr_v2_r101vd
79
  - **Architecture**: rtdetr_v2_r101vd
@@ -90,12 +117,13 @@ This model is a fine-tuned version of [PekingU/rtdetr_v2_r101vd](https://hugging
90
  **Training Time**: 0.6 minutes
91
 
92
  **Training Summary:**
93
- - **Final training loss**: 1361.9480
 
94
 
95
 
96
  ### MLflow Tracking
97
 
98
- - **MLflow Run ID**: 65eb62e7fd564f99981143809773def8
99
  - **MLflow Experiment**: RT-DETRv2_Voucher_Classification
100
 
101
 
 
74
 
75
  **Final Evaluation Results:**
76
 
77
+
78
+ **Overall Detection Performance:**
79
+ - **mAP**: 0.0000
80
+ - **mAP@50**: 0.0000
81
+ - **mAP@75**: 0.0000
82
+
83
+ **Per-Class Average Precision:**
84
+ - **Digital invoices**: 0.0000 (needs improvement)
85
+ - **Fisico receipts**: 0.0000 (needs improvement)
86
+ - **Tesoreria receipts**: 0.0000 (needs improvement)
87
+
88
+ **Model Confidence:**
89
+ - **Digital invoices mean confidence**: 0.7041 (moderate)
90
+ - **Fisico receipts mean confidence**: 0.5998 (low)
91
+ - **Tesoreria receipts mean confidence**: 0.5715 (low)
92
+
93
+ **Performance by Object Size:**
94
+ - **Small objects**: 0.0000
95
+ - **Medium objects**: -1.0000 (not evaluated; -1 is the metric's sentinel when no ground-truth objects fall in this size range)
96
+ - **Large objects**: 0.0000
97
+
98
+ **Evaluation Dataset:**
99
+ - **Digital invoices**: 157 samples (28.5%)
100
+ - **Fisico receipts**: 261 samples (47.4%)
101
+ - **Tesoreria receipts**: 133 samples (24.1%)
102
+ - **Total evaluation samples**: 551
103
+
104
  **Model Configuration:**
105
  - **Base model**: PekingU/rtdetr_v2_r101vd
106
  - **Architecture**: rtdetr_v2_r101vd
 
117
  **Training Time**: 0.6 minutes
118
 
119
  **Training Summary:**
120
+ - **Final training loss**: 1361.6241
121
+ - **Final learning rate**: 1.43e-07
122
 
123
 
124
  ### MLflow Tracking
125
 
126
+ - **MLflow Run ID**: 0bf1954e36da45088455964384408885
127
  - **MLflow Experiment**: RT-DETRv2_Voucher_Classification
128
 
129
 
checkpoint-11/config.json ADDED
@@ -0,0 +1,129 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "activation_dropout": 0.0,
3
+ "activation_function": "silu",
4
+ "anchor_image_size": null,
5
+ "architectures": [
6
+ "RTDetrV2ForObjectDetection"
7
+ ],
8
+ "attention_dropout": 0.0,
9
+ "auxiliary_loss": true,
10
+ "backbone": null,
11
+ "backbone_config": {
12
+ "depths": [
13
+ 3,
14
+ 4,
15
+ 23,
16
+ 3
17
+ ],
18
+ "downsample_in_bottleneck": false,
19
+ "downsample_in_first_stage": false,
20
+ "embedding_size": 64,
21
+ "hidden_act": "relu",
22
+ "hidden_sizes": [
23
+ 256,
24
+ 512,
25
+ 1024,
26
+ 2048
27
+ ],
28
+ "layer_type": "bottleneck",
29
+ "model_type": "rt_detr_resnet",
30
+ "num_channels": 3,
31
+ "out_features": [
32
+ "stage2",
33
+ "stage3",
34
+ "stage4"
35
+ ],
36
+ "out_indices": [
37
+ 2,
38
+ 3,
39
+ 4
40
+ ],
41
+ "stage_names": [
42
+ "stem",
43
+ "stage1",
44
+ "stage2",
45
+ "stage3",
46
+ "stage4"
47
+ ],
48
+ "torch_dtype": "float32"
49
+ },
50
+ "backbone_kwargs": null,
51
+ "batch_norm_eps": 1e-05,
52
+ "box_noise_scale": 1.0,
53
+ "d_model": 256,
54
+ "decoder_activation_function": "relu",
55
+ "decoder_attention_heads": 8,
56
+ "decoder_ffn_dim": 1024,
57
+ "decoder_in_channels": [
58
+ 384,
59
+ 384,
60
+ 384
61
+ ],
62
+ "decoder_layers": 6,
63
+ "decoder_method": "default",
64
+ "decoder_n_levels": 3,
65
+ "decoder_n_points": 4,
66
+ "decoder_offset_scale": 0.5,
67
+ "disable_custom_kernels": true,
68
+ "dropout": 0.0,
69
+ "encode_proj_layers": [
70
+ 2
71
+ ],
72
+ "encoder_activation_function": "gelu",
73
+ "encoder_attention_heads": 8,
74
+ "encoder_ffn_dim": 2048,
75
+ "encoder_hidden_dim": 384,
76
+ "encoder_in_channels": [
77
+ 512,
78
+ 1024,
79
+ 2048
80
+ ],
81
+ "encoder_layers": 1,
82
+ "eos_coefficient": 0.0001,
83
+ "eval_size": null,
84
+ "feat_strides": [
85
+ 8,
86
+ 16,
87
+ 32
88
+ ],
89
+ "focal_loss_alpha": 0.75,
90
+ "focal_loss_gamma": 2.0,
91
+ "freeze_backbone_batch_norms": true,
92
+ "hidden_expansion": 1.0,
93
+ "id2label": {
94
+ "0": "LABEL_0",
95
+ "1": "LABEL_1",
96
+ "2": "LABEL_2"
97
+ },
98
+ "initializer_bias_prior_prob": null,
99
+ "initializer_range": 0.01,
100
+ "is_encoder_decoder": true,
101
+ "label2id": {
102
+ "LABEL_0": 0,
103
+ "LABEL_1": 1,
104
+ "LABEL_2": 2
105
+ },
106
+ "label_noise_ratio": 0.5,
107
+ "layer_norm_eps": 1e-05,
108
+ "learn_initial_query": false,
109
+ "matcher_alpha": 0.25,
110
+ "matcher_bbox_cost": 5.0,
111
+ "matcher_class_cost": 2.0,
112
+ "matcher_gamma": 2.0,
113
+ "matcher_giou_cost": 2.0,
114
+ "model_type": "rt_detr_v2",
115
+ "normalize_before": false,
116
+ "num_denoising": 100,
117
+ "num_feature_levels": 3,
118
+ "num_queries": 300,
119
+ "positional_encoding_temperature": 10000,
120
+ "torch_dtype": "float32",
121
+ "transformers_version": "4.55.0",
122
+ "use_focal_loss": true,
123
+ "use_pretrained_backbone": false,
124
+ "use_timm_backbone": false,
125
+ "weight_loss_bbox": 5.0,
126
+ "weight_loss_giou": 2.0,
127
+ "weight_loss_vfl": 1.0,
128
+ "with_box_refine": true
129
+ }
checkpoint-11/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0e3e068bda225fc31bb49ed7183a789b37bd93976d6a96831e17aa015749abd1
3
+ size 306699044
checkpoint-11/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:87dabdb27f4f90cb9270ced17931fcd21fa54ed6e3e1e9639cdf5c810f120e43
3
+ size 611580433
checkpoint-11/preprocessor_config.json ADDED
@@ -0,0 +1,26 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "do_convert_annotations": true,
3
+ "do_normalize": false,
4
+ "do_pad": false,
5
+ "do_rescale": true,
6
+ "do_resize": true,
7
+ "format": "coco_detection",
8
+ "image_mean": [
9
+ 0.485,
10
+ 0.456,
11
+ 0.406
12
+ ],
13
+ "image_processor_type": "RTDetrImageProcessor",
14
+ "image_std": [
15
+ 0.229,
16
+ 0.224,
17
+ 0.225
18
+ ],
19
+ "pad_size": null,
20
+ "resample": 2,
21
+ "rescale_factor": 0.00392156862745098,
22
+ "size": {
23
+ "height": 640,
24
+ "width": 640
25
+ }
26
+ }
checkpoint-11/rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:485c3e554af1b9085b3c02357f2e127e19bd275a84ebb30b1fb13fd4d5d20bb3
3
+ size 14244
checkpoint-11/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:99e8799425df17af4b2976f77dd0c9b3661c7dfc83e78d7f432f2f7e04f3e76a
3
+ size 1064
checkpoint-11/trainer_state.json ADDED
@@ -0,0 +1,48 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_global_step": null,
3
+ "best_metric": null,
4
+ "best_model_checkpoint": null,
5
+ "epoch": 1.0,
6
+ "eval_steps": 500,
7
+ "global_step": 11,
8
+ "is_hyper_param_search": false,
9
+ "is_local_process_zero": true,
10
+ "is_world_process_zero": true,
11
+ "log_history": [
12
+ {
13
+ "epoch": 0.47619047619047616,
14
+ "grad_norm": 5716.10205078125,
15
+ "learning_rate": 3.0000000000000004e-08,
16
+ "loss": 1383.1007,
17
+ "step": 5
18
+ },
19
+ {
20
+ "epoch": 0.9523809523809523,
21
+ "grad_norm": 12343.9111328125,
22
+ "learning_rate": 6.75e-08,
23
+ "loss": 1349.0135,
24
+ "step": 10
25
+ }
26
+ ],
27
+ "logging_steps": 5,
28
+ "max_steps": 22,
29
+ "num_input_tokens_seen": 0,
30
+ "num_train_epochs": 2,
31
+ "save_steps": 500,
32
+ "stateful_callbacks": {
33
+ "TrainerControl": {
34
+ "args": {
35
+ "should_epoch_stop": false,
36
+ "should_evaluate": false,
37
+ "should_log": false,
38
+ "should_save": true,
39
+ "should_training_stop": false
40
+ },
41
+ "attributes": {}
42
+ }
43
+ },
44
+ "total_flos": 2.816299339776e+17,
45
+ "train_batch_size": 24,
46
+ "trial_name": null,
47
+ "trial_params": null
48
+ }
checkpoint-11/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c1180767f5de13a6a025f0c99a50dc82acaeafd2f978f6044f91019e1561dc92
3
+ size 5368
checkpoint-22/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:41bcea9c8faca4547536af694dd5ad4a304153763de5c5d40387fb9d71bedb70
3
  size 306699044
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:88ca34ef98d20cb695317e3577b14ccd8027ea4cfe525424549bd643cd07258d
3
  size 306699044
checkpoint-22/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:443919119e128db40e45a79d6a18a299f9ef64236143bc3b0a00dc2b02f890c4
3
  size 611580433
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:53bdea1aaa6c5b3169bdf07cc3b8a586e5a2917de523de9504f1bf309d1e6fef
3
  size 611580433
checkpoint-22/trainer_state.json CHANGED
@@ -3,17 +3,46 @@
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
  "epoch": 2.0,
6
- "eval_steps": 100,
7
  "global_step": 22,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
11
- "log_history": [],
12
- "logging_steps": 50,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
13
  "max_steps": 22,
14
  "num_input_tokens_seen": 0,
15
  "num_train_epochs": 2,
16
- "save_steps": 200,
17
  "stateful_callbacks": {
18
  "TrainerControl": {
19
  "args": {
 
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
  "epoch": 2.0,
6
+ "eval_steps": 500,
7
  "global_step": 22,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
11
+ "log_history": [
12
+ {
13
+ "epoch": 0.47619047619047616,
14
+ "grad_norm": 5716.10205078125,
15
+ "learning_rate": 3.0000000000000004e-08,
16
+ "loss": 1383.1007,
17
+ "step": 5
18
+ },
19
+ {
20
+ "epoch": 0.9523809523809523,
21
+ "grad_norm": 12343.9111328125,
22
+ "learning_rate": 6.75e-08,
23
+ "loss": 1349.0135,
24
+ "step": 10
25
+ },
26
+ {
27
+ "epoch": 1.380952380952381,
28
+ "grad_norm": 10210.48046875,
29
+ "learning_rate": 1.05e-07,
30
+ "loss": 1340.3351,
31
+ "step": 15
32
+ },
33
+ {
34
+ "epoch": 1.8571428571428572,
35
+ "grad_norm": 7633.39599609375,
36
+ "learning_rate": 1.425e-07,
37
+ "loss": 1369.3844,
38
+ "step": 20
39
+ }
40
+ ],
41
+ "logging_steps": 5,
42
  "max_steps": 22,
43
  "num_input_tokens_seen": 0,
44
  "num_train_epochs": 2,
45
+ "save_steps": 500,
46
  "stateful_callbacks": {
47
  "TrainerControl": {
48
  "args": {
checkpoint-22/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ee47b52e482bd2dc4e70d1d92d8db4b33fc8cc8bb349a91709c9f357b574e2d1
3
  size 5368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c1180767f5de13a6a025f0c99a50dc82acaeafd2f978f6044f91019e1561dc92
3
  size 5368
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:41bcea9c8faca4547536af694dd5ad4a304153763de5c5d40387fb9d71bedb70
3
  size 306699044
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:88ca34ef98d20cb695317e3577b14ccd8027ea4cfe525424549bd643cd07258d
3
  size 306699044
runs/Aug14_00-31-34_9db0f8c974d2/events.out.tfevents.1755131495.9db0f8c974d2.97819.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9da04950d3bca5c43a7a018693a7d06aa8974c8ef4f8712c9e9a73ffe62f1669
3
+ size 8224
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ee47b52e482bd2dc4e70d1d92d8db4b33fc8cc8bb349a91709c9f357b574e2d1
3
  size 5368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c1180767f5de13a6a025f0c99a50dc82acaeafd2f978f6044f91019e1561dc92
3
  size 5368