prithivMLmods commited on
Commit
5c5ce01
·
verified ·
1 Parent(s): a3c5e18

Upload folder using huggingface_hub

Browse files
checkpoint-1012/config.json ADDED
@@ -0,0 +1,100 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "SiglipForImageClassification"
4
+ ],
5
+ "id2label": {
6
+ "0": "\u090b",
7
+ "1": "\u0915",
8
+ "2": "\u0916",
9
+ "3": "\u0917",
10
+ "4": "\u0918",
11
+ "5": "\u0919",
12
+ "6": "\u091a",
13
+ "7": "\u091b",
14
+ "8": "\u091c",
15
+ "9": "\u091d",
16
+ "10": "\u091f",
17
+ "11": "\u0920",
18
+ "12": "\u0922",
19
+ "13": "\u0923",
20
+ "14": "\u0924",
21
+ "15": "\u0925",
22
+ "16": "\u0926",
23
+ "17": "\u0928",
24
+ "18": "\u092a",
25
+ "19": "\u092b",
26
+ "20": "\u092c",
27
+ "21": "\u092d",
28
+ "22": "\u092e",
29
+ "23": "\u092f",
30
+ "24": "\u0930",
31
+ "25": "\u0932",
32
+ "26": "\u0935",
33
+ "27": "\u0938",
34
+ "28": "\u0939"
35
+ },
36
+ "initializer_factor": 1.0,
37
+ "label2id": {
38
+ "\u090b": 0,
39
+ "\u0915": 1,
40
+ "\u0916": 2,
41
+ "\u0917": 3,
42
+ "\u0918": 4,
43
+ "\u0919": 5,
44
+ "\u091a": 6,
45
+ "\u091b": 7,
46
+ "\u091c": 8,
47
+ "\u091d": 9,
48
+ "\u091f": 10,
49
+ "\u0920": 11,
50
+ "\u0922": 12,
51
+ "\u0923": 13,
52
+ "\u0924": 14,
53
+ "\u0925": 15,
54
+ "\u0926": 16,
55
+ "\u0928": 17,
56
+ "\u092a": 18,
57
+ "\u092b": 19,
58
+ "\u092c": 20,
59
+ "\u092d": 21,
60
+ "\u092e": 22,
61
+ "\u092f": 23,
62
+ "\u0930": 24,
63
+ "\u0932": 25,
64
+ "\u0935": 26,
65
+ "\u0938": 27,
66
+ "\u0939": 28
67
+ },
68
+ "model_type": "siglip",
69
+ "problem_type": "single_label_classification",
70
+ "text_config": {
71
+ "attention_dropout": 0.0,
72
+ "hidden_act": "gelu_pytorch_tanh",
73
+ "hidden_size": 768,
74
+ "intermediate_size": 3072,
75
+ "layer_norm_eps": 1e-06,
76
+ "max_position_embeddings": 64,
77
+ "model_type": "siglip_text_model",
78
+ "num_attention_heads": 12,
79
+ "num_hidden_layers": 12,
80
+ "projection_size": 768,
81
+ "torch_dtype": "float32",
82
+ "vocab_size": 256000
83
+ },
84
+ "torch_dtype": "float32",
85
+ "transformers_version": "4.50.0",
86
+ "vision_config": {
87
+ "attention_dropout": 0.0,
88
+ "hidden_act": "gelu_pytorch_tanh",
89
+ "hidden_size": 768,
90
+ "image_size": 224,
91
+ "intermediate_size": 3072,
92
+ "layer_norm_eps": 1e-06,
93
+ "model_type": "siglip_vision_model",
94
+ "num_attention_heads": 12,
95
+ "num_channels": 3,
96
+ "num_hidden_layers": 12,
97
+ "patch_size": 16,
98
+ "torch_dtype": "float32"
99
+ }
100
+ }
checkpoint-1012/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4eeed8acb82365002266bf98361ceebe19f9b74d7c885c5c8854bb58082b85b5
3
+ size 371651052
checkpoint-1012/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6ab5ec3029daa57091d26102843cc6f8836441fb1ec8c16e2d2fddf7a9962410
3
+ size 686721786
checkpoint-1012/preprocessor_config.json ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "do_convert_rgb": null,
3
+ "do_normalize": true,
4
+ "do_rescale": true,
5
+ "do_resize": true,
6
+ "image_mean": [
7
+ 0.5,
8
+ 0.5,
9
+ 0.5
10
+ ],
11
+ "image_processor_type": "SiglipImageProcessor",
12
+ "image_std": [
13
+ 0.5,
14
+ 0.5,
15
+ 0.5
16
+ ],
17
+ "processor_class": "SiglipProcessor",
18
+ "resample": 2,
19
+ "rescale_factor": 0.00392156862745098,
20
+ "size": {
21
+ "height": 224,
22
+ "width": 224
23
+ }
24
+ }
checkpoint-1012/rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:60dcddd0310ead2325fb47c425ece444a249bce9a834f715a65aba50af7e4e65
3
+ size 14244
checkpoint-1012/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f6a3d4b07dce2a397d81d3bb6d2ef9dfe1be3b5c8b1421b9e8b8a06fb1bda866
3
+ size 1064
checkpoint-1012/trainer_state.json ADDED
@@ -0,0 +1,68 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_global_step": 1012,
3
+ "best_metric": 0.18154847621917725,
4
+ "best_model_checkpoint": "siglip2-finetune-full/checkpoint-1012",
5
+ "epoch": 2.0,
6
+ "eval_steps": 500,
7
+ "global_step": 1012,
8
+ "is_hyper_param_search": false,
9
+ "is_local_process_zero": true,
10
+ "is_world_process_zero": true,
11
+ "log_history": [
12
+ {
13
+ "epoch": 0.9881422924901185,
14
+ "grad_norm": 7.464842796325684,
15
+ "learning_rate": 0.0002661122661122661,
16
+ "loss": 1.5544,
17
+ "step": 500
18
+ },
19
+ {
20
+ "epoch": 1.0,
21
+ "eval_accuracy": 0.6886938245657415,
22
+ "eval_loss": 0.9519435167312622,
23
+ "eval_model_preparation_time": 0.0026,
24
+ "eval_runtime": 216.1541,
25
+ "eval_samples_per_second": 74.84,
26
+ "eval_steps_per_second": 9.359,
27
+ "step": 506
28
+ },
29
+ {
30
+ "epoch": 1.9762845849802373,
31
+ "grad_norm": 4.09387731552124,
32
+ "learning_rate": 6.237006237006238e-06,
33
+ "loss": 0.3209,
34
+ "step": 1000
35
+ },
36
+ {
37
+ "epoch": 2.0,
38
+ "eval_accuracy": 0.942510972368177,
39
+ "eval_loss": 0.18154847621917725,
40
+ "eval_model_preparation_time": 0.0026,
41
+ "eval_runtime": 211.4297,
42
+ "eval_samples_per_second": 76.512,
43
+ "eval_steps_per_second": 9.568,
44
+ "step": 1012
45
+ }
46
+ ],
47
+ "logging_steps": 500,
48
+ "max_steps": 1012,
49
+ "num_input_tokens_seen": 0,
50
+ "num_train_epochs": 2,
51
+ "save_steps": 500,
52
+ "stateful_callbacks": {
53
+ "TrainerControl": {
54
+ "args": {
55
+ "should_epoch_stop": false,
56
+ "should_evaluate": false,
57
+ "should_log": false,
58
+ "should_save": true,
59
+ "should_training_stop": true
60
+ },
61
+ "attributes": {}
62
+ }
63
+ },
64
+ "total_flos": 2.7104320294495396e+18,
65
+ "train_batch_size": 32,
66
+ "trial_name": null,
67
+ "trial_params": null
68
+ }
checkpoint-1012/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:13c09778d5590b0474b689b82857e5d45343043143dcc53e05f5cce8ccfc8a9d
3
+ size 5304
checkpoint-506/config.json ADDED
@@ -0,0 +1,100 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "SiglipForImageClassification"
4
+ ],
5
+ "id2label": {
6
+ "0": "\u090b",
7
+ "1": "\u0915",
8
+ "2": "\u0916",
9
+ "3": "\u0917",
10
+ "4": "\u0918",
11
+ "5": "\u0919",
12
+ "6": "\u091a",
13
+ "7": "\u091b",
14
+ "8": "\u091c",
15
+ "9": "\u091d",
16
+ "10": "\u091f",
17
+ "11": "\u0920",
18
+ "12": "\u0922",
19
+ "13": "\u0923",
20
+ "14": "\u0924",
21
+ "15": "\u0925",
22
+ "16": "\u0926",
23
+ "17": "\u0928",
24
+ "18": "\u092a",
25
+ "19": "\u092b",
26
+ "20": "\u092c",
27
+ "21": "\u092d",
28
+ "22": "\u092e",
29
+ "23": "\u092f",
30
+ "24": "\u0930",
31
+ "25": "\u0932",
32
+ "26": "\u0935",
33
+ "27": "\u0938",
34
+ "28": "\u0939"
35
+ },
36
+ "initializer_factor": 1.0,
37
+ "label2id": {
38
+ "\u090b": 0,
39
+ "\u0915": 1,
40
+ "\u0916": 2,
41
+ "\u0917": 3,
42
+ "\u0918": 4,
43
+ "\u0919": 5,
44
+ "\u091a": 6,
45
+ "\u091b": 7,
46
+ "\u091c": 8,
47
+ "\u091d": 9,
48
+ "\u091f": 10,
49
+ "\u0920": 11,
50
+ "\u0922": 12,
51
+ "\u0923": 13,
52
+ "\u0924": 14,
53
+ "\u0925": 15,
54
+ "\u0926": 16,
55
+ "\u0928": 17,
56
+ "\u092a": 18,
57
+ "\u092b": 19,
58
+ "\u092c": 20,
59
+ "\u092d": 21,
60
+ "\u092e": 22,
61
+ "\u092f": 23,
62
+ "\u0930": 24,
63
+ "\u0932": 25,
64
+ "\u0935": 26,
65
+ "\u0938": 27,
66
+ "\u0939": 28
67
+ },
68
+ "model_type": "siglip",
69
+ "problem_type": "single_label_classification",
70
+ "text_config": {
71
+ "attention_dropout": 0.0,
72
+ "hidden_act": "gelu_pytorch_tanh",
73
+ "hidden_size": 768,
74
+ "intermediate_size": 3072,
75
+ "layer_norm_eps": 1e-06,
76
+ "max_position_embeddings": 64,
77
+ "model_type": "siglip_text_model",
78
+ "num_attention_heads": 12,
79
+ "num_hidden_layers": 12,
80
+ "projection_size": 768,
81
+ "torch_dtype": "float32",
82
+ "vocab_size": 256000
83
+ },
84
+ "torch_dtype": "float32",
85
+ "transformers_version": "4.50.0",
86
+ "vision_config": {
87
+ "attention_dropout": 0.0,
88
+ "hidden_act": "gelu_pytorch_tanh",
89
+ "hidden_size": 768,
90
+ "image_size": 224,
91
+ "intermediate_size": 3072,
92
+ "layer_norm_eps": 1e-06,
93
+ "model_type": "siglip_vision_model",
94
+ "num_attention_heads": 12,
95
+ "num_channels": 3,
96
+ "num_hidden_layers": 12,
97
+ "patch_size": 16,
98
+ "torch_dtype": "float32"
99
+ }
100
+ }
checkpoint-506/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fa903d122e259342a46c3ac081f8d19563114eb9bb7db7c5bfdb67d24a62bdd4
3
+ size 371651052
checkpoint-506/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3cb0a64e7796e9eb478c5cf7570b66552e509a93c10adbf0505432dda9765b3a
3
+ size 686721786
checkpoint-506/preprocessor_config.json ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "do_convert_rgb": null,
3
+ "do_normalize": true,
4
+ "do_rescale": true,
5
+ "do_resize": true,
6
+ "image_mean": [
7
+ 0.5,
8
+ 0.5,
9
+ 0.5
10
+ ],
11
+ "image_processor_type": "SiglipImageProcessor",
12
+ "image_std": [
13
+ 0.5,
14
+ 0.5,
15
+ 0.5
16
+ ],
17
+ "processor_class": "SiglipProcessor",
18
+ "resample": 2,
19
+ "rescale_factor": 0.00392156862745098,
20
+ "size": {
21
+ "height": 224,
22
+ "width": 224
23
+ }
24
+ }
checkpoint-506/rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3c7a3ff1649e401d94a91becbafa8d11f11d4e193fd044acf4e7235db5744c68
3
+ size 14244
checkpoint-506/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2314145c30e33e8a87c3dc43ed7c74c396737c2ecc3740d8dca1984b5a8e2ab6
3
+ size 1064
checkpoint-506/trainer_state.json ADDED
@@ -0,0 +1,51 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_global_step": 506,
3
+ "best_metric": 0.9519435167312622,
4
+ "best_model_checkpoint": "siglip2-finetune-full/checkpoint-506",
5
+ "epoch": 1.0,
6
+ "eval_steps": 500,
7
+ "global_step": 506,
8
+ "is_hyper_param_search": false,
9
+ "is_local_process_zero": true,
10
+ "is_world_process_zero": true,
11
+ "log_history": [
12
+ {
13
+ "epoch": 0.9881422924901185,
14
+ "grad_norm": 7.464842796325684,
15
+ "learning_rate": 0.0002661122661122661,
16
+ "loss": 1.5544,
17
+ "step": 500
18
+ },
19
+ {
20
+ "epoch": 1.0,
21
+ "eval_accuracy": 0.6886938245657415,
22
+ "eval_loss": 0.9519435167312622,
23
+ "eval_model_preparation_time": 0.0026,
24
+ "eval_runtime": 216.1541,
25
+ "eval_samples_per_second": 74.84,
26
+ "eval_steps_per_second": 9.359,
27
+ "step": 506
28
+ }
29
+ ],
30
+ "logging_steps": 500,
31
+ "max_steps": 1012,
32
+ "num_input_tokens_seen": 0,
33
+ "num_train_epochs": 2,
34
+ "save_steps": 500,
35
+ "stateful_callbacks": {
36
+ "TrainerControl": {
37
+ "args": {
38
+ "should_epoch_stop": false,
39
+ "should_evaluate": false,
40
+ "should_log": false,
41
+ "should_save": true,
42
+ "should_training_stop": false
43
+ },
44
+ "attributes": {}
45
+ }
46
+ },
47
+ "total_flos": 1.3552160147247698e+18,
48
+ "train_batch_size": 32,
49
+ "trial_name": null,
50
+ "trial_params": null
51
+ }
checkpoint-506/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:13c09778d5590b0474b689b82857e5d45343043143dcc53e05f5cce8ccfc8a9d
3
+ size 5304
config.json ADDED
@@ -0,0 +1,100 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "SiglipForImageClassification"
4
+ ],
5
+ "id2label": {
6
+ "0": "\u090b",
7
+ "1": "\u0915",
8
+ "2": "\u0916",
9
+ "3": "\u0917",
10
+ "4": "\u0918",
11
+ "5": "\u0919",
12
+ "6": "\u091a",
13
+ "7": "\u091b",
14
+ "8": "\u091c",
15
+ "9": "\u091d",
16
+ "10": "\u091f",
17
+ "11": "\u0920",
18
+ "12": "\u0922",
19
+ "13": "\u0923",
20
+ "14": "\u0924",
21
+ "15": "\u0925",
22
+ "16": "\u0926",
23
+ "17": "\u0928",
24
+ "18": "\u092a",
25
+ "19": "\u092b",
26
+ "20": "\u092c",
27
+ "21": "\u092d",
28
+ "22": "\u092e",
29
+ "23": "\u092f",
30
+ "24": "\u0930",
31
+ "25": "\u0932",
32
+ "26": "\u0935",
33
+ "27": "\u0938",
34
+ "28": "\u0939"
35
+ },
36
+ "initializer_factor": 1.0,
37
+ "label2id": {
38
+ "\u090b": 0,
39
+ "\u0915": 1,
40
+ "\u0916": 2,
41
+ "\u0917": 3,
42
+ "\u0918": 4,
43
+ "\u0919": 5,
44
+ "\u091a": 6,
45
+ "\u091b": 7,
46
+ "\u091c": 8,
47
+ "\u091d": 9,
48
+ "\u091f": 10,
49
+ "\u0920": 11,
50
+ "\u0922": 12,
51
+ "\u0923": 13,
52
+ "\u0924": 14,
53
+ "\u0925": 15,
54
+ "\u0926": 16,
55
+ "\u0928": 17,
56
+ "\u092a": 18,
57
+ "\u092b": 19,
58
+ "\u092c": 20,
59
+ "\u092d": 21,
60
+ "\u092e": 22,
61
+ "\u092f": 23,
62
+ "\u0930": 24,
63
+ "\u0932": 25,
64
+ "\u0935": 26,
65
+ "\u0938": 27,
66
+ "\u0939": 28
67
+ },
68
+ "model_type": "siglip",
69
+ "problem_type": "single_label_classification",
70
+ "text_config": {
71
+ "attention_dropout": 0.0,
72
+ "hidden_act": "gelu_pytorch_tanh",
73
+ "hidden_size": 768,
74
+ "intermediate_size": 3072,
75
+ "layer_norm_eps": 1e-06,
76
+ "max_position_embeddings": 64,
77
+ "model_type": "siglip_text_model",
78
+ "num_attention_heads": 12,
79
+ "num_hidden_layers": 12,
80
+ "projection_size": 768,
81
+ "torch_dtype": "float32",
82
+ "vocab_size": 256000
83
+ },
84
+ "torch_dtype": "float32",
85
+ "transformers_version": "4.50.0",
86
+ "vision_config": {
87
+ "attention_dropout": 0.0,
88
+ "hidden_act": "gelu_pytorch_tanh",
89
+ "hidden_size": 768,
90
+ "image_size": 224,
91
+ "intermediate_size": 3072,
92
+ "layer_norm_eps": 1e-06,
93
+ "model_type": "siglip_vision_model",
94
+ "num_attention_heads": 12,
95
+ "num_channels": 3,
96
+ "num_hidden_layers": 12,
97
+ "patch_size": 16,
98
+ "torch_dtype": "float32"
99
+ }
100
+ }
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4eeed8acb82365002266bf98361ceebe19f9b74d7c885c5c8854bb58082b85b5
3
+ size 371651052
preprocessor_config.json ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "do_convert_rgb": null,
3
+ "do_normalize": true,
4
+ "do_rescale": true,
5
+ "do_resize": true,
6
+ "image_mean": [
7
+ 0.5,
8
+ 0.5,
9
+ 0.5
10
+ ],
11
+ "image_processor_type": "SiglipImageProcessor",
12
+ "image_std": [
13
+ 0.5,
14
+ 0.5,
15
+ 0.5
16
+ ],
17
+ "processor_class": "SiglipProcessor",
18
+ "resample": 2,
19
+ "rescale_factor": 0.00392156862745098,
20
+ "size": {
21
+ "height": 224,
22
+ "width": 224
23
+ }
24
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:13c09778d5590b0474b689b82857e5d45343043143dcc53e05f5cce8ccfc8a9d
3
+ size 5304