karishmathakrar committed on
Commit
faa6ebc
·
verified ·
1 Parent(s): 3fd859b

Training in progress, epoch 0

Browse files
Files changed (25) hide show
  1. .gitattributes +1 -0
  2. adapter_config.json +40 -0
  3. adapter_model.safetensors +3 -0
  4. added_tokens.json +4 -0
  5. chat_template.json +3 -0
  6. preprocessor_config.json +29 -0
  7. processor_config.json +4 -0
  8. runs/Apr09_14-03-47_atl1-1-01-006-9-0.pace.gatech.edu/events.out.tfevents.1744222380.atl1-1-01-006-9-0.pace.gatech.edu.3411561.0 +3 -0
  9. runs/Apr09_14-59-17_atl1-1-01-006-9-0.pace.gatech.edu/events.out.tfevents.1744225163.atl1-1-01-006-9-0.pace.gatech.edu.3411561.1 +3 -0
  10. runs/Apr09_15-18-23_atl1-1-01-006-9-0.pace.gatech.edu/events.out.tfevents.1744226306.atl1-1-01-006-9-0.pace.gatech.edu.3411561.2 +3 -0
  11. runs/Apr09_15-21-21_atl1-1-01-006-9-0.pace.gatech.edu/events.out.tfevents.1744226484.atl1-1-01-006-9-0.pace.gatech.edu.3411561.3 +3 -0
  12. runs/Apr09_15-23-48_atl1-1-01-006-9-0.pace.gatech.edu/events.out.tfevents.1744226630.atl1-1-01-006-9-0.pace.gatech.edu.3411561.4 +3 -0
  13. runs/Apr09_15-23-48_atl1-1-01-006-9-0.pace.gatech.edu/events.out.tfevents.1744227057.atl1-1-01-006-9-0.pace.gatech.edu.3411561.5 +3 -0
  14. runs/Apr09_15-23-48_atl1-1-01-006-9-0.pace.gatech.edu/events.out.tfevents.1744227155.atl1-1-01-006-9-0.pace.gatech.edu.3411561.6 +3 -0
  15. runs/Apr09_15-23-48_atl1-1-01-006-9-0.pace.gatech.edu/events.out.tfevents.1744227298.atl1-1-01-006-9-0.pace.gatech.edu.3411561.7 +3 -0
  16. runs/Apr09_16-37-05_atl1-1-01-006-9-0.pace.gatech.edu/events.out.tfevents.1744231027.atl1-1-01-006-9-0.pace.gatech.edu.3640142.0 +3 -0
  17. runs/Apr09_16-39-06_atl1-1-01-006-9-0.pace.gatech.edu/events.out.tfevents.1744231148.atl1-1-01-006-9-0.pace.gatech.edu.3640142.1 +3 -0
  18. runs/Apr09_18-08-18_atl1-1-01-006-9-0.pace.gatech.edu/events.out.tfevents.1744236505.atl1-1-01-006-9-0.pace.gatech.edu.3640142.2 +3 -0
  19. runs/Apr09_18-12-59_atl1-1-01-006-9-0.pace.gatech.edu/events.out.tfevents.1744236781.atl1-1-01-006-9-0.pace.gatech.edu.3640142.3 +3 -0
  20. runs/Apr09_18-16-24_atl1-1-01-006-9-0.pace.gatech.edu/events.out.tfevents.1744236987.atl1-1-01-006-9-0.pace.gatech.edu.3640142.4 +3 -0
  21. special_tokens_map.json +42 -0
  22. tokenizer.json +3 -0
  23. tokenizer.model +3 -0
  24. tokenizer_config.json +0 -0
  25. training_args.bin +3 -0
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
adapter_config.json ADDED
@@ -0,0 +1,40 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "alpha_pattern": {},
3
+ "auto_mapping": null,
4
+ "base_model_name_or_path": "google/gemma-3-4b-pt",
5
+ "bias": "none",
6
+ "eva_config": null,
7
+ "exclude_modules": null,
8
+ "fan_in_fan_out": false,
9
+ "inference_mode": true,
10
+ "init_lora_weights": true,
11
+ "layer_replication": null,
12
+ "layers_pattern": null,
13
+ "layers_to_transform": null,
14
+ "loftq_config": {},
15
+ "lora_alpha": 16,
16
+ "lora_bias": false,
17
+ "lora_dropout": 0.05,
18
+ "megatron_config": null,
19
+ "megatron_core": "megatron.core",
20
+ "modules_to_save": [
21
+ "lm_head",
22
+ "embed_tokens"
23
+ ],
24
+ "peft_type": "LORA",
25
+ "r": 16,
26
+ "rank_pattern": {},
27
+ "revision": null,
28
+ "target_modules": [
29
+ "v_proj",
30
+ "down_proj",
31
+ "gate_proj",
32
+ "q_proj",
33
+ "up_proj",
34
+ "o_proj",
35
+ "k_proj"
36
+ ],
37
+ "task_type": "CAUSAL_LM",
38
+ "use_dora": false,
39
+ "use_rslora": false
40
+ }
adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:612968e0d42aac2159e1bce89f8fb4dc9b4392304c973a2b6e4abd797ac49616
3
+ size 2839420184
added_tokens.json ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ {
2
+ "<image>": 262145,
3
+ "<image_soft_token>": 262144
4
+ }
chat_template.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ {
2
+ "chat_template": "{% for message in messages %}\n{% if message['role'] == 'user' %}\n<start_of_turn>user\n{% for content in message['content'] %}\n{% if content['type'] == 'text' %}{{ content['text'] }}{% elif content['type'] == 'image' %}<image>{% endif %}\n{% endfor %}\n<end_of_turn>\n{% elif message['role'] == 'assistant' %}\n<start_of_turn>model\n{% for content in message['content'] %}\n{% if content['type'] == 'text' %}{{ content['text'] }}{% endif %}\n{% endfor %}\n<end_of_turn>\n{% elif message['role'] == 'system' %}\n<start_of_turn>system\n{% for content in message['content'] %}\n{% if content['type'] == 'text' %}{{ content['text'] }}{% endif %}\n{% endfor %}\n<end_of_turn>\n{% endif %}\n{% endfor %}\n{% if add_generation_prompt %}\n<start_of_turn>model\n{% endif %}\n"
3
+ }
preprocessor_config.json ADDED
@@ -0,0 +1,29 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "do_convert_rgb": null,
3
+ "do_normalize": true,
4
+ "do_pan_and_scan": null,
5
+ "do_rescale": true,
6
+ "do_resize": true,
7
+ "image_mean": [
8
+ 0.5,
9
+ 0.5,
10
+ 0.5
11
+ ],
12
+ "image_processor_type": "Gemma3ImageProcessor",
13
+ "image_seq_length": 256,
14
+ "image_std": [
15
+ 0.5,
16
+ 0.5,
17
+ 0.5
18
+ ],
19
+ "pan_and_scan_max_num_crops": null,
20
+ "pan_and_scan_min_crop_size": null,
21
+ "pan_and_scan_min_ratio_to_activate": null,
22
+ "processor_class": "Gemma3Processor",
23
+ "resample": 2,
24
+ "rescale_factor": 0.00392156862745098,
25
+ "size": {
26
+ "height": 896,
27
+ "width": 896
28
+ }
29
+ }
processor_config.json ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ {
2
+ "image_seq_length": 256,
3
+ "processor_class": "Gemma3Processor"
4
+ }
runs/Apr09_14-03-47_atl1-1-01-006-9-0.pace.gatech.edu/events.out.tfevents.1744222380.atl1-1-01-006-9-0.pace.gatech.edu.3411561.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b099712647cc75a26184279946b4a99b8b6f21fb576555e14e81930f9491fce2
3
+ size 6908
runs/Apr09_14-59-17_atl1-1-01-006-9-0.pace.gatech.edu/events.out.tfevents.1744225163.atl1-1-01-006-9-0.pace.gatech.edu.3411561.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:633c018a99115060533f7bc55021e56e7f3b435653ffd461a130c1dcdafc7915
3
+ size 6908
runs/Apr09_15-18-23_atl1-1-01-006-9-0.pace.gatech.edu/events.out.tfevents.1744226306.atl1-1-01-006-9-0.pace.gatech.edu.3411561.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:11170f24101004fd93086faa9511e22e15bca46855509ddd9c7a6bc035b0bcd0
3
+ size 6908
runs/Apr09_15-21-21_atl1-1-01-006-9-0.pace.gatech.edu/events.out.tfevents.1744226484.atl1-1-01-006-9-0.pace.gatech.edu.3411561.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:580915628e96aaf1e94a433bb95e7b02d0a689c79b856fc19315d16f087a51b0
3
+ size 6908
runs/Apr09_15-23-48_atl1-1-01-006-9-0.pace.gatech.edu/events.out.tfevents.1744226630.atl1-1-01-006-9-0.pace.gatech.edu.3411561.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:32c2b228d5719e36e87854a52a79701c520c611c18870db32249130f7445d291
3
+ size 6908
runs/Apr09_15-23-48_atl1-1-01-006-9-0.pace.gatech.edu/events.out.tfevents.1744227057.atl1-1-01-006-9-0.pace.gatech.edu.3411561.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e3409f76e31b3e20c15e1d92cf56cfd5b7d53bdc0c0f73158004d12e9433ae0
3
+ size 6908
runs/Apr09_15-23-48_atl1-1-01-006-9-0.pace.gatech.edu/events.out.tfevents.1744227155.atl1-1-01-006-9-0.pace.gatech.edu.3411561.6 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:70ab64a3a1e3e540cffa2eef82890f181536e2e6b2be29f7e0be3d09d36b3302
3
+ size 6908
runs/Apr09_15-23-48_atl1-1-01-006-9-0.pace.gatech.edu/events.out.tfevents.1744227298.atl1-1-01-006-9-0.pace.gatech.edu.3411561.7 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d5f4b5e8a6610df6045ace190e9b19443e70ebf1d93897ca4089918736103337
3
+ size 6908
runs/Apr09_16-37-05_atl1-1-01-006-9-0.pace.gatech.edu/events.out.tfevents.1744231027.atl1-1-01-006-9-0.pace.gatech.edu.3640142.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:88634e11039f4fe21cd4087e451114d655e47a44979631f30d7f205f514789dc
3
+ size 6908
runs/Apr09_16-39-06_atl1-1-01-006-9-0.pace.gatech.edu/events.out.tfevents.1744231148.atl1-1-01-006-9-0.pace.gatech.edu.3640142.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:62bdceff5ed5ee340b460a6cd6a0549a8329d867c2d2e407906215b055f60ebb
3
+ size 6900
runs/Apr09_18-08-18_atl1-1-01-006-9-0.pace.gatech.edu/events.out.tfevents.1744236505.atl1-1-01-006-9-0.pace.gatech.edu.3640142.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a6e858019433f02f6d25272f11b6cc28518e1c51fd13203ab5a5bf2b6c8767e
3
+ size 6900
runs/Apr09_18-12-59_atl1-1-01-006-9-0.pace.gatech.edu/events.out.tfevents.1744236781.atl1-1-01-006-9-0.pace.gatech.edu.3640142.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:66baf705657e52d2ce8fd841d7446eb9fecfa006836752768dfd8735a2c5603b
3
+ size 6900
runs/Apr09_18-16-24_atl1-1-01-006-9-0.pace.gatech.edu/events.out.tfevents.1744236987.atl1-1-01-006-9-0.pace.gatech.edu.3640142.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8e79fc0c42a1845bd955b331966e1bec594472dde0b3b8592a038d466201725b
3
+ size 7311
special_tokens_map.json ADDED
@@ -0,0 +1,42 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": [
3
+ {
4
+ "content": "<image>",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false
9
+ }
10
+ ],
11
+ "boi_token": "<start_of_image>",
12
+ "bos_token": {
13
+ "content": "<bos>",
14
+ "lstrip": false,
15
+ "normalized": false,
16
+ "rstrip": false,
17
+ "single_word": false
18
+ },
19
+ "eoi_token": "<end_of_image>",
20
+ "eos_token": {
21
+ "content": "<eos>",
22
+ "lstrip": false,
23
+ "normalized": false,
24
+ "rstrip": false,
25
+ "single_word": false
26
+ },
27
+ "image_token": "<image_soft_token>",
28
+ "pad_token": {
29
+ "content": "<pad>",
30
+ "lstrip": false,
31
+ "normalized": false,
32
+ "rstrip": false,
33
+ "single_word": false
34
+ },
35
+ "unk_token": {
36
+ "content": "<unk>",
37
+ "lstrip": false,
38
+ "normalized": false,
39
+ "rstrip": false,
40
+ "single_word": false
41
+ }
42
+ }
tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6eea405950660db056020376b7bb728da9f4549eb5bfd6496bba40dde75e5658
3
+ size 33384906
tokenizer.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1299c11d7cf632ef3b4e11937501358ada021bbdf7c47638d13c0ee982f2e79c
3
+ size 4689074
tokenizer_config.json ADDED
The diff for this file is too large to render. See raw diff
 
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d7cf9d1354764366452d0eef6d7b42d1b9bc3d377bd622b7a20ed6758f6d6fa3
3
+ size 5688