ovokpus/llama381binstruct_summarize_short

Files changed (7) hide show

README.md CHANGED Viewed

@@ -27,17 +27,17 @@ print(output["generated_text"])
 ## Training procedure
-[<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="150" height="24"/>](https://wandb.ai/ovokpus/huggingface/runs/7gmrjvtn)
 This model was trained with SFT.
 ### Framework versions
-- TRL: 0.17.0
-- Transformers: 4.51.3
 - Pytorch: 2.6.0+cu124
-- Datasets: 3.5.1
 - Tokenizers: 0.21.1
 ## Citations

 ## Training procedure
+[<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="150" height="24"/>](https://wandb.ai/ovokpus/huggingface/runs/tyv79v8k)
 This model was trained with SFT.
 ### Framework versions
+- TRL: 0.19.0
+- Transformers: 4.52.4
 - Pytorch: 2.6.0+cu124
+- Datasets: 3.6.0
 - Tokenizers: 0.21.1
 ## Citations

adapter_config.json CHANGED Viewed

@@ -24,13 +24,13 @@
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
     "v_proj",
-    "q_proj",
     "down_proj",
-    "o_proj",
-    "k_proj",
     "up_proj",
-    "gate_proj"
   ],
   "task_type": "CAUSAL_LM",
   "trainable_token_indices": null,

   "rank_pattern": {},
   "revision": null,
   "target_modules": [
+    "k_proj",
+    "o_proj",
     "v_proj",
     "down_proj",
+    "gate_proj",
     "up_proj",
+    "q_proj"
   ],
   "task_type": "CAUSAL_LM",
   "trainable_token_indices": null,

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3a1377efb4df2db6d4d05f944743f22490e070ac830c10715f16ff995b2703b4
 size 167832240

 version https://git-lfs.github.com/spec/v1
+oid sha256:20929019d4dced5c6fc250098271eb49d546860ba0a2a66dd5007f73f5c2baa3
 size 167832240

chat_template.jinja ADDED Viewed

+{% set loop_messages = messages %}{% for message in loop_messages %}{% set content = '<|start_header_id|>' + message['role'] + '<|end_header_id|>
+'+ message['content'] | trim + '<|eot_id|>' %}{% if loop.index0 == 0 %}{% set content = bos_token + content %}{% endif %}{{ content }}{% endfor %}{{ '<|start_header_id|>assistant<|end_header_id|>
+' }}

runs/Jun23_19-24-34_9d64d03a1a51/events.out.tfevents.1750706706.9d64d03a1a51.2883.0 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:0ccbf062fc10a52c0fb273d59084cc32c3d489cacb30e1cf1145e4294de15ba1
+size 30742

tokenizer_config.json CHANGED Viewed

@@ -2050,7 +2050,6 @@
     }
   },
   "bos_token": "<|begin_of_text|>",
-  "chat_template": "{% set loop_messages = messages %}{% for message in loop_messages %}{% set content = '<|start_header_id|>' + message['role'] + '<|end_header_id|>\n\n'+ message['content'] | trim + '<|eot_id|>' %}{% if loop.index0 == 0 %}{% set content = bos_token + content %}{% endif %}{{ content }}{% endfor %}{{ '<|start_header_id|>assistant<|end_header_id|>\n\n' }}",
   "clean_up_tokenization_spaces": true,
   "eos_token": "<|eot_id|>",
   "extra_special_tokens": {},

     }
   },
   "bos_token": "<|begin_of_text|>",
   "clean_up_tokenization_spaces": true,
   "eos_token": "<|eot_id|>",
   "extra_special_tokens": {},

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:91a52bcd40464001ad545f1b8ee1f5b0363fd438c9a891e43be975fd56012dfa
 size 5752

 version https://git-lfs.github.com/spec/v1
+oid sha256:408cde1a98115358f3d90ea98262cfa7e7dc5ee2b91236d7b980314b777f0176
 size 5752