Training in progress, step 500

Files changed (4) hide show

adapter_config.json CHANGED Viewed

@@ -3,6 +3,9 @@
   "auto_mapping": null,
   "base_model_name_or_path": "unsloth/SmolLM-135M",
   "bias": "none",
   "fan_in_fan_out": false,
   "inference_mode": true,
   "init_lora_weights": true,
@@ -11,26 +14,27 @@
   "layers_to_transform": null,
   "loftq_config": {},
   "lora_alpha": 256,
   "lora_dropout": 0.1,
   "megatron_config": null,
   "megatron_core": "megatron.core",
-  "modules_to_save": [
-    "lm_head"
-  ],
   "peft_type": "LORA",
   "r": 128,
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
-    "v_proj",
-    "up_proj",
     "gate_proj",
-    "k_proj",
     "q_proj",
     "o_proj",
-    "down_proj"
   ],
   "task_type": "CAUSAL_LM",
   "use_dora": false,
   "use_rslora": false
 }

   "auto_mapping": null,
   "base_model_name_or_path": "unsloth/SmolLM-135M",
   "bias": "none",
+  "corda_config": null,
+  "eva_config": null,
+  "exclude_modules": null,
   "fan_in_fan_out": false,
   "inference_mode": true,
   "init_lora_weights": true,
   "layers_to_transform": null,
   "loftq_config": {},
   "lora_alpha": 256,
+  "lora_bias": false,
   "lora_dropout": 0.1,
   "megatron_config": null,
   "megatron_core": "megatron.core",
+  "modules_to_save": null,
   "peft_type": "LORA",
   "r": 128,
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
     "gate_proj",
+    "v_proj",
     "q_proj",
+    "k_proj",
+    "down_proj",
     "o_proj",
+    "lm_head",
+    "up_proj"
   ],
   "task_type": "CAUSAL_LM",
+  "trainable_token_indices": null,
   "use_dora": false,
   "use_rslora": false
 }

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a5d1546255d34f3dc2901fa11c692ec5c82cdbd7118cf88e6f9a4bfff52a52e8
-size 212982848

 version https://git-lfs.github.com/spec/v1
+oid sha256:9f091d40d50198e530f01b9a25487cd690a670b42ab8b3fa59ef973cece5faa3
+size 238444008

tokenizer_config.json CHANGED Viewed

@@ -158,7 +158,6 @@
     "<empty_output>"
   ],
   "bos_token": "<|endoftext|>",
-  "chat_template": "{% if not add_generation_prompt is defined %}{% set add_generation_prompt = false %}{% endif %}{% set loop_messages = messages %}{% for message in loop_messages %}{% set content = '<|start_header_id|>' + message['role'] + '<|end_header_id|>\n\n'+ message['content'] | trim + '<|eot_id|>' %}{% if loop.index0 == 0 %}{% set content = bos_token + content %}{% endif %}{{ content }}{% endfor %}{% if add_generation_prompt %}{{ '<|start_header_id|>assistant<|end_header_id|>\n\n' }}{% endif %}",
   "clean_up_tokenization_spaces": false,
   "eos_token": "<|endoftext|>",
   "extra_special_tokens": {},

     "<empty_output>"
   ],
   "bos_token": "<|endoftext|>",
   "clean_up_tokenization_spaces": false,
   "eos_token": "<|endoftext|>",
   "extra_special_tokens": {},

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4de8c82b3a1eb8557fc65c97f260c3a594685bcf8ee4b1039657d52e3136a0ec
-size 7096

 version https://git-lfs.github.com/spec/v1
+oid sha256:2f846d36aae485459ed98faa0c0b1bdadf6bf66458553293b2754e96264b2078
+size 5752