Upload folder using huggingface_hub

Files changed (3) hide show

README.md ADDED Viewed

+---
+library_name: peft
+tags:
+- generated_from_trainer
+datasets:
+- 05466d56569b55db_train_data.json
+base_model: defog/sqlcoder-7b-2
+model-index:
+- name: JacksonBrune/87230327-b73a-4d52-a711-20a7e1f47c73
+  results: []
+---
+<!-- This model card has been generated automatically according to the information the Trainer had access to. You
+should probably proofread and complete it, then remove this comment. -->
+# JacksonBrune/87230327-b73a-4d52-a711-20a7e1f47c73
+This model is a LoRA adapter fine-tuned from [defog/sqlcoder-7b-2](https://huggingface.co/defog/sqlcoder-7b-2) on the 05466d56569b55db_train_data.json dataset; it was not trained from scratch.
+It achieves the following results on the evaluation set:
+- Loss: 1.1037
+## Model description
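+A PEFT LoRA adapter for the causal language model defog/sqlcoder-7b-2. The adapter uses rank 128, alpha 256, and dropout 0.05, is initialized with EVA, and targets the attention and MLP projection layers (`q_proj`, `k_proj`, `v_proj`, `o_proj`, `gate_proj`, `up_proj`, `down_proj`). More information needed on the training objective and data.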
+## Intended uses & limitations
+More information needed
+## Training and evaluation data
+More information needed
+### Framework versions
+- PEFT 0.15.0
+- Transformers 4.50.3
+- Pytorch 2.5.1+cu124
+- Datasets 3.5.0
+- Tokenizers 0.21.1

adapter_config.json ADDED Viewed

+{
+    "alpha_pattern": {},
+    "auto_mapping": null,
+    "base_model_name_or_path": "defog/sqlcoder-7b-2",
+    "bias": "none",
+    "corda_config": null,
+    "eva_config": {
+        "adjust_scaling_factors": true,
+        "label_mask_value": -100,
+        "rho": 2.0,
+        "tau": 0.99,
+        "use_label_mask": true,
+        "whiten": false
+    },
+    "exclude_modules": null,
+    "fan_in_fan_out": null,
+    "inference_mode": true,
+    "init_lora_weights": "eva",
+    "layer_replication": null,
+    "layers_pattern": null,
+    "layers_to_transform": null,
+    "loftq_config": {},
+    "lora_alpha": 256,
+    "lora_bias": false,
+    "lora_dropout": 0.05,
+    "megatron_config": null,
+    "megatron_core": "megatron.core",
+    "modules_to_save": null,
+    "peft_type": "LORA",
+    "r": 128,
+    "rank_pattern": {},
+    "revision": null,
+    "target_modules": [
+        "(?:language_model.)?model.layers.[\\d]+.(mlp|cross_attn|self_attn).(up|down|gate|q|k|v|o)_proj",
+        "gate_proj",
+        "down_proj",
+        "k_proj",
+        "v_proj",
+        "q_proj",
+        "o_proj",
+        "up_proj"
+    ],
+    "task_type": "CAUSAL_LM",
+    "trainable_token_indices": null,
+    "use_dora": false,
+    "use_rslora": false
+}

adapter_model.safetensors ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:6be6f698d008927596126dfbbcc9095b4b56443c87d507154df5a679c98849c1
+size 639692768