Training in progress, step 25
Browse files
- adapter_config.json +34 -0
- adapter_model.safetensors +3 -0
- config.json +30 -0
- special_tokens_map.json +30 -0
- tokenizer.json +0 -0
- tokenizer.model +3 -0
- tokenizer_config.json +0 -0
- training_args.bin +3 -0
    	
        adapter_config.json
    ADDED
    
    | @@ -0,0 +1,34 @@ | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            {
         | 
| 2 | 
            +
              "alpha_pattern": {},
         | 
| 3 | 
            +
              "auto_mapping": null,
         | 
| 4 | 
            +
              "base_model_name_or_path": "unsloth/mistral-7b-instruct-v0.3",
         | 
| 5 | 
            +
              "bias": "none",
         | 
| 6 | 
            +
              "fan_in_fan_out": null,
         | 
| 7 | 
            +
              "inference_mode": true,
         | 
| 8 | 
            +
              "init_lora_weights": true,
         | 
| 9 | 
            +
              "layer_replication": null,
         | 
| 10 | 
            +
              "layers_pattern": null,
         | 
| 11 | 
            +
              "layers_to_transform": null,
         | 
| 12 | 
            +
              "loftq_config": {},
         | 
| 13 | 
            +
              "lora_alpha": 64,
         | 
| 14 | 
            +
              "lora_dropout": 0.05,
         | 
| 15 | 
            +
              "megatron_config": null,
         | 
| 16 | 
            +
              "megatron_core": "megatron.core",
         | 
| 17 | 
            +
              "modules_to_save": null,
         | 
| 18 | 
            +
              "peft_type": "LORA",
         | 
| 19 | 
            +
              "r": 32,
         | 
| 20 | 
            +
              "rank_pattern": {},
         | 
| 21 | 
            +
              "revision": null,
         | 
| 22 | 
            +
              "target_modules": [
         | 
| 23 | 
            +
                "v_proj",
         | 
| 24 | 
            +
                "o_proj",
         | 
| 25 | 
            +
                "k_proj",
         | 
| 26 | 
            +
                "down_proj",
         | 
| 27 | 
            +
                "up_proj",
         | 
| 28 | 
            +
                "q_proj",
         | 
| 29 | 
            +
                "gate_proj"
         | 
| 30 | 
            +
              ],
         | 
| 31 | 
            +
              "task_type": "CAUSAL_LM",
         | 
| 32 | 
            +
              "use_dora": false,
         | 
| 33 | 
            +
              "use_rslora": false
         | 
| 34 | 
            +
            }
         | 
    	
        adapter_model.safetensors
    ADDED
    
    | @@ -0,0 +1,3 @@ | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:6c696cab0a3d3a6350c331a2fa51b164096d09045d83c85832605ebb6c37a08a
         | 
| 3 | 
            +
            size 335604696
         | 
    	
        config.json
    ADDED
    
    | @@ -0,0 +1,30 @@ | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            {
         | 
| 2 | 
            +
              "_attn_implementation_autoset": true,
         | 
| 3 | 
            +
              "_name_or_path": "unsloth/mistral-7b-instruct-v0.3",
         | 
| 4 | 
            +
              "architectures": [
         | 
| 5 | 
            +
                "MistralForCausalLM"
         | 
| 6 | 
            +
              ],
         | 
| 7 | 
            +
              "attention_dropout": 0.0,
         | 
| 8 | 
            +
              "bos_token_id": 1,
         | 
| 9 | 
            +
              "eos_token_id": 2,
         | 
| 10 | 
            +
              "head_dim": 128,
         | 
| 11 | 
            +
              "hidden_act": "silu",
         | 
| 12 | 
            +
              "hidden_size": 4096,
         | 
| 13 | 
            +
              "initializer_range": 0.02,
         | 
| 14 | 
            +
              "intermediate_size": 14336,
         | 
| 15 | 
            +
              "max_position_embeddings": 32768,
         | 
| 16 | 
            +
              "model_type": "mistral",
         | 
| 17 | 
            +
              "num_attention_heads": 32,
         | 
| 18 | 
            +
              "num_hidden_layers": 32,
         | 
| 19 | 
            +
              "num_key_value_heads": 8,
         | 
| 20 | 
            +
              "pad_token_id": 770,
         | 
| 21 | 
            +
              "rms_norm_eps": 1e-05,
         | 
| 22 | 
            +
              "rope_theta": 1000000.0,
         | 
| 23 | 
            +
              "sliding_window": null,
         | 
| 24 | 
            +
              "tie_word_embeddings": false,
         | 
| 25 | 
            +
              "torch_dtype": "bfloat16",
         | 
| 26 | 
            +
              "transformers_version": "4.46.0",
         | 
| 27 | 
            +
              "unsloth_version": "2024.9",
         | 
| 28 | 
            +
              "use_cache": false,
         | 
| 29 | 
            +
              "vocab_size": 32768
         | 
| 30 | 
            +
            }
         | 
    	
        special_tokens_map.json
    ADDED
    
    | @@ -0,0 +1,30 @@ | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            {
         | 
| 2 | 
            +
              "bos_token": {
         | 
| 3 | 
            +
                "content": "<s>",
         | 
| 4 | 
            +
                "lstrip": false,
         | 
| 5 | 
            +
                "normalized": false,
         | 
| 6 | 
            +
                "rstrip": false,
         | 
| 7 | 
            +
                "single_word": false
         | 
| 8 | 
            +
              },
         | 
| 9 | 
            +
              "eos_token": {
         | 
| 10 | 
            +
                "content": "</s>",
         | 
| 11 | 
            +
                "lstrip": false,
         | 
| 12 | 
            +
                "normalized": false,
         | 
| 13 | 
            +
                "rstrip": false,
         | 
| 14 | 
            +
                "single_word": false
         | 
| 15 | 
            +
              },
         | 
| 16 | 
            +
              "pad_token": {
         | 
| 17 | 
            +
                "content": "[control_768]",
         | 
| 18 | 
            +
                "lstrip": false,
         | 
| 19 | 
            +
                "normalized": false,
         | 
| 20 | 
            +
                "rstrip": false,
         | 
| 21 | 
            +
                "single_word": false
         | 
| 22 | 
            +
              },
         | 
| 23 | 
            +
              "unk_token": {
         | 
| 24 | 
            +
                "content": "<unk>",
         | 
| 25 | 
            +
                "lstrip": false,
         | 
| 26 | 
            +
                "normalized": false,
         | 
| 27 | 
            +
                "rstrip": false,
         | 
| 28 | 
            +
                "single_word": false
         | 
| 29 | 
            +
              }
         | 
| 30 | 
            +
            }
         | 
    	
        tokenizer.json
    ADDED
    
    | The diff for this file is too large to render. 
		See raw diff | 
|  | 
    	
        tokenizer.model
    ADDED
    
    | @@ -0,0 +1,3 @@ | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:37f00374dea48658ee8f5d0f21895b9bc55cb0103939607c8185bfd1c6ca1f89
         | 
| 3 | 
            +
            size 587404
         | 
    	
        tokenizer_config.json
    ADDED
    
    | The diff for this file is too large to render. 
		See raw diff | 
|  | 
    	
        training_args.bin
    ADDED
    
    | @@ -0,0 +1,3 @@ | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:9d401b9cfc85dbf263a7cf3ff2b450f4fcc8ea2fc50bf490703ff61e99681b31
         | 
| 3 | 
            +
            size 6840
         |