AlSamCur123 committed on
Commit
7623f17
·
verified ·
1 Parent(s): d16f729

Trained with Unsloth

Browse files
config.json CHANGED
@@ -1,3 +1,30 @@
1
  {
2
- "model_type": "mistral"
3
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
  {
2
+ "_name_or_path": "AlSamCur123/Nemo-InstructContinuedFine",
3
+ "architectures": [
4
+ "MistralForCausalLM"
5
+ ],
6
+ "attention_dropout": 0.0,
7
+ "bos_token_id": 1,
8
+ "eos_token_id": 2,
9
+ "head_dim": 128,
10
+ "hidden_act": "silu",
11
+ "hidden_size": 5120,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 14336,
14
+ "max_position_embeddings": 1024000,
15
+ "model_type": "mistral",
16
+ "num_attention_heads": 32,
17
+ "num_hidden_layers": 40,
18
+ "num_key_value_heads": 8,
19
+ "pad_token_id": 10,
20
+ "rms_norm_eps": 1e-05,
21
+ "rope_scaling": null,
22
+ "rope_theta": 1000000.0,
23
+ "sliding_window": null,
24
+ "tie_word_embeddings": false,
25
+ "torch_dtype": "float16",
26
+ "transformers_version": "4.47.1",
27
+ "unsloth_version": "2025.1.7",
28
+ "use_cache": true,
29
+ "vocab_size": 131072
30
+ }
model-00001-of-00005.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:15ac87eb2ae1b2b358b9201f9b055fcb7002e7e4b67f4581423f80fcc0de0b2a
3
  size 4865522432
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:acf373ff7b78cc0f9a77655ae011dd30aeb68519046b41f22d13b4322352247b
3
  size 4865522432
model-00002-of-00005.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:14aa2d28d5eaa7bff197aa04d3983fcdbc38ca5e8813597178462f46997d1c58
3
  size 4907529344
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:abaab8df157d57f031b3bff9f411905fb77cf161cf52a65fcc06db3454ff6c02
3
  size 4907529344
model-00003-of-00005.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:35a2fc7ff05dd0605115feb7cb50d7e8605ced50664d60acad76f2b87a21063d
3
  size 4907529376
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5dade7bea3b7294c8b43cb56d57f76fe3d4d99f020fe5b50f9b548a2a48e5a78
3
  size 4907529376
model-00004-of-00005.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f9a41cb97f4ddb2f24d0ebc2f8f51d4f3956517f750d816129085970f3925311
3
  size 4907529376
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a29e9ada68c69a9de4fc8560ee6417998ffcbff1824ac8d72abd62975a64016a
3
  size 4907529376
model-00005-of-00005.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b13d9b0018d06aacb330dbc57d90181242c6ff9bea993597e66a5fb45cad1e82
3
  size 4907496208
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:213d9161b0219292a6d6f7f0bfeba6e872cd7321ab5a884dd3b9500f9a59e17e
3
  size 4907496208