Upload Qwen2ForCausalLM
- config.json +4 -4
- model.safetensors +2 -2
config.json CHANGED
@@ -4,15 +4,15 @@
   ],
   "attention_dropout": 0.0,
   "hidden_act": "silu",
-  "hidden_size":
+  "hidden_size": 128,
   "initializer_range": 0.02,
-  "intermediate_size":
+  "intermediate_size": 512,
   "max_position_embeddings": 32768,
   "max_window_layers": 28,
   "model_type": "qwen2",
-  "num_attention_heads":
+  "num_attention_heads": 2,
   "num_hidden_layers": 4,
-  "num_key_value_heads":
+  "num_key_value_heads": 2,
   "rms_norm_eps": 1e-06,
   "rope_scaling": null,
   "rope_theta": 10000.0,
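The new values describe a very small Qwen2 model: hidden_size 128, intermediate_size 512, 4 hidden layers, and 2 attention heads with 2 key/value heads. As a minimal sketch (not part of this upload), the snippet below rebuilds an equivalent configuration with transformers' Qwen2Config and instantiates a randomly initialized Qwen2ForCausalLM; fields not visible in this diff, such as vocab_size, are left at Qwen2Config defaults and may differ from the uploaded checkpoint.

from transformers import Qwen2Config, Qwen2ForCausalLM

# Tiny Qwen2 configuration mirroring the values visible in the diff above.
# Anything not shown there (e.g. vocab_size, tie_word_embeddings) falls back
# to Qwen2Config defaults and may not match the uploaded checkpoint.
config = Qwen2Config(
    hidden_size=128,
    intermediate_size=512,
    num_hidden_layers=4,
    num_attention_heads=2,
    num_key_value_heads=2,
    max_position_embeddings=32768,
    max_window_layers=28,
    hidden_act="silu",
    initializer_range=0.02,
    rms_norm_eps=1e-06,
    rope_theta=10000.0,
    attention_dropout=0.0,
)

model = Qwen2ForCausalLM(config)  # randomly initialized, same architecture
print(f"{sum(p.numel() for p in model.parameters()):,} parameters")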
model.safetensors CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:
-size
+oid sha256:70c4ddcf0d5e66b1567f1092a89b3ec5a49d2423c0cdaee0839229adbd864f07
+size 4239064
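Because model.safetensors is tracked with Git LFS, the repository stores only this pointer file; the weights themselves live in LFS storage and are identified by the sha256 oid and byte size above. A minimal sketch, assuming the real file has already been downloaded into the working directory, of checking it against the pointer:

import hashlib
import os

# Values copied from the LFS pointer in the diff above.
EXPECTED_OID = "70c4ddcf0d5e66b1567f1092a89b3ec5a49d2423c0cdaee0839229adbd864f07"
EXPECTED_SIZE = 4239064
PATH = "model.safetensors"  # assumption: the resolved file, not the pointer

# Compare the file's byte size with the size recorded in the pointer.
assert os.path.getsize(PATH) == EXPECTED_SIZE, "size mismatch"

# Hash the file in chunks and compare with the recorded sha256 oid.
sha = hashlib.sha256()
with open(PATH, "rb") as f:
    for chunk in iter(lambda: f.read(1 << 20), b""):
        sha.update(chunk)
assert sha.hexdigest() == EXPECTED_OID, "sha256 mismatch"

print("model.safetensors matches the LFS pointer")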