Dia-1.6B / config.json
NariLabs's picture
Push model using huggingface_hub.
ed6eb51 verified
raw
history blame contribute delete
941 Bytes
{
"data": {
"audio_bos_value": 1026,
"audio_eos_value": 1024,
"audio_length": 3072,
"audio_pad_value": 1025,
"channels": 9,
"delay_pattern": [
0,
8,
9,
10,
11,
12,
13,
14,
15
],
"text_length": 1024,
"text_pad_value": 0
},
"model": {
"decoder": {
"cross_head_dim": 128,
"cross_query_heads": 16,
"gqa_head_dim": 128,
"gqa_query_heads": 16,
"kv_heads": 4,
"n_embd": 2048,
"n_hidden": 8192,
"n_layer": 18
},
"dropout": 0.0,
"encoder": {
"head_dim": 128,
"n_embd": 1024,
"n_head": 16,
"n_hidden": 4096,
"n_layer": 12
},
"normalization_layer_epsilon": 1e-05,
"rope_max_timescale": 10000,
"rope_min_timescale": 1,
"src_vocab_size": 256,
"tgt_vocab_size": 1028,
"weight_dtype": "float32"
},
"training": {},
"version": "0.1"
}