{
  "data": {
    "audio_bos_value": 1026,
    "audio_eos_value": 1024,
    "audio_length": 3072,
    "audio_pad_value": 1025,
    "channels": 9,
    "delay_pattern": [
      0,
      8,
      9,
      10,
      11,
      12,
      13,
      14,
      15
    ],
    "text_length": 1024,
    "text_pad_value": 0
  },
  "model": {
    "decoder": {
      "cross_head_dim": 128,
      "cross_query_heads": 16,
      "gqa_head_dim": 128,
      "gqa_query_heads": 16,
      "kv_heads": 4,
      "n_embd": 2048,
      "n_hidden": 8192,
      "n_layer": 18
    },
    "dropout": 0.0,
    "encoder": {
      "head_dim": 128,
      "n_embd": 1024,
      "n_head": 16,
      "n_hidden": 4096,
      "n_layer": 12
    },
    "normalization_layer_epsilon": 1e-05,
    "rope_max_timescale": 10000,
    "rope_min_timescale": 1,
    "src_vocab_size": 256,
    "tgt_vocab_size": 1028,
    "weight_dtype": "float32"
  },
  "training": {},
  "version": "0.1"
}