nari-labs
/

Dia-1.6B-0626

model_hub_mixin

pytorch_model_hub_mixin

Model card | Files and versions

buttercrab committed on Jun 24

Commit

a7aa612

·

verified ·

1 Parent(s): d1981a1

Upload 2 files

Files changed (2) hide show

config.json +50 -0
preprocessor_config.json +7 -0

config.json ADDED Viewed

	@@ -0,0 +1,50 @@

+{
+  "data": {
+    "audio_bos_value": 1026,
+    "audio_eos_value": 1024,
+    "audio_length": 3072,
+    "audio_pad_value": 1025,
+    "channels": 9,
+    "delay_pattern": [
+      0,
+      8,
+      9,
+      10,
+      11,
+      12,
+      13,
+      14,
+      15
+    ],
+    "text_length": 1024,
+    "text_pad_value": 0
+  },
+  "model": {
+    "decoder": {
+      "cross_head_dim": 128,
+      "cross_query_heads": 16,
+      "gqa_head_dim": 128,
+      "gqa_query_heads": 16,
+      "kv_heads": 4,
+      "n_embd": 2048,
+      "n_hidden": 8192,
+      "n_layer": 18
+    },
+    "dropout": 0.0,
+    "encoder": {
+      "head_dim": 128,
+      "n_embd": 1024,
+      "n_head": 16,
+      "n_hidden": 4096,
+      "n_layer": 12
+    },
+    "normalization_layer_epsilon": 1e-05,
+    "rope_max_timescale": 10000,
+    "rope_min_timescale": 1,
+    "src_vocab_size": 256,
+    "tgt_vocab_size": 1028,
+    "weight_dtype": "float32"
+  },
+  "training": {},
+  "version": "0.1"
+}

preprocessor_config.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "feature_extractor_type": "DacFeatureExtractor",
+  "processor_class": "DiaProcessor",
+  "audio_eos_value": 1024,
+  "audio_pad_value": 1025,
+  "audio_bos_value": 1026
+}