Push model using huggingface_hub.

Files changed (3) hide show

README.md ADDED Viewed

+---
+license: apache-2.0
+pipeline_tag: text-to-speech
+tags:
+- model_hub_mixin
+- pytorch_model_hub_mixin
+---
+This model has been pushed to the Hub using the [PyTorchModelHubMixin](https://huggingface.co/docs/huggingface_hub/package_reference/mixins#huggingface_hub.PyTorchModelHubMixin) integration:
+- Code: https://github.com/nari-labs/dia
+- Paper: [More Information Needed]
+- Docs: [More Information Needed]

config.json ADDED Viewed

+{
+  "data": {
+    "audio_bos_value": 1026,
+    "audio_eos_value": 1024,
+    "audio_length": 3072,
+    "audio_pad_value": 1025,
+    "channels": 9,
+    "delay_pattern": [
+      0,
+      8,
+      9,
+      10,
+      11,
+      12,
+      13,
+      14,
+      15
+    ],
+    "text_length": 1024,
+    "text_pad_value": 0
+  },
+  "model": {
+    "decoder": {
+      "cross_head_dim": 128,
+      "cross_query_heads": 16,
+      "gqa_head_dim": 128,
+      "gqa_query_heads": 16,
+      "kv_heads": 4,
+      "n_embd": 2048,
+      "n_hidden": 8192,
+      "n_layer": 18
+    },
+    "dropout": 0.0,
+    "encoder": {
+      "head_dim": 128,
+      "n_embd": 1024,
+      "n_head": 16,
+      "n_hidden": 4096,
+      "n_layer": 12
+    },
+    "normalization_layer_epsilon": 1e-05,
+    "rope_max_timescale": 10000,
+    "rope_min_timescale": 1,
+    "src_vocab_size": 256,
+    "tgt_vocab_size": 1028,
+    "weight_dtype": "float32"
+  },
+  "training": {},
+  "version": "0.1"
+}

model.safetensors ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:caba289b60f6d7d1e58fc744f4dc25aae88995fcca46be3d05e220b971486a26
+size 6444682848