From 3ca3d8100fd45fc5e430afe8cc2628437c8be186 Mon Sep 17 00:00:00 2001
From: Cherrytest <cherrytest@163.com>
Date: Fri, 30 May 2025 01:08:13 +0000
Subject: [PATCH] Upload folder using ModelScope SDK

---
 README.md          |  130 ++--
 conds.pt           |    3 +
 configuration.json |    1 +
 s3gen.pt           |    3 +
 t3_cfg.pt          |    3 +
 tokenizer.json     | 1435 ++++++++++++++++++++++++++++++++++++++++++++
 ve.pt              |    3 +
 7 files changed, 1537 insertions(+), 41 deletions(-)
 create mode 100644 conds.pt
 create mode 100644 configuration.json
 create mode 100644 s3gen.pt
 create mode 100644 t3_cfg.pt
 create mode 100644 tokenizer.json
 create mode 100644 ve.pt
diff --git a/README.md b/README.md
index a2bd580..e21b3f4 100644
--- a/README.md
+++ b/README.md
@@ -1,47 +1,95 @@
 ---
-license: Apache License 2.0
-
-#model-type:
-##如 gpt、phi、llama、chatglm、baichuan 等
-#- gpt
-
-#domain:
-##如 nlp、cv、audio、multi-modal
-#- nlp
-
-#language:
-##语言代码列表 https://help.aliyun.com/document_detail/215387.html?spm=a2c4g.11186623.0.0.9f8d7467kni6Aa
-#- cn 
-
-#metrics:
-##如 CIDEr、Blue、ROUGE 等
-#- CIDEr
-
-#tags:
-##各种自定义，包括 pretrained、fine-tuned、instruction-tuned、RL-tuned 等训练方法和其他
-#- pretrained
-
-#tools:
-##如 vllm、fastchat、llamacpp、AdaSeq 等
-#- vllm
+license: mit
+language:
+- en
+tags:
+- text-to-speech
+- speech generation
+- voice-cloning
+pipeline_tag: text-to-speech
+library_name: chatterbox
 ---
-### 当前模型的贡献者未提供更加详细的模型介绍。模型文件和权重，可浏览“模型文件”页面获取。
-#### 您可以通过如下git clone命令，或者ModelScope SDK来下载模型
 
-SDK下载
-```bash
-#安装ModelScope
-pip install modelscope
+<img width="800" alt="cb-big2" src="https://github.com/user-attachments/assets/bd8c5f03-e91d-4ee5-b680-57355da204d1" />
+
+<h1 style="font-size: 32px">Chatterbox TTS</h1>
+
+<div style="display: flex; align-items: center; gap: 12px">
+  <a href="https://resemble-ai.github.io/chatterbox_demopage/">
+    <img src="https://img.shields.io/badge/listen-demo_samples-blue" alt="Listen to Demo Samples" />
+  </a>
+  <a href="https://huggingface.co/spaces/ResembleAI/Chatterbox">
+    <img src="https://huggingface.co/datasets/huggingface/badges/resolve/main/open-in-hf-spaces-sm.svg" alt="Open in HF Spaces" />
+  </a>
+  <a href="https://podonos.com/resembleai/chatterbox">
+    <img src="https://static-public.podonos.com/badges/insight-on-pdns-sm-dark.svg" alt="Insight on Podonos" />
+  </a>
+</div>
+
+<div style="display: flex; align-items: center; gap: 8px;">
+  <span style="font-style: italic;white-space: pre-wrap">Made with  ❤️  by</span>
+  <img width="100" alt="resemble-logo-horizontal" src="https://github.com/user-attachments/assets/35cf756b-3506-4943-9c72-c05ddfa4e525" />
+</div>
+
+
+We're excited to introduce Chatterbox, [Resemble AI's](https://resemble.ai) first production-grade open-source TTS model. Licensed under MIT, Chatterbox has been benchmarked against leading closed-source systems like ElevenLabs, and is consistently preferred in side-by-side evaluations.
+
+Whether you're working on memes, videos, games, or AI agents, Chatterbox brings your content to life. It's also the first open-source TTS model to support **emotion exaggeration control**, a powerful feature that makes your voices stand out. Try it now on our [Hugging Face Gradio app](https://huggingface.co/spaces/ResembleAI/Chatterbox).
+
+If you like the model but need to scale or tune it for higher accuracy, check out our competitively priced TTS service (<a href="https://resemble.ai">link</a>). It delivers reliable performance with ultra-low, sub-200 ms latency—ideal for production use in agents, applications, or interactive media.
+
+# Key Details
+- SoTA zero-shot TTS
+- 0.5B Llama backbone
+- Unique exaggeration/intensity control
+- Ultra-stable with alignment-informed inference
+- Trained on 0.5M hours of cleaned data
+- Watermarked outputs
+- Easy voice conversion script
+- [Outperforms ElevenLabs](https://podonos.com/resembleai/chatterbox)
+
+# Tips
+- **General Use (TTS and Voice Agents):**
+  - The default settings (`exaggeration=0.5`, `cfg=0.5`) work well for most prompts.
+  - If the reference speaker has a fast speaking style, lowering `cfg` to around `0.3` can improve pacing.
+
+- **Expressive or Dramatic Speech:**
+  - Try lower `cfg` values (e.g. `~0.3`) and increase `exaggeration` to around `0.7` or higher.
+  - Higher `exaggeration` tends to speed up speech; reducing `cfg` helps compensate with slower, more deliberate pacing.
+
+
+# Installation
 ```
+pip install chatterbox-tts
+```
+
+
+# Usage
 ```python
-#SDK模型下载
-from modelscope import snapshot_download
-model_dir = snapshot_download('ResembleAI/chatterbox')
-```
-Git下载
-```
-#Git模型下载
-git clone https://www.modelscope.cn/ResembleAI/chatterbox.git
-```
+import torchaudio as ta
+from chatterbox.tts import ChatterboxTTS
 
-<p style="color: lightgrey;">如果您是本模型的贡献者，我们邀请您根据<a href="https://modelscope.cn/docs/ModelScope%E6%A8%A1%E5%9E%8B%E6%8E%A5%E5%85%A5%E6%B5%81%E7%A8%8B%E6%A6%82%E8%A7%88" style="color: lightgrey; text-decoration: underline;">模型贡献文档</a>，及时完善模型卡片内容。</p>
\ No newline at end of file
+model = ChatterboxTTS.from_pretrained(device="cuda")
+
+text = "Ezreal and Jinx teamed up with Ahri, Yasuo, and Teemo to take down the enemy's Nexus in an epic late-game pentakill."
+wav = model.generate(text)
+ta.save("test-1.wav", wav, model.sr)
+
+# If you want to synthesize with a different voice, specify the audio prompt
+AUDIO_PROMPT_PATH="YOUR_FILE.wav"
+wav = model.generate(text, audio_prompt_path=AUDIO_PROMPT_PATH)
+ta.save("test-2.wav", wav, model.sr)
+```
+See `example_tts.py` for more examples.
+
+# Acknowledgements
+- [CosyVoice](https://github.com/FunAudioLLM/CosyVoice)
+- [HiFT-GAN](https://github.com/yl4579/HiFTNet)
+- [Llama 3](https://github.com/meta-llama/llama3)
+
+# Built-in PerTh Watermarking for Responsible AI
+
+Every audio file generated by Chatterbox includes [Resemble AI's PerTh (Perceptual Threshold) Watermarker](https://github.com/resemble-ai/perth) - imperceptible neural watermarks that survive MP3 compression, audio editing, and common manipulations while maintaining nearly 100% detection accuracy.
+
+# Disclaimer
+Don't use this model to do bad things. Prompts are sourced from freely available data on the internet.
\ No newline at end of file
diff --git a/conds.pt b/conds.pt
new file mode 100644
index 0000000..8df726b
--- /dev/null
+++ b/conds.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d8735c4576e072a701ab714206ab9e64972ea15fff6ef9ba5e83db7ce2b883f9
+size 131
diff --git a/configuration.json b/configuration.json
new file mode 100644
index 0000000..591fb74
--- /dev/null
+++ b/configuration.json
@@ -0,0 +1 @@
+{"framework": "pytorch", "task": "text-to-speech", "allow_remote": true}
\ No newline at end of file
diff --git a/s3gen.pt b/s3gen.pt
new file mode 100644
index 0000000..2892e72
--- /dev/null
+++ b/s3gen.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f4b4eaf6211ebb34eb9fdc6c06f325e9184e8becce81d941a6d7f13ffae07f7d
+size 135
diff --git a/t3_cfg.pt b/t3_cfg.pt
new file mode 100644
index 0000000..b8e7ffc
--- /dev/null
+++ b/t3_cfg.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1f5841c51b445f505f448594b622c089bb488dd82410419632643b665cfa68d1
+size 135
diff --git a/tokenizer.json b/tokenizer.json
new file mode 100644
index 0000000..abd07c7
--- /dev/null
+++ b/tokenizer.json
@@ -0,0 +1,1435 @@
+{
+  "version": "1.0",
+  "truncation": null,
+  "padding": null,
+  "added_tokens": [
+    {
+      "id": 0,
+      "special": true,
+      "content": "[STOP]",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false
+    },
+    {
+      "id": 1,
+      "special": true,
+      "content": "[UNK]",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false
+    },
+    {
+      "id": 2,
+      "special": true,
+      "content": "[SPACE]",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false
+    },
+    {
+      "id": 255,
+      "special": true,
+      "content": "[START]",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false
+    },
+    {
+      "id": 604,
+      "content": "[UH]",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 605,
+      "content": "[UM]",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 606,
+      "content": "[giggle]",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 607,
+      "content": "[laughter]",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 608,
+      "content": "[guffaw]",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 609,
+      "content": "[inhale]",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 610,
+      "content": "[exhale]",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 611,
+      "content": "[sigh]",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 612,
+      "content": "[cry]",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 613,
+      "content": "[bark]",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 614,
+      "content": "[howl]",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 615,
+      "content": "[meow]",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 616,
+      "content": "[singing]",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 617,
+      "content": "[music]",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 618,
+      "content": "[whistle]",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 619,
+      "content": "[humming]",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 620,
+      "content": "[gasp]",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 621,
+      "content": "[groan]",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 622,
+      "content": "[whisper]",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 623,
+      "content": "[mumble]",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 624,
+      "content": "[sniff]",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 625,
+      "content": "[sneeze]",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 626,
+      "content": "[cough]",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 627,
+      "content": "[snore]",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 628,
+      "content": "[chew]",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 629,
+      "content": "[sip]",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 630,
+      "content": "[clear_throat]",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 631,
+      "content": "[kiss]",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 632,
+      "content": "[shhh]",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 633,
+      "content": "[gibberish]",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 634,
+      "content": "[fr]",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 635,
+      "content": "[es]",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 636,
+      "content": "[de]",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 637,
+      "content": "[it]",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 638,
+      "content": "[ipa]",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 639,
+      "content": "[end_of_label]",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 695,
+      "content": "[PLACEHOLDER55]",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 696,
+      "content": "[PLACEHOLDER56]",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 697,
+      "content": "[PLACEHOLDER57]",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 698,
+      "content": "[PLACEHOLDER58]",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 699,
+      "content": "[PLACEHOLDER59]",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 700,
+      "content": "[PLACEHOLDER60]",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 701,
+      "content": "[PLACEHOLDER61]",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 702,
+      "content": "[PLACEHOLDER62]",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 703,
+      "content": "[PLACEHOLDER63]",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    }
+  ],
+  "normalizer": null,
+  "pre_tokenizer": {
+    "type": "Whitespace"
+  },
+  "post_processor": null,
+  "decoder": null,
+  "model": {
+    "type": "BPE",
+    "dropout": null,
+    "unk_token": "[UNK]",
+    "continuing_subword_prefix": null,
+    "end_of_word_suffix": null,
+    "fuse_unk": false,
+    "vocab": {
+      "[STOP]": 0,
+      "[UNK]": 1,
+      "[SPACE]": 2,
+      "!": 3,
+      "'": 4,
+      "(": 5,
+      ")": 6,
+      ",": 7,
+      "-": 8,
+      ".": 9,
+      "/": 10,
+      ":": 11,
+      ";": 12,
+      "?": 13,
+      "a": 14,
+      "b": 15,
+      "c": 16,
+      "d": 17,
+      "e": 18,
+      "f": 19,
+      "g": 20,
+      "h": 21,
+      "i": 22,
+      "j": 23,
+      "k": 24,
+      "l": 25,
+      "m": 26,
+      "n": 27,
+      "o": 28,
+      "p": 29,
+      "q": 30,
+      "r": 31,
+      "s": 32,
+      "t": 33,
+      "u": 34,
+      "v": 35,
+      "w": 36,
+      "x": 37,
+      "y": 38,
+      "z": 39,
+      "th": 40,
+      "in": 41,
+      "the": 42,
+      "an": 43,
+      "er": 44,
+      "ou": 45,
+      "re": 46,
+      "on": 47,
+      "at": 48,
+      "ed": 49,
+      "en": 50,
+      "to": 51,
+      "ing": 52,
+      "and": 53,
+      "is": 54,
+      "as": 55,
+      "al": 56,
+      "or": 57,
+      "of": 58,
+      "ar": 59,
+      "it": 60,
+      "es": 61,
+      "he": 62,
+      "st": 63,
+      "le": 64,
+      "om": 65,
+      "se": 66,
+      "be": 67,
+      "ad": 68,
+      "ow": 69,
+      "ly": 70,
+      "ch": 71,
+      "wh": 72,
+      "that": 73,
+      "you": 74,
+      "li": 75,
+      "ve": 76,
+      "ac": 77,
+      "ti": 78,
+      "ld": 79,
+      "me": 80,
+      "was": 81,
+      "gh": 82,
+      "id": 83,
+      "ll": 84,
+      "wi": 85,
+      "ent": 86,
+      "for": 87,
+      "ay": 88,
+      "ro": 89,
+      "ver": 90,
+      "ic": 91,
+      "her": 92,
+      "ke": 93,
+      "his": 94,
+      "no": 95,
+      "ut": 96,
+      "un": 97,
+      "ir": 98,
+      "lo": 99,
+      "we": 100,
+      "ri": 101,
+      "ha": 102,
+      "with": 103,
+      "ght": 104,
+      "out": 105,
+      "im": 106,
+      "ion": 107,
+      "all": 108,
+      "ab": 109,
+      "one": 110,
+      "ne": 111,
+      "ge": 112,
+      "ould": 113,
+      "ter": 114,
+      "mo": 115,
+      "had": 116,
+      "ce": 117,
+      "she": 118,
+      "go": 119,
+      "sh": 120,
+      "ur": 121,
+      "am": 122,
+      "so": 123,
+      "pe": 124,
+      "my": 125,
+      "de": 126,
+      "are": 127,
+      "but": 128,
+      "ome": 129,
+      "fr": 130,
+      "ther": 131,
+      "fe": 132,
+      "su": 133,
+      "do": 134,
+      "con": 135,
+      "te": 136,
+      "ain": 137,
+      "ere": 138,
+      "po": 139,
+      "if": 140,
+      "they": 141,
+      "us": 142,
+      "ag": 143,
+      "tr": 144,
+      "now": 145,
+      "oun": 146,
+      "this": 147,
+      "have": 148,
+      "not": 149,
+      "sa": 150,
+      "il": 151,
+      "up": 152,
+      "thing": 153,
+      "from": 154,
+      "ap": 155,
+      "him": 156,
+      "ack": 157,
+      "ation": 158,
+      "ant": 159,
+      "our": 160,
+      "op": 161,
+      "like": 162,
+      "ust": 163,
+      "ess": 164,
+      "bo": 165,
+      "ok": 166,
+      "ul": 167,
+      "ind": 168,
+      "ex": 169,
+      "com": 170,
+      "some": 171,
+      "there": 172,
+      "ers": 173,
+      "co": 174,
+      "res": 175,
+      "man": 176,
+      "ard": 177,
+      "pl": 178,
+      "wor": 179,
+      "way": 180,
+      "tion": 181,
+      "fo": 182,
+      "ca": 183,
+      "were": 184,
+      "by": 185,
+      "ate": 186,
+      "pro": 187,
+      "ted": 188,
+      "ound": 189,
+      "own": 190,
+      "would": 191,
+      "ts": 192,
+      "what": 193,
+      "qu": 194,
+      "ally": 195,
+      "ight": 196,
+      "ck": 197,
+      "gr": 198,
+      "when": 199,
+      "ven": 200,
+      "can": 201,
+      "ough": 202,
+      "ine": 203,
+      "end": 204,
+      "per": 205,
+      "ous": 206,
+      "od": 207,
+      "ide": 208,
+      "know": 209,
+      "ty": 210,
+      "very": 211,
+      "si": 212,
+      "ak": 213,
+      "who": 214,
+      "about": 215,
+      "ill": 216,
+      "them": 217,
+      "est": 218,
+      "red": 219,
+      "ye": 220,
+      "could": 221,
+      "ong": 222,
+      "your": 223,
+      "their": 224,
+      "em": 225,
+      "just": 226,
+      "other": 227,
+      "into": 228,
+      "any": 229,
+      "whi": 230,
+      "um": 231,
+      "tw": 232,
+      "ast": 233,
+      "der": 234,
+      "did": 235,
+      "ie": 236,
+      "been": 237,
+      "ace": 238,
+      "ink": 239,
+      "ity": 240,
+      "back": 241,
+      "ting": 242,
+      "br": 243,
+      "more": 244,
+      "ake": 245,
+      "pp": 246,
+      "then": 247,
+      "sp": 248,
+      "el": 249,
+      "use": 250,
+      "bl": 251,
+      "said": 252,
+      "over": 253,
+      "get": 254,
+      "[START]": 255,
+      "\"": 256,
+      "#": 257,
+      "$": 258,
+      "%": 259,
+      "&": 260,
+      "*": 261,
+      "+": 262,
+      "0": 263,
+      "1": 264,
+      "2": 265,
+      "3": 266,
+      "4": 267,
+      "5": 268,
+      "6": 269,
+      "7": 270,
+      "8": 271,
+      "9": 272,
+      "<": 273,
+      "=": 274,
+      ">": 275,
+      "@": 276,
+      "A": 277,
+      "B": 278,
+      "C": 279,
+      "D": 280,
+      "E": 281,
+      "F": 282,
+      "G": 283,
+      "H": 284,
+      "I": 285,
+      "J": 286,
+      "K": 287,
+      "L": 288,
+      "M": 289,
+      "N": 290,
+      "O": 291,
+      "P": 292,
+      "Q": 293,
+      "R": 294,
+      "S": 295,
+      "T": 296,
+      "U": 297,
+      "V": 298,
+      "W": 299,
+      "X": 300,
+      "Y": 301,
+      "Z": 302,
+      "[": 303,
+      "\\": 304,
+      "]": 305,
+      "^": 306,
+      "_": 307,
+      "`": 308,
+      "{": 309,
+      "|": 310,
+      "}": 311,
+      "~": 312,
+      "‐": 313,
+      "‑": 314,
+      "‒": 315,
+      "–": 316,
+      "—": 317,
+      "―": 318,
+      "‖": 319,
+      "‗": 320,
+      "‘": 321,
+      "’": 322,
+      "‚": 323,
+      "‛": 324,
+      "“": 325,
+      "”": 326,
+      "„": 327,
+      "‟": 328,
+      " ": 329,
+      "¡": 330,
+      "¢": 331,
+      "£": 332,
+      "¤": 333,
+      "¥": 334,
+      "¦": 335,
+      "§": 336,
+      "¨": 337,
+      "©": 338,
+      "ª": 339,
+      "«": 340,
+      "¬": 341,
+      "­": 342,
+      "®": 343,
+      "¯": 344,
+      "°": 345,
+      "±": 346,
+      "²": 347,
+      "³": 348,
+      "´": 349,
+      "µ": 350,
+      "¶": 351,
+      "·": 352,
+      "¸": 353,
+      "¹": 354,
+      "º": 355,
+      "»": 356,
+      "¼": 357,
+      "½": 358,
+      "¾": 359,
+      "¿": 360,
+      "À": 361,
+      "Á": 362,
+      "Â": 363,
+      "Ã": 364,
+      "Ä": 365,
+      "Å": 366,
+      "Æ": 367,
+      "Ç": 368,
+      "È": 369,
+      "É": 370,
+      "Ê": 371,
+      "Ë": 372,
+      "Ì": 373,
+      "Í": 374,
+      "Î": 375,
+      "Ï": 376,
+      "Ð": 377,
+      "Ñ": 378,
+      "Ò": 379,
+      "Ó": 380,
+      "Ô": 381,
+      "Õ": 382,
+      "Ö": 383,
+      "×": 384,
+      "Ø": 385,
+      "Ù": 386,
+      "Ú": 387,
+      "Û": 388,
+      "Ü": 389,
+      "Ý": 390,
+      "Þ": 391,
+      "ß": 392,
+      "à": 393,
+      "á": 394,
+      "â": 395,
+      "ã": 396,
+      "ä": 397,
+      "å": 398,
+      "æ": 399,
+      "ç": 400,
+      "è": 401,
+      "é": 402,
+      "ê": 403,
+      "ë": 404,
+      "ì": 405,
+      "í": 406,
+      "î": 407,
+      "ï": 408,
+      "ð": 409,
+      "ñ": 410,
+      "ò": 411,
+      "ó": 412,
+      "ô": 413,
+      "õ": 414,
+      "ö": 415,
+      "÷": 416,
+      "ø": 417,
+      "ù": 418,
+      "ú": 419,
+      "û": 420,
+      "ü": 421,
+      "ý": 422,
+      "þ": 423,
+      "ÿ": 424,
+      "ɐ": 425,
+      "ɑ": 426,
+      "ɒ": 427,
+      "ɓ": 428,
+      "ɔ": 429,
+      "ɕ": 430,
+      "ɖ": 431,
+      "ɗ": 432,
+      "ɘ": 433,
+      "ə": 434,
+      "ɚ": 435,
+      "ɛ": 436,
+      "ɜ": 437,
+      "ɝ": 438,
+      "ɞ": 439,
+      "ɟ": 440,
+      "ɠ": 441,
+      "ɡ": 442,
+      "ɢ": 443,
+      "ɣ": 444,
+      "ɤ": 445,
+      "ɥ": 446,
+      "ɦ": 447,
+      "ɧ": 448,
+      "ɨ": 449,
+      "ɩ": 450,
+      "ɪ": 451,
+      "ɫ": 452,
+      "ɬ": 453,
+      "ɭ": 454,
+      "ɮ": 455,
+      "ɯ": 456,
+      "ɰ": 457,
+      "ɱ": 458,
+      "ɲ": 459,
+      "ɳ": 460,
+      "ɴ": 461,
+      "ɵ": 462,
+      "ɶ": 463,
+      "ɷ": 464,
+      "ɸ": 465,
+      "ɹ": 466,
+      "ɺ": 467,
+      "ɻ": 468,
+      "ɼ": 469,
+      "ɽ": 470,
+      "ɾ": 471,
+      "ɿ": 472,
+      "ʀ": 473,
+      "ʁ": 474,
+      "ʂ": 475,
+      "ʃ": 476,
+      "ʄ": 477,
+      "ʅ": 478,
+      "ʆ": 479,
+      "ʇ": 480,
+      "ʈ": 481,
+      "ʉ": 482,
+      "ʊ": 483,
+      "ʋ": 484,
+      "ʌ": 485,
+      "ʍ": 486,
+      "ʎ": 487,
+      "ʏ": 488,
+      "ʐ": 489,
+      "ʑ": 490,
+      "ʒ": 491,
+      "ʓ": 492,
+      "ʔ": 493,
+      "ʕ": 494,
+      "ʖ": 495,
+      "ʗ": 496,
+      "ʘ": 497,
+      "ʙ": 498,
+      "ʚ": 499,
+      "ʛ": 500,
+      "ʜ": 501,
+      "ʝ": 502,
+      "ʞ": 503,
+      "ʟ": 504,
+      "ʠ": 505,
+      "ʡ": 506,
+      "ʢ": 507,
+      "ʣ": 508,
+      "ʤ": 509,
+      "ʥ": 510,
+      "ʦ": 511,
+      "ʧ": 512,
+      "ʨ": 513,
+      "ʩ": 514,
+      "ʪ": 515,
+      "ʫ": 516,
+      "ʬ": 517,
+      "ʭ": 518,
+      "ʮ": 519,
+      "ʯ": 520,
+      "ʰ": 521,
+      "ʱ": 522,
+      "ʲ": 523,
+      "ʳ": 524,
+      "ʴ": 525,
+      "ʵ": 526,
+      "ʶ": 527,
+      "ʷ": 528,
+      "ʸ": 529,
+      "ʹ": 530,
+      "ʺ": 531,
+      "ʻ": 532,
+      "ʼ": 533,
+      "ʽ": 534,
+      "ʾ": 535,
+      "ʿ": 536,
+      "ˀ": 537,
+      "ˁ": 538,
+      "˂": 539,
+      "˃": 540,
+      "˄": 541,
+      "˅": 542,
+      "ˆ": 543,
+      "ˇ": 544,
+      "ˈ": 545,
+      "ˉ": 546,
+      "ˊ": 547,
+      "ˋ": 548,
+      "ˌ": 549,
+      "ˍ": 550,
+      "ˎ": 551,
+      "ˏ": 552,
+      "ː": 553,
+      "ˑ": 554,
+      "˒": 555,
+      "˓": 556,
+      "˔": 557,
+      "˕": 558,
+      "˖": 559,
+      "˗": 560,
+      "˘": 561,
+      "˙": 562,
+      "˚": 563,
+      "˛": 564,
+      "˜": 565,
+      "˝": 566,
+      "˞": 567,
+      "˟": 568,
+      "ˠ": 569,
+      "ˡ": 570,
+      "ˢ": 571,
+      "ˣ": 572,
+      "ˤ": 573,
+      "˥": 574,
+      "˦": 575,
+      "˧": 576,
+      "˨": 577,
+      "˩": 578,
+      "˪": 579,
+      "˫": 580,
+      "ˬ": 581,
+      "˭": 582,
+      "ˮ": 583,
+      "˯": 584,
+      "˰": 585,
+      "˱": 586,
+      "˲": 587,
+      "˳": 588,
+      "˴": 589,
+      "˵": 590,
+      "˶": 591,
+      "˷": 592,
+      "˸": 593,
+      "˹": 594,
+      "˺": 595,
+      "˻": 596,
+      "˼": 597,
+      "˽": 598,
+      "˾": 599,
+      "˿": 600,
+      "ā": 601,
+      "ō": 602,
+      "…": 603,
+      "[UH]": 604,
+      "[UM]": 605,
+      "[giggle]": 606,
+      "[laughter]": 607,
+      "[guffaw]": 608,
+      "[inhale]": 609,
+      "[exhale]": 610,
+      "[sigh]": 611,
+      "[cry]": 612,
+      "[bark]": 613,
+      "[howl]": 614,
+      "[meow]": 615,
+      "[singing]": 616,
+      "[music]": 617,
+      "[whistle]": 618,
+      "[humming]": 619,
+      "[gasp]": 620,
+      "[groan]": 621,
+      "[whisper]": 622,
+      "[mumble]": 623,
+      "[sniff]": 624,
+      "[sneeze]": 625,
+      "[cough]": 626,
+      "[snore]": 627,
+      "[chew]": 628,
+      "[sip]": 629,
+      "[clear_throat]": 630,
+      "[kiss]": 631,
+      "[shhh]": 632,
+      "[gibberish]": 633,
+      "[fr]": 634,
+      "[es]": 635,
+      "[de]": 636,
+      "[it]": 637,
+      "[ipa]": 638,
+      "[end_of_label]": 639,
+      "ŋ": 640,
+      "ᵻ": 641,
+      "θ": 642,
+      "̩": 643,
+      "\u0303": 644,
+      "ɑː": 645,
+      "iː": 646,
+      "uː": 647,
+      "ɜː": 648,
+      "ɔː": 649,
+      "oː": 650,
+      "eɪ": 651,
+      "oʊ": 652,
+      "aɪ": 653,
+      "aʊ": 654,
+      "ɔɪ": 655,
+      "dʒ": 656,
+      "tʃ": 657,
+      "ɪŋ": 658,
+      "ᵻd": 659,
+      "ˈiː": 660,
+      "ˌiː": 661,
+      "ˈɪ": 662,
+      "ˌɪ": 663,
+      "ˈeɪ": 664,
+      "ˌeɪ": 665,
+      "ˈɛ": 666,
+      "ˌɛ": 667,
+      "ˈæ": 668,
+      "ˌæ": 669,
+      "ˈɑː": 670,
+      "ˌɑː": 671,
+      "ˈɔː": 672,
+      "ˌɔː": 673,
+      "oːɹ": 674,
+      "ˈoːɹ": 675,
+      "ˌoːɹ": 676,
+      "ˈoʊ": 677,
+      "ˌoʊ": 678,
+      "ˈʊ": 679,
+      "ˌʊ": 680,
+      "ˈuː": 681,
+      "ˌuː": 682,
+      "ˈɜː": 683,
+      "ˌɜː": 684,
+      "ˈʌ": 685,
+      "ˌʌ": 686,
+      "ˈaɪ": 687,
+      "ˌaɪ": 688,
+      "ˈaʊ": 689,
+      "ˌaʊ": 690,
+      "ˈɔɪ": 691,
+      "ˌɔɪ": 692,
+      "ˈɚ": 693,
+      "ˌɐ": 694,
+      "[PLACEHOLDER55]": 695,
+      "[PLACEHOLDER56]": 696,
+      "[PLACEHOLDER57]": 697,
+      "[PLACEHOLDER58]": 698,
+      "[PLACEHOLDER59]": 699,
+      "[PLACEHOLDER60]": 700,
+      "[PLACEHOLDER61]": 701,
+      "[PLACEHOLDER62]": 702,
+      "[PLACEHOLDER63]": 703
+    },
+    "merges": [
+      "t h",
+      "i n",
+      "th e",
+      "a n",
+      "e r",
+      "o u",
+      "r e",
+      "o n",
+      "a t",
+      "e d",
+      "e n",
+      "t o",
+      "in g",
+      "an d",
+      "i s",
+      "a s",
+      "a l",
+      "o r",
+      "o f",
+      "a r",
+      "i t",
+      "e s",
+      "h e",
+      "s t",
+      "l e",
+      "o m",
+      "s e",
+      "b e",
+      "a d",
+      "o w",
+      "l y",
+      "c h",
+      "w h",
+      "th at",
+      "y ou",
+      "l i",
+      "v e",
+      "a c",
+      "t i",
+      "l d",
+      "m e",
+      "w as",
+      "g h",
+      "i d",
+      "l l",
+      "w i",
+      "en t",
+      "f or",
+      "a y",
+      "r o",
+      "v er",
+      "i c",
+      "h er",
+      "k e",
+      "h is",
+      "n o",
+      "u t",
+      "u n",
+      "i r",
+      "l o",
+      "w e",
+      "r i",
+      "h a",
+      "wi th",
+      "gh t",
+      "ou t",
+      "i m",
+      "i on",
+      "al l",
+      "a b",
+      "on e",
+      "n e",
+      "g e",
+      "ou ld",
+      "t er",
+      "m o",
+      "h ad",
+      "c e",
+      "s he",
+      "g o",
+      "s h",
+      "u r",
+      "a m",
+      "s o",
+      "p e",
+      "m y",
+      "d e",
+      "a re",
+      "b ut",
+      "om e",
+      "f r",
+      "the r",
+      "f e",
+      "s u",
+      "d o",
+      "c on",
+      "t e",
+      "a in",
+      "er e",
+      "p o",
+      "i f",
+      "the y",
+      "u s",
+      "a g",
+      "t r",
+      "n ow",
+      "ou n",
+      "th is",
+      "ha ve",
+      "no t",
+      "s a",
+      "i l",
+      "u p",
+      "th ing",
+      "fr om",
+      "a p",
+      "h im",
+      "ac k",
+      "at ion",
+      "an t",
+      "ou r",
+      "o p",
+      "li ke",
+      "u st",
+      "es s",
+      "b o",
+      "o k",
+      "u l",
+      "in d",
+      "e x",
+      "c om",
+      "s ome",
+      "the re",
+      "er s",
+      "c o",
+      "re s",
+      "m an",
+      "ar d",
+      "p l",
+      "w or",
+      "w ay",
+      "ti on",
+      "f o",
+      "c a",
+      "w ere",
+      "b y",
+      "at e",
+      "p ro",
+      "t ed",
+      "oun d",
+      "ow n",
+      "w ould",
+      "t s",
+      "wh at",
+      "q u",
+      "al ly",
+      "i ght",
+      "c k",
+      "g r",
+      "wh en",
+      "v en",
+      "c an",
+      "ou gh",
+      "in e",
+      "en d",
+      "p er",
+      "ou s",
+      "o d",
+      "id e",
+      "k now",
+      "t y",
+      "ver y",
+      "s i",
+      "a k",
+      "wh o",
+      "ab out",
+      "i ll",
+      "the m",
+      "es t",
+      "re d",
+      "y e",
+      "c ould",
+      "on g",
+      "you r",
+      "the ir",
+      "e m",
+      "j ust",
+      "o ther",
+      "in to",
+      "an y",
+      "wh i",
+      "u m",
+      "t w",
+      "as t",
+      "d er",
+      "d id",
+      "i e",
+      "be en",
+      "ac e",
+      "in k",
+      "it y",
+      "b ack",
+      "t ing",
+      "b r",
+      "mo re",
+      "a ke",
+      "p p",
+      "the n",
+      "s p",
+      "e l",
+      "u se",
+      "b l",
+      "sa id",
+      "o ver",
+      "ge t",
+      "ɑ ː",
+      "i ː",
+      "u ː",
+      "ɜ ː",
+      "ɔ ː",
+      "o ː",
+      "e ɪ",
+      "o ʊ",
+      "a ɪ",
+      "a ʊ",
+      "ɔ ɪ",
+      "d ʒ",
+      "t ʃ",
+      "ɪ ŋ",
+      "ᵻ d",
+      "ˈ iː",
+      "ˌ iː",
+      "ˈ ɪ",
+      "ˌ ɪ",
+      "ˈ eɪ",
+      "ˌ eɪ",
+      "ˈ ɛ",
+      "ˌ ɛ",
+      "ˈ æ",
+      "ˌ æ",
+      "ˈ ɑː",
+      "ˌ ɑː",
+      "ˈ ɔː",
+      "ˌ ɔː",
+      "oː ɹ",
+      "ˈ oːɹ",
+      "ˌ oːɹ",
+      "ˈ oʊ",
+      "ˌ oʊ",
+      "ˈ ʊ",
+      "ˌ ʊ",
+      "ˈ uː",
+      "ˌ uː",
+      "ˈ ɜː",
+      "ˌ ɜː",
+      "ˈ ʌ",
+      "ˌ ʌ",
+      "ˈ aɪ",
+      "ˌ aɪ",
+      "ˈ aʊ",
+      "ˌ aʊ",
+      "ˈ ɔɪ",
+      "ˌ ɔɪ",
+      "ˈ ɚ",
+      "ˌ ɐ"
+    ]
+  }
+}
\ No newline at end of file
diff --git a/ve.pt b/ve.pt
new file mode 100644
index 0000000..0dc4fd5
--- /dev/null
+++ b/ve.pt
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bb3eff0c44056b0ff155fba8568eef9241e15e5c6d703f3de86f69ab56bc1e94
+size 132