csukuangfj committed on
Commit
72e7095
·
1 Parent(s): cd45a1d

Add kitten

Browse files
Files changed (1) hide show
  1. model.py +46 -0
model.py CHANGED
@@ -119,6 +119,51 @@ def _get_vits_ljs(repo_id: str, speed: float) -> sherpa_onnx.OfflineTts:
119
  return tts
120
 
121
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
122
  @lru_cache(maxsize=10)
123
  def _get_kokoro(repo_id: str, speed: float) -> sherpa_onnx.OfflineTts:
124
  data_dir = "/tmp/espeak-ng-data"
@@ -695,6 +740,7 @@ chinese_models = {
695
 
696
  english_models = {
697
  "csukuangfj/kokoro-en-v0_19|11 speakers": _get_kokoro,
 
698
  "csukuangfj/vits-piper-en_US-glados-high|1 speaker": _get_vits_piper,
699
  "csukuangfj/vits-piper-en_US-glados|1 speaker": _get_vits_piper,
700
  "csukuangfj/vits-piper-en_GB-southern_english_male-medium|8 speakers": _get_vits_piper,
 
119
  return tts
120
 
121
 
122
@lru_cache(maxsize=10)
def _get_kitten(repo_id: str, speed: float) -> sherpa_onnx.OfflineTts:
    """Create the sherpa-onnx offline TTS engine for the Kitten model.

    Results are memoized by ``lru_cache`` on the ``(repo_id, speed)``
    arguments exactly as passed in, keeping at most 10 entries.

    Args:
        repo_id: Model key. Anything from the first ``"|"`` onward (e.g. a
            ``"|8 speakers"`` suffix) is discarded before the repo is used.
        speed: Speech rate factor; the model's ``length_scale`` is set to
            ``1.0 / speed``.

    Returns:
        An ``sherpa_onnx.OfflineTts`` built from the model, tokens and
        voices files obtained through ``get_file``.

    Raises:
        AssertionError: If the repo is not
            ``csukuangfj/kitten-nano-en-v0_1-fp16``.
    """
    espeak_data_dir = "/tmp/espeak-ng-data"

    # Drop the human-readable suffix that follows the repo name.
    repo_id, *_ = repo_id.split("|")
    assert repo_id in ("csukuangfj/kitten-nano-en-v0_1-fp16",), repo_id

    # Fetch the three artifacts in the same order as before:
    # model, tokens, voices.
    model_path, tokens_path, voices_path = (
        get_file(repo_id=repo_id, filename=name, subfolder=".")
        for name in ("model.fp16.onnx", "tokens.txt", "voices.bin")
    )

    kitten_config = sherpa_onnx.OfflineTtsKittenModelConfig(
        model=model_path,
        voices=voices_path,
        tokens=tokens_path,
        data_dir=espeak_data_dir,
        length_scale=1.0 / speed,
    )

    model_config = sherpa_onnx.OfflineTtsModelConfig(
        kitten=kitten_config,
        provider="cpu",
        debug=True,
        num_threads=2,
    )

    return sherpa_onnx.OfflineTts(
        sherpa_onnx.OfflineTtsConfig(
            model=model_config,
            max_num_sentences=1,
        )
    )
165
+
166
+
167
  @lru_cache(maxsize=10)
168
  def _get_kokoro(repo_id: str, speed: float) -> sherpa_onnx.OfflineTts:
169
  data_dir = "/tmp/espeak-ng-data"
 
740
 
741
  english_models = {
742
  "csukuangfj/kokoro-en-v0_19|11 speakers": _get_kokoro,
743
+ "csukuangfj/kitten-nano-en-v0_1-fp16|8 speakers": _get_kitten,
744
  "csukuangfj/vits-piper-en_US-glados-high|1 speaker": _get_vits_piper,
745
  "csukuangfj/vits-piper-en_US-glados|1 speaker": _get_vits_piper,
746
  "csukuangfj/vits-piper-en_GB-southern_english_male-medium|8 speakers": _get_vits_piper,