Skip to content

Commit 412f395

Browse files
authored
Add Kimi Audio (#495)
* Fix React-Gradio file proxy missing slash
* add flash-attn installers
* add gitignore for kimi-audio
* add kimi audio experiment
* fix date, organize requirements
* reclassify kimi_audio as tools and add extension_kokoro_tts_api
* cleanup
1 parent d929cdc commit 412f395

File tree

5 files changed

+44
-1
lines changed

5 files changed

+44
-1
lines changed

.gitignore

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -40,6 +40,7 @@ extensions.external.json
4040
/data/models/ap_bwe/weights/
4141
/data/models/openvoice/
4242
/data/models/openvoice_v2/
43+
/data/models/kimi-audio/
4344

4445
# Ignore temporary files
4546
temp/

README.md

Lines changed: 7 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -80,6 +80,13 @@
8080

8181
## Changelog
8282

83+
May 6:
84+
* Add Kimi Audio 7B Instruct extension
85+
* Fix React-Gradio file proxy missing slash
86+
* Add Kokoro TTS API extension
87+
88+
## April 2025
89+
8390
Apr 25:
8491
* Add OpenVoice V2 extension
8592

extensions.json

Lines changed: 30 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -597,6 +597,36 @@
597597
"website": "https://github.com/myshell-ai/OpenVoice",
598598
"extension_website": "https://github.com/rsxdalv/extension_openvoice_v2",
599599
"extension_platform_version": "0.0.1"
600+
},
601+
{
602+
"package_name": "extension_kimi_audio",
603+
"name": "Kimi Audio",
604+
"version": "0.0.1",
605+
"requirements": "git+https://github.com/rsxdalv/extension_kimi_audio@main",
606+
"description": "Kimi Audio is a powerful text-to-speech and speech-to-text model by Moonshot AI",
607+
"extension_type": "interface",
608+
"extension_class": "tools",
609+
"author": "Moonshot AI",
610+
"extension_author": "rsxdalv",
611+
"license": "MIT",
612+
"website": "https://github.com/moonshotai/Kimi-Audio",
613+
"extension_website": "https://github.com/rsxdalv/extension_kimi_audio",
614+
"extension_platform_version": "0.0.1"
615+
},
616+
{
617+
"package_name": "extension_kokoro_tts_api",
618+
"name": "Kokoro TTS API",
619+
"version": "0.0.1",
620+
"requirements": "git+https://github.com/rsxdalv/extension_kokoro_tts_api@main",
621+
"description": "Kokoro TTS API is a text-to-speech model by hexgrad",
622+
"extension_type": "interface",
623+
"extension_class": "tools",
624+
"author": "hexgrad",
625+
"extension_author": "rsxdalv",
626+
"license": "MIT",
627+
"website": "https://huggingface.co/hexgrad/Kokoro-82M",
628+
"extension_website": "https://github.com/rsxdalv/extension_kokoro_tts_api",
629+
"extension_platform_version": "0.0.1"
600630
}
601631
],
602632
"decorators": [

requirements.txt

Lines changed: 5 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -15,8 +15,13 @@ fairseq @ https://github.com/rsxdalv/fairseq/releases/download/v0.12.3/fairseq-0
1515
fairseq @ https://github.com/rsxdalv/fairseq/releases/download/v0.12.3/fairseq-0.12.13-cp310-cp310-macosx_11_0_universal2.whl ; sys_platform == 'darwin' # MIT License
1616
accelerate>=0.33.0
1717
# optimum-quanto==0.2.6
18+
19+
# experimental
1820
# triton>=3.2.0 ; sys_platform == 'linux',
1921
# triton-windows>=3.2.0.post18 ; sys_platform == 'win32',
22+
# flash-attn @ https://github.com/kingbri1/flash-attention/releases/download/v2.7.4.post1/flash_attn-2.7.4.post1+cu124torch2.6.0cxx11abiFALSE-cp310-cp310-win_amd64.whl ; sys_platform == 'win32'
23+
# flash-attn @ https://github.com/Dao-AILab/flash-attention/releases/download/v2.7.4.post1/flash_attn-2.7.4.post1+cu12torch2.6cxx11abiFALSE-cp310-cp310-linux_x86_64.whl ; sys_platform == 'linux'
24+
2025

2126
extension_bark @ git+https://github.com/rsxdalv/extension_bark@main
2227
extension_tortoise @ git+https://github.com/rsxdalv/extension_tortoise@main

server.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -257,7 +257,7 @@ def signal_handler(signal, frame, postgres_process):
257257
"npm start --prefix react-ui",
258258
env={
259259
**os.environ,
260-
"GRADIO_BACKEND_AUTOMATIC": f"http://127.0.0.1:{gradio_interface_options['server_port']}",
260+
"GRADIO_BACKEND_AUTOMATIC": f"http://127.0.0.1:{gradio_interface_options['server_port']}/",
261261
},
262262
shell=True,
263263
)

0 commit comments

Comments
 (0)