# Patch summary (free-form text ahead of the first "diff --git" header).
#
# 1. .gitmodules: switch the kimia_infer/models/tokenizer/glm4 submodule URL
#    from https://github.com/THUDM/GLM-4-Voice.git to
#    https://github.com/rsxdalv/GLM-4-Voice.git and add
#    "branch = speech_tokenizer".
# 2. Add __init__.py files (no content hunks) under
#    kimia_infer/models/detokenizer/flow_matching,
#    kimia_infer/models/detokenizer/vocoder and
#    kimia_infer/models/tokenizer/whisper_Lv3 -- presumably so that the
#    find_packages() call in the new setup.py picks these directories up;
#    confirm against the intended package layout.
# 3. Move the glm4 submodule pointer from commit eb00ce9 to commit 4a3ff00.
# 4. Add setup.py: package "kimia_infer" 0.1.6, packages discovered with
#    find_packages(), the runtime dependency list, the CUDA sources
#    (cuda/*.h, cuda/*.cu, cuda/*.cpp) of
#    kimia_infer.models.detokenizer.vocoder.alias_free_activation shipped as
#    package data, and python_requires ">=3.8".
#
# NOTE(review): leading whitespace inside the hunk lines below is assumed
# (tab in .gitmodules, four spaces in setup.py) -- TODO confirm against the
# target tree; if the .gitmodules hunk does not match, retry with
# `git apply --ignore-whitespace`.
diff --git a/.gitmodules b/.gitmodules
index 4831b09..9a8a7b3 100644
--- a/.gitmodules
+++ b/.gitmodules
@@ -1,3 +1,4 @@
 [submodule "kimia_infer/models/tokenizer/glm4"]
 	path = kimia_infer/models/tokenizer/glm4
-	url = https://github.com/THUDM/GLM-4-Voice.git
+	url = https://github.com/rsxdalv/GLM-4-Voice.git
+	branch = speech_tokenizer
diff --git a/kimia_infer/models/detokenizer/flow_matching/__init__.py b/kimia_infer/models/detokenizer/flow_matching/__init__.py
new file mode 100644
index 0000000..e69de29
diff --git a/kimia_infer/models/detokenizer/vocoder/__init__.py b/kimia_infer/models/detokenizer/vocoder/__init__.py
new file mode 100644
index 0000000..e69de29
diff --git a/kimia_infer/models/tokenizer/glm4 b/kimia_infer/models/tokenizer/glm4
index eb00ce9..4a3ff00 160000
--- a/kimia_infer/models/tokenizer/glm4
+++ b/kimia_infer/models/tokenizer/glm4
@@ -1 +1 @@
-Subproject commit eb00ce9142e8d98b0ed7c57cd47e0d6d5dce9a1a
+Subproject commit 4a3ff00a81b37008a66788904f6f8c084263b85c
diff --git a/kimia_infer/models/tokenizer/whisper_Lv3/__init__.py b/kimia_infer/models/tokenizer/whisper_Lv3/__init__.py
new file mode 100644
index 0000000..e69de29
diff --git a/setup.py b/setup.py
new file mode 100644
index 0000000..2902d4e
--- /dev/null
+++ b/setup.py
@@ -0,0 +1,60 @@
+from setuptools import setup, find_packages
+
+setup(
+    name="kimia_infer",
+    version="0.1.6",
+    description="Kimi-Audio inference and toolkit package.",
+    author="Moonshot AI",
+    packages=find_packages(),
+    install_requires=[
+        "torch>=2.4.1",
+        "torchaudio>=2.4.1",
+        "packaging",
+        "jinja2",
+        "openai-whisper",
+        "jsonlines",
+        "pandas",
+        "validators",
+        "sty",
+        "transformers",
+        "librosa",
+        "accelerate",
+        "aiohttp",
+        "colorama",
+        "omegaconf>=2.3.0",
+        "sox",
+        "six>=1.16.0",
+        "hyperpyyaml",
+        "conformer>=0.3.2",
+        "diffusers",
+        "pillow",
+        "sentencepiece",
+        "easydict",
+        "fire",
+        "ujson",
+        "cairosvg",
+        "immutabledict",
+        "rich",
+        "wget",
+        "gdown",
+        "datasets",
+        "torchdyn>=1.0.6",
+        "huggingface_hub",
+        "loguru",
+        "decord",
+        "blobfile",
+        "timm",
+        "sacrebleu>=1.5.1",
+        "soundfile",
+        "tqdm"
+    ],
+    include_package_data=True,
+    package_data={
+        'kimia_infer.models.detokenizer.vocoder.alias_free_activation': [
+            'cuda/*.h',
+            'cuda/*.cu',
+            'cuda/*.cpp'
+        ]
+    },
+    python_requires=">=3.8",
+)