TTS-ORG
/

OmniVoice_sync_data_and_code

Model card Files Files and versions

Metrics Training metrics Community

OmniVoice_sync_data_and_code / pyproject.toml

Abdelrahman2922's picture

Abdelrahman2922

Add files using upload-large-folder tool

a4d9876 verified 26 days ago

history blame contribute delete

2.69 kB

	# PEP 517 build configuration: the project is built with hatchling.
	[build-system]
	build-backend = "hatchling.build"
	requires = ["hatchling"]

	# Core package metadata.
	[project]
	name = "omnivoice"
	version = "0.1.5"
	description = "OmniVoice: Towards Omnilingual Zero-Shot Text-to-Speech with Diffusion Language Models"
	readme = "README.md"
	requires-python = ">=3.10"
	license = "Apache-2.0"
	authors = [
	    { name = "Han Zhu" },
	]
	keywords = [
	    "tts",
	    "text-to-speech",
	    "speech-synthesis",
	    "zero-shot",
	    "multilingual",
	    "diffusion",
	    "voice-cloning",
	]
	classifiers = [
	    # Audience
	    "Intended Audience :: Science/Research",
	    "Intended Audience :: Developers",
	    # Topics
	    "Topic :: Scientific/Engineering :: Artificial Intelligence",
	    "Topic :: Multimedia :: Sound/Audio :: Speech",
	    # Platform / language
	    "Operating System :: OS Independent",
	    "Programming Language :: Python :: 3",
	]
	# Runtime requirements. torch and torchaudio are listed explicitly (with a
	# lower bound only) so that the `[tool.uv.sources]` entries for them apply.
	dependencies = [
	    "torch>=2.4",
	    "torchaudio>=2.4",
	    "transformers>=5.3.0",
	    "accelerate",
	    "pydub",
	    "gradio",
	    "tensorboardX",
	    "webdataset",
	    "numpy",
	    "soundfile",
	    "librosa",
	    "uvicorn>=0.42.0",
	    "fastapi>=0.135.2",
	]

	# Optional extras; `eval` groups the packages used for evaluation.
	[project.optional-dependencies]
	eval = [
	    # WER
	    "jiwer==3.1.0",
	    # Speech representation (HuBERT etc.)
	    "s3prl",
	    # ASR models
	    "funasr",
	    # Chinese character normalization
	    "zhconv",
	    # Chinese punctuation
	    "zhon",
	    # Unicode normalization
	    "unidecode",
	]

	# Command-line entry points: each key is the installed command name and each
	# value is the `module:function` it invokes.
	[project.scripts]
	omnivoice-infer = "omnivoice.cli.infer:main"
	omnivoice-infer-batch = "omnivoice.cli.infer_batch:main"
	omnivoice-demo = "omnivoice.cli.demo:main"

	# Project links published with the package metadata.
	[project.urls]
	Homepage = "https://github.com/k2-fsa/OmniVoice"
	Repository = "https://github.com/k2-fsa/OmniVoice"
	# Quoted because the label contains a space, which a bare key cannot.
	"Bug Tracker" = "https://github.com/k2-fsa/OmniVoice/issues"

	# uv configuration. The parent table is declared first, followed by its
	# sub-tables, so the section reads top-down.
	[tool.uv]
	# `[project].dependencies` only sets a lower bound (>=2.4) for the PyTorch
	# stack; these constraints fix the versions uv resolves to.
	constraint-dependencies = [
	    "torch==2.8.0",
	    "torchaudio==2.8.0",
	]

	[tool.uv.sources]
	# Install PyTorch with CUDA support on Linux/Windows (there are no CUDA builds
	# for macOS).
	# NOTE: torch and torchaudio must be listed explicitly in
	# `[project].dependencies`. These index overrides are not applied to packages
	# that are only pulled in as transitive dependencies.
	torch = [
	    { index = "pytorch-cuda", marker = "sys_platform == 'linux' or sys_platform == 'win32'" },
	]
	torchaudio = [
	    { index = "pytorch-cuda", marker = "sys_platform == 'linux' or sys_platform == 'win32'" },
	]

	[[tool.uv.index]]
	name = "pytorch-cuda"
	# Use PyTorch wheels built for CUDA Toolkit version 12.8.
	# Available versions: https://pytorch.org/get-started/locally/
	url = "https://download.pytorch.org/whl/cu128"
	# Only use this index when explicitly requested by `tool.uv.sources`.
	explicit = true

	# Hatch build targets: both distributions are built from the `omnivoice`
	# directory.
	[tool.hatch.build.targets.wheel]
	packages = ["omnivoice"]

	[tool.hatch.build.targets.sdist]
	include = ["omnivoice"]