Spaces:
Running
Running
Commit
·
69c8f4a
1
Parent(s):
83155e1
initial_commit
Browse files
- Dockerfile +17 -0
- LICENSE +21 -0
- SECURITY.md +14 -0
- pyproject.toml +45 -0
- requirements.txt +17 -0
Dockerfile
ADDED
|
@@ -0,0 +1,17 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
FROM python:3.10-slim
|
| 2 |
+
WORKDIR /app
|
| 3 |
+
RUN apt-get update && apt-get install -y \
|
| 4 |
+
libsndfile1 \
|
| 5 |
+
ffmpeg \
|
| 6 |
+
git \
|
| 7 |
+
&& rm -rf /var/lib/apt/lists/*
|
| 8 |
+
|
| 9 |
+
COPY requirements.txt .
|
| 10 |
+
RUN pip install --no-cache-dir -r requirements.txt
|
| 11 |
+
|
| 12 |
+
|
| 13 |
+
COPY . .
|
| 14 |
+
RUN pip install -e .
|
| 15 |
+
EXPOSE 7860
|
| 16 |
+
WORKDIR /app/demo
|
| 17 |
+
CMD ["python3", "vibevoice_realtime_demo.py", "--model_path", "../models/VibeVoice-Realtime-0.5B", "--port", "7860", "--device", "cpu"]
|
LICENSE
ADDED
|
@@ -0,0 +1,21 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
MIT License
|
| 2 |
+
|
| 3 |
+
Copyright (c) 2025 Microsoft
|
| 4 |
+
|
| 5 |
+
Permission is hereby granted, free of charge, to any person obtaining a copy
|
| 6 |
+
of this software and associated documentation files (the "Software"), to deal
|
| 7 |
+
in the Software without restriction, including without limitation the rights
|
| 8 |
+
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
| 9 |
+
copies of the Software, and to permit persons to whom the Software is
|
| 10 |
+
furnished to do so, subject to the following conditions:
|
| 11 |
+
|
| 12 |
+
The above copyright notice and this permission notice shall be included in all
|
| 13 |
+
copies or substantial portions of the Software.
|
| 14 |
+
|
| 15 |
+
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
| 16 |
+
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
| 17 |
+
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
| 18 |
+
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
| 19 |
+
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
| 20 |
+
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
|
| 21 |
+
SOFTWARE.
|
SECURITY.md
ADDED
|
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
<!-- BEGIN MICROSOFT SECURITY.MD V1.0.0 BLOCK -->
|
| 2 |
+
|
| 3 |
+
## Security
|
| 4 |
+
|
| 5 |
+
Microsoft takes the security of our software products and services seriously, which
|
| 6 |
+
includes all source code repositories in our GitHub organizations.
|
| 7 |
+
|
| 8 |
+
**Please do not report security vulnerabilities through public GitHub issues.**
|
| 9 |
+
|
| 10 |
+
For security reporting information, locations, contact information, and policies,
|
| 11 |
+
please review the latest guidance for Microsoft repositories at
|
| 12 |
+
[https://aka.ms/SECURITY.md](https://aka.ms/SECURITY.md).
|
| 13 |
+
|
| 14 |
+
<!-- END MICROSOFT SECURITY.MD BLOCK -->
|
pyproject.toml
ADDED
|
@@ -0,0 +1,45 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[build-system]
|
| 2 |
+
requires = ["setuptools>=61.0"]
|
| 3 |
+
build-backend = "setuptools.build_meta"
|
| 4 |
+
|
| 5 |
+
[project]
|
| 6 |
+
name = "vibevoice"
|
| 7 |
+
version = "0.0.1"
|
| 8 |
+
authors = [
|
| 9 |
+
{ name="vibevoice team", email="VibeVoice@microsoft.com" },
|
| 10 |
+
]
|
| 11 |
+
description = "A model for speech generation with an AR + diffusion architecture."
|
| 12 |
+
readme = "README.md"
|
| 13 |
+
requires-python = ">=3.9"
|
| 14 |
+
classifiers = [
|
| 15 |
+
"Programming Language :: Python :: 3",
|
| 16 |
+
# "License :: OSI Approved :: MIT License",
|
| 17 |
+
"Operating System :: OS Independent",
|
| 18 |
+
]
|
| 19 |
+
dependencies = [
|
| 20 |
+
"torch",
|
| 21 |
+
"accelerate==1.6.0",
|
| 22 |
+
"transformers==4.51.3", # this project is developed against transformers==4.51.3; later versions may not be compatible
|
| 23 |
+
"llvmlite>=0.40.0",
|
| 24 |
+
"numba>=0.57.0",
|
| 25 |
+
"diffusers",
|
| 26 |
+
"tqdm",
|
| 27 |
+
"numpy",
|
| 28 |
+
"scipy",
|
| 29 |
+
"librosa",
|
| 30 |
+
"ml-collections",
|
| 31 |
+
"absl-py",
|
| 32 |
+
"gradio",
|
| 33 |
+
"av",
|
| 34 |
+
"aiortc",
|
| 35 |
+
"uvicorn[standard]",
|
| 36 |
+
"fastapi"
|
| 37 |
+
]
|
| 38 |
+
|
| 39 |
+
|
| 40 |
+
[project.urls]
|
| 41 |
+
"Homepage" = "https://github.com/microsoft/VibeVoice"
|
| 42 |
+
"Bug Tracker" = "https://github.com/microsoft/VibeVoice/issues"
|
| 43 |
+
|
| 44 |
+
[tool.setuptools.packages.find]
|
| 45 |
+
where = ["."]
|
requirements.txt
ADDED
|
@@ -0,0 +1,17 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
torch
|
| 2 |
+
accelerate==1.6.0
|
| 3 |
+
transformers==4.51.3
|
| 4 |
+
llvmlite>=0.40.0
|
| 5 |
+
numba>=0.57.0
|
| 6 |
+
diffusers
|
| 7 |
+
tqdm
|
| 8 |
+
numpy
|
| 9 |
+
scipy
|
| 10 |
+
librosa
|
| 11 |
+
ml-collections
|
| 12 |
+
absl-py
|
| 13 |
+
gradio
|
| 14 |
+
av
|
| 15 |
+
aiortc
|
| 16 |
+
uvicorn[standard]
|
| 17 |
+
fastapi
|