ChaitanyaChandra committed on
Commit
69c8f4a
·
1 Parent(s): 83155e1

initial_commit

Browse files
Files changed (5) hide show
  1. Dockerfile +17 -0
  2. LICENSE +21 -0
  3. SECURITY.md +14 -0
  4. pyproject.toml +45 -0
  5. requirements.txt +17 -0
Dockerfile ADDED
@@ -0,0 +1,17 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ FROM python:3.10-slim
2
+ WORKDIR /app
3
+ RUN apt-get update && apt-get install -y --no-install-recommends \
4
+     libsndfile1 \
5
+     ffmpeg \
6
+     git \
7
+     && rm -rf /var/lib/apt/lists/*
8
+ # Install the Python dependencies before copying the source so this layer stays cached when only code changes.
9
+ COPY requirements.txt .
10
+ RUN pip install --no-cache-dir -r requirements.txt
11
+
12
+ # Copy the project and install it in editable mode; --no-cache-dir keeps pip's download cache out of the image.
13
+ COPY . .
14
+ RUN pip install --no-cache-dir -e .
15
+ EXPOSE 7860
16
+ WORKDIR /app/demo
17
+ CMD ["python3", "vibevoice_realtime_demo.py", "--model_path", "../models/VibeVoice-Realtime-0.5B", "--port", "7860", "--device", "cpu"]
LICENSE ADDED
@@ -0,0 +1,21 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ MIT License
2
+
3
+ Copyright (c) 2025 Microsoft
4
+
5
+ Permission is hereby granted, free of charge, to any person obtaining a copy
6
+ of this software and associated documentation files (the "Software"), to deal
7
+ in the Software without restriction, including without limitation the rights
8
+ to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
9
+ copies of the Software, and to permit persons to whom the Software is
10
+ furnished to do so, subject to the following conditions:
11
+
12
+ The above copyright notice and this permission notice shall be included in all
13
+ copies or substantial portions of the Software.
14
+
15
+ THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16
+ IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17
+ FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
18
+ AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19
+ LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20
+ OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
21
+ SOFTWARE.
SECURITY.md ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ <!-- BEGIN MICROSOFT SECURITY.MD V1.0.0 BLOCK -->
2
+
3
+ ## Security
4
+
5
+ Microsoft takes the security of our software products and services seriously, which
6
+ includes all source code repositories in our GitHub organizations.
7
+
8
+ **Please do not report security vulnerabilities through public GitHub issues.**
9
+
10
+ For security reporting information, locations, contact information, and policies,
11
+ please review the latest guidance for Microsoft repositories at
12
+ [https://aka.ms/SECURITY.md](https://aka.ms/SECURITY.md).
13
+
14
+ <!-- END MICROSOFT SECURITY.MD BLOCK -->
pyproject.toml ADDED
@@ -0,0 +1,45 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [build-system]
2
+ requires = ["setuptools>=61.0"]
3
+ build-backend = "setuptools.build_meta"
4
+
5
+ [project]
6
+ name = "vibevoice"
7
+ version = "0.0.1"
8
+ authors = [
9
+     { name = "vibevoice team", email = "[email protected]" },
10
+ ]
11
+ description = "A model for speech generation with an AR + diffusion architecture."
12
+ readme = "README.md"
13
+ requires-python = ">=3.9"
14
+ classifiers = [
15
+     "Programming Language :: Python :: 3",
16
+     # "License :: OSI Approved :: MIT License",
17
+     "Operating System :: OS Independent",
18
+ ]
19
+ dependencies = [
20
+     "torch",
21
+     "accelerate==1.6.0",
22
+     "transformers==4.51.3",  # developed against transformers==4.51.3; later versions may not be compatible
23
+     "llvmlite>=0.40.0",
24
+     "numba>=0.57.0",
25
+     "diffusers",
26
+     "tqdm",
27
+     "numpy",
28
+     "scipy",
29
+     "librosa",
30
+     "ml-collections",
31
+     "absl-py",
32
+     "gradio",
33
+     "av",
34
+     "aiortc",
35
+     "uvicorn[standard]",
36
+     "fastapi",
37
+ ]
38
+
39
+ # Links published in the package metadata.
40
+ [project.urls]
41
+ Homepage = "https://github.com/microsoft/VibeVoice"
42
+ "Bug Tracker" = "https://github.com/microsoft/VibeVoice/issues"
43
+
44
+ [tool.setuptools.packages.find]
45
+ where = ["."]  # start package discovery at the project root
requirements.txt ADDED
@@ -0,0 +1,17 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ torch
2
+ accelerate==1.6.0
3
+ transformers==4.51.3
4
+ llvmlite>=0.40.0
5
+ numba>=0.57.0
6
+ diffusers
7
+ tqdm
8
+ numpy
9
+ scipy
10
+ librosa
11
+ ml-collections
12
+ absl-py
13
+ gradio
14
+ av
15
+ aiortc
16
+ uvicorn[standard]
17
+ fastapi