Spaces: Running on Zero
update app
Browse files
app.py
CHANGED
|
@@ -146,7 +146,7 @@ tts_processor = VibeVoiceStreamingProcessor.from_pretrained(TTS_MODEL_PATH)
|
|
| 146 |
tts_model = VibeVoiceStreamingForConditionalGenerationInference.from_pretrained(
|
| 147 |
TTS_MODEL_PATH,
|
| 148 |
torch_dtype=torch.float16,
|
| 149 |
-
device_map="
|
| 150 |
attn_implementation="sdpa",
|
| 151 |
)
|
| 152 |
tts_model.eval()
|
|
@@ -350,7 +350,7 @@ image_examples = [
|
|
| 350 |
["Extract the contents. [page].", "examples/2.jpg"],
|
| 351 |
]
|
| 352 |
|
| 353 |
-
with gr.Blocks(
|
| 354 |
gr.Markdown("# **Vision-to-VibeVoice-en**", elem_id="main-title")
|
| 355 |
|
| 356 |
with gr.Row():
|
|
|
|
| 146 |
tts_model = VibeVoiceStreamingForConditionalGenerationInference.from_pretrained(
|
| 147 |
TTS_MODEL_PATH,
|
| 148 |
torch_dtype=torch.float16,
|
| 149 |
+
device_map="cuda",
|
| 150 |
attn_implementation="sdpa",
|
| 151 |
)
|
| 152 |
tts_model.eval()
|
|
|
|
| 350 |
["Extract the contents. [page].", "examples/2.jpg"],
|
| 351 |
]
|
| 352 |
|
| 353 |
+
with gr.Blocks() as demo:
|
| 354 |
gr.Markdown("# **Vision-to-VibeVoice-en**", elem_id="main-title")
|
| 355 |
|
| 356 |
with gr.Row():
|