Spaces:
Running
on
Zero
Running
on
Zero
Commit
·
c2d6fd3
1
Parent(s):
97a5f5d
12 examples test
Browse files
- app.py +19 -5
- assets/bowl.mp4 +3 -0
- assets/dog.mp4 +3 -0
- assets/fruit.mp4 +3 -0
- assets/gameplay.mp4 +3 -0
- assets/greenhouse.mp4 +3 -0
- assets/ketchup.mp4 +3 -0
- assets/office.mp4 +3 -0
- assets/old_man.mp4 +3 -0
- assets/pants.mp4 +3 -0
- assets/teaser_test.json +73 -13
- assets/three_people.mp4 +3 -0
- videox_fun/ui/ui.py +2 -1
app.py
CHANGED
|
@@ -137,7 +137,7 @@ class VideoCoF_Controller(Wan_Controller):
|
|
| 137 |
reasoning_frames_slider=4,
|
| 138 |
repeat_rope_checkbox=True,
|
| 139 |
# New arg for acceleration
|
| 140 |
-
enable_acceleration=
|
| 141 |
fps=8,
|
| 142 |
is_api=False,
|
| 143 |
):
|
|
@@ -337,7 +337,7 @@ def ui(GPU_memory_mode, scheduler_dict, config_path, compile_dit, weight_dtype):
|
|
| 337 |
reasoning_frames_slider = gr.Slider(label="Reasoning Frames", minimum=1, maximum=20, value=4, step=1)
|
| 338 |
repeat_rope_checkbox = gr.Checkbox(label="Repeat RoPE", value=True)
|
| 339 |
# Add Acceleration Checkbox
|
| 340 |
-
enable_acceleration = gr.Checkbox(label="Enable 4-step Acceleration (FusionX LoRA)", value=
|
| 341 |
|
| 342 |
# Use custom height/width creation to hide/customize
|
| 343 |
resize_method, width_slider, height_slider, base_resolution = create_height_width_english(
|
|
@@ -354,11 +354,25 @@ def ui(GPU_memory_mode, scheduler_dict, config_path, compile_dit, weight_dtype):
|
|
| 354 |
|
| 355 |
# Simplified input for VideoCoF - mainly Video to Video.
|
| 356 |
image_to_video_col, video_to_video_col, control_video_col, source_method, start_image, template_gallery, end_image, validation_video, validation_video_mask, denoise_strength, control_video, ref_image = create_generation_method(
|
| 357 |
-
["Video to Video"],
|
|
|
|
|
|
|
|
|
|
| 358 |
video_examples=[
|
| 359 |
["assets/two_man.mp4", "Remove the young man with short black hair wearing black shirt on the left."],
|
| 360 |
-
["assets/
|
| 361 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 362 |
)
|
| 363 |
|
| 364 |
# Ensure validation_video is visible and interactive
|
|
|
|
| 137 |
reasoning_frames_slider=4,
|
| 138 |
repeat_rope_checkbox=True,
|
| 139 |
# New arg for acceleration
|
| 140 |
+
enable_acceleration=True,
|
| 141 |
fps=8,
|
| 142 |
is_api=False,
|
| 143 |
):
|
|
|
|
| 337 |
reasoning_frames_slider = gr.Slider(label="Reasoning Frames", minimum=1, maximum=20, value=4, step=1)
|
| 338 |
repeat_rope_checkbox = gr.Checkbox(label="Repeat RoPE", value=True)
|
| 339 |
# Add Acceleration Checkbox
|
| 340 |
+
enable_acceleration = gr.Checkbox(label="Enable 4-step Acceleration (FusionX LoRA)", value=True)
|
| 341 |
|
| 342 |
# Use custom height/width creation to hide/customize
|
| 343 |
resize_method, width_slider, height_slider, base_resolution = create_height_width_english(
|
|
|
|
| 354 |
|
| 355 |
# Simplified input for VideoCoF - mainly Video to Video.
|
| 356 |
image_to_video_col, video_to_video_col, control_video_col, source_method, start_image, template_gallery, end_image, validation_video, validation_video_mask, denoise_strength, control_video, ref_image = create_generation_method(
|
| 357 |
+
["Video to Video"],
|
| 358 |
+
prompt_textbox,
|
| 359 |
+
support_end_image=False,
|
| 360 |
+
default_video="assets/two_man.mp4",
|
| 361 |
video_examples=[
|
| 362 |
["assets/two_man.mp4", "Remove the young man with short black hair wearing black shirt on the left."],
|
| 363 |
+
["assets/three_people.mp4", "Remove the man with short dark hair wearing a gray suit on the right"],
|
| 364 |
+
["assets/office.mp4", "Remove the beige CRT computer setup."],
|
| 365 |
+
["assets/woman_ballon.mp4", "Add the woman in a floral dress pointing at the balloon on the left."],
|
| 366 |
+
["assets/greenhouse.mp4", "A white Samoyed is watching the man, who crouches in a greenhouse. The Samoyed is covered in thick, fluffy white fur, giving it a very soft and plush appearance. Its ears are erect and triangular, making it look alert and intelligent. The Samoyed's face features its signature smile, with bright black eyes that convey friendliness and curiosity."],
|
| 367 |
+
["assets/gameplay.mp4", "Add the woman holding the blue game controller to the left of the man, engaged in gameplay."],
|
| 368 |
+
["assets/dog.mp4", "Add the brown and white beagle interacting with and drinking from the metallic bowl on the wooden floor."],
|
| 369 |
+
["assets/sign.mp4", "Replace the yellow \"SCHOOL\" sign with a red hospital sign, featuring a white hospital emblem on the top and the word \"HOSPITAL\" below."],
|
| 370 |
+
["assets/old_man.mp4", "Swap the old man with long white hair and a blue checkered shirt at the left side of the frame with a woman with curly brown hair and a denim shirt."],
|
| 371 |
+
["assets/pants.mp4", "swap the white pants worn by the individual the light blue jeans."],
|
| 372 |
+
["assets/bowl.mp4", "Make the largest cup on the right white and smooth."],
|
| 373 |
+
["assets/ketchup.mp4", "Make the ketchup bottle to the right of the BBQ sauce bottle violet color."],
|
| 374 |
+
["assets/fruit.mp4", "Make the pomegranate at the right side of the basket lavender color."]
|
| 375 |
+
],
|
| 376 |
)
|
| 377 |
|
| 378 |
# Ensure validation_video is visible and interactive
|
assets/bowl.mp4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8a5eabc70819e2f38bcbe00bcedacca504d1d6fa8947b065f8ed6db3f3beca4e
|
| 3 |
+
size 110870
|
assets/dog.mp4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2f0186100a5c50a360138bb8c1fbf2dc5183540fe1bdd6cef69588736fbdd56b
|
| 3 |
+
size 150554
|
assets/fruit.mp4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:df32c3d87501138a12f2dd7246bf6cf143d5b7bfbfe0f2b6e7f8bec372416eaa
|
| 3 |
+
size 95209
|
assets/gameplay.mp4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2356c2037dd49d31c7417201f0c640998385731c2c1cbe0aae70472f285f09a9
|
| 3 |
+
size 99302
|
assets/greenhouse.mp4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:97e1cfdb33a56f67b2a94140d5cfe8c0d79f5a060bbb00088e218d2813732650
|
| 3 |
+
size 929837
|
assets/ketchup.mp4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2dd7b6b770e3c68fc8ae2969942b1819eb039b207a8560fd58dd40fbe1846ab3
|
| 3 |
+
size 134873
|
assets/office.mp4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bca3c3764accff6f8b30f369ecbac4f42c3264b3258d0a9a87e23cfeb34a900a
|
| 3 |
+
size 149972
|
assets/old_man.mp4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d40af0ec801bf0588b44de78a54ab7400ba741f7da076aac2f56e4407f8823f4
|
| 3 |
+
size 157209
|
assets/pants.mp4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0405672ded659ed6dc15d0b0b708e370f295a012e96fddb1750dbafb1865d602
|
| 3 |
+
size 191056
|
assets/teaser_test.json
CHANGED
|
@@ -1,20 +1,80 @@
|
|
| 1 |
[
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 2 |
{
|
| 3 |
"task_type": "obj_add",
|
| 4 |
"sample_id": "001",
|
| 5 |
"source_video_path": "assets/woman_ballon.mp4",
|
| 6 |
"qwen_vl_72b_refined_instruction": "Add the woman in a floral dress pointing at the balloon on the left."
|
| 7 |
-
|
| 8 |
-
|
| 9 |
-
|
| 10 |
-
|
| 11 |
-
|
| 12 |
-
|
| 13 |
-
|
| 14 |
-
|
| 15 |
-
|
| 16 |
-
|
| 17 |
-
|
| 18 |
-
|
| 19 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 20 |
]
|
|
|
|
| 1 |
[
|
| 2 |
+
{
|
| 3 |
+
"task_type": "obj_rem",
|
| 4 |
+
"sample_id": "001",
|
| 5 |
+
"source_video_path": "assets/two_man.mp4",
|
| 6 |
+
"qwen_vl_72b_refined_instruction": "Remove the young man with short black hair wearing black shirt on the left."
|
| 7 |
+
},
|
| 8 |
+
{
|
| 9 |
+
"task_type": "obj_rem",
|
| 10 |
+
"sample_id": "002",
|
| 11 |
+
"source_video_path": "assets/three_people.mp4",
|
| 12 |
+
"qwen_vl_72b_refined_instruction": "Remove the man with short dark hair wearing a gray suit on the right"
|
| 13 |
+
},
|
| 14 |
+
{
|
| 15 |
+
"task_type": "obj_rem",
|
| 16 |
+
"sample_id": "003",
|
| 17 |
+
"source_video_path": "assets/office.mp4",
|
| 18 |
+
"qwen_vl_72b_refined_instruction": "Remove the beige CRT computer setup."
|
| 19 |
+
},
|
| 20 |
{
|
| 21 |
"task_type": "obj_add",
|
| 22 |
"sample_id": "001",
|
| 23 |
"source_video_path": "assets/woman_ballon.mp4",
|
| 24 |
"qwen_vl_72b_refined_instruction": "Add the woman in a floral dress pointing at the balloon on the left."
|
| 25 |
+
},
|
| 26 |
+
{
|
| 27 |
+
"task_type": "obj_add",
|
| 28 |
+
"sample_id": "002",
|
| 29 |
+
"source_video_path": "assets/greenhouse.mp4",
|
| 30 |
+
"qwen_vl_72b_refined_instruction": "A white Samoyed is watching the man, who crouches in a greenhouse. The Samoyed is covered in thick, fluffy white fur, giving it a very soft and plush appearance. Its ears are erect and triangular, making it look alert and intelligent. The Samoyed's face features its signature smile, with bright black eyes that convey friendliness and curiosity."
|
| 31 |
+
},
|
| 32 |
+
{
|
| 33 |
+
"task_type": "obj_add",
|
| 34 |
+
"sample_id": "003",
|
| 35 |
+
"source_video_path": "assets/gameplay.mp4",
|
| 36 |
+
"qwen_vl_72b_refined_instruction": "Add the woman holding the blue game controller to the left of the man, engaged in gameplay."
|
| 37 |
+
},
|
| 38 |
+
{
|
| 39 |
+
"task_type": "obj_add",
|
| 40 |
+
"sample_id": "004",
|
| 41 |
+
"source_video_path": "assets/dog.mp4",
|
| 42 |
+
"qwen_vl_72b_refined_instruction": "Add the brown and white beagle interacting with and drinking from the metallic bowl on the wooden floor."
|
| 43 |
+
},
|
| 44 |
+
{
|
| 45 |
+
"task_type": "obj_swap",
|
| 46 |
+
"sample_id": "001",
|
| 47 |
+
"source_video_path": "assets/sign.mp4",
|
| 48 |
+
"qwen_vl_72b_refined_instruction": "Replace the yellow \"SCHOOL\" sign with a red hospital sign, featuring a white hospital emblem on the top and the word \"HOSPITAL\" below."
|
| 49 |
+
},
|
| 50 |
+
{
|
| 51 |
+
"task_type": "obj_swap",
|
| 52 |
+
"sample_id": "002",
|
| 53 |
+
"source_video_path": "assets/old_man.mp4",
|
| 54 |
+
"qwen_vl_72b_refined_instruction": "Swap the old man with long white hair and a blue checkered shirt at the left side of the frame with a woman with curly brown hair and a denim shirt."
|
| 55 |
+
},
|
| 56 |
+
{
|
| 57 |
+
"task_type": "obj_swap",
|
| 58 |
+
"sample_id": "003",
|
| 59 |
+
"source_video_path": "assets/pants.mp4",
|
| 60 |
+
"qwen_vl_72b_refined_instruction": "swap the white pants worn by the individual the light blue jeans."
|
| 61 |
+
},
|
| 62 |
+
{
|
| 63 |
+
"task_type": "local_style",
|
| 64 |
+
"sample_id": "001",
|
| 65 |
+
"source_video_path": "assets/bowl.mp4",
|
| 66 |
+
"qwen_vl_72b_refined_instruction": "Make the largest cup on the right white and smooth."
|
| 67 |
+
},
|
| 68 |
+
{
|
| 69 |
+
"task_type": "local_style",
|
| 70 |
+
"sample_id": "002",
|
| 71 |
+
"source_video_path": "assets/ketchup.mp4",
|
| 72 |
+
"qwen_vl_72b_refined_instruction": "Make the ketchup bottle to the right of the BBQ sauce bottle violet color."
|
| 73 |
+
},
|
| 74 |
+
{
|
| 75 |
+
"task_type": "local_style",
|
| 76 |
+
"sample_id": "003",
|
| 77 |
+
"source_video_path": "assets/fruit.mp4",
|
| 78 |
+
"qwen_vl_72b_refined_instruction": "Make the pomegranate at the right side of the basket lavender color."
|
| 79 |
+
}
|
| 80 |
]
|
assets/three_people.mp4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b3c8a49ff5e5b8ec439734b9108eb4e0791c0486fc9c0e1d1bcb440f8febbfe1
|
| 3 |
+
size 549213
|
videox_fun/ui/ui.py
CHANGED
|
@@ -291,7 +291,8 @@ def create_generation_method(source_method_options, prompt_textbox, support_end_
|
|
| 291 |
gr.Examples(
|
| 292 |
examples=video_examples,
|
| 293 |
inputs=[validation_video, prompt_textbox] if len(video_examples[0]) > 1 else validation_video,
|
| 294 |
-
label="Video Examples"
|
|
|
|
| 295 |
)
|
| 296 |
|
| 297 |
# Mask accordion removed (or hidden) per user request. User said "mask这个不需要" ("the mask is not needed").
|
|
|
|
| 291 |
gr.Examples(
|
| 292 |
examples=video_examples,
|
| 293 |
inputs=[validation_video, prompt_textbox] if len(video_examples[0]) > 1 else validation_video,
|
| 294 |
+
label="Video Examples",
|
| 295 |
+
examples_per_page=6,
|
| 296 |
)
|
| 297 |
|
| 298 |
# Mask accordion removed (or hidden) per user request. User said "mask这个不需要" ("the mask is not needed").
|