Spaces:

decart-ai
/

lucy-edit-dev

Running on Zero

App Files Community

Make Enhance Prompt an option

by multimodalart HF Staff - opened Sep 18

base: refs/heads/main

←

from: refs/pr/3

Discussion Files changed

+38

-37

Files changed (4) hide show

.gitattributes +0 -2
app.py +38 -29
examples/neon.mp4 +0 -3
examples/painter.mp4 +0 -3

.gitattributes CHANGED Viewed

@@ -36,5 +36,3 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 examples/man_walking.mp4 filter=lfs diff=lfs merge=lfs -text
 examples/leopard.mp4 filter=lfs diff=lfs merge=lfs -text
 examples/woman.mp4 filter=lfs diff=lfs merge=lfs -text
-examples/neon.mp4 filter=lfs diff=lfs merge=lfs -text
-examples/painter.mp4 filter=lfs diff=lfs merge=lfs -text

 examples/man_walking.mp4 filter=lfs diff=lfs merge=lfs -text
 examples/leopard.mp4 filter=lfs diff=lfs merge=lfs -text
 examples/woman.mp4 filter=lfs diff=lfs merge=lfs -text

app.py CHANGED Viewed

@@ -18,20 +18,20 @@ def calculate_resolution(input_width, input_height, min_dimension=480, max_dimen
     # Ensure dimensions are multiples of the compatible rounding
     def round_to(x, compatible_round):
         return max(min_dimension, min(max_dimension, int(round(x / compatible_round) * compatible_round)))
     # Get aspect ratio
     aspect_ratio = input_width / input_height
     # Square videos (aspect ratio close to 1:1)
     if 0.98 <= aspect_ratio <= 1.02:
         return 640, 640
     # Landscape videos (width > height)
     elif aspect_ratio > 1:
         # Try to use max width
         new_width = max_dimension
         new_height = new_width / aspect_ratio
         # If height would be too small, use min height
         if new_height < min_dimension:
             new_height = min_dimension
@@ -39,15 +39,15 @@ def calculate_resolution(input_width, input_height, min_dimension=480, max_dimen
             # If width exceeds max, clamp it
             if new_width > max_dimension:
                 new_width = max_dimension
         return round_to(new_width, compatible_round), round_to(new_height, compatible_round)
     # Portrait videos (height > width)
     else:
         # Try to use max height
         new_height = max_dimension
         new_width = new_height * aspect_ratio
         # If width would be too small, use min width
         if new_width < min_dimension:
             new_width = min_dimension
@@ -55,7 +55,7 @@ def calculate_resolution(input_width, input_height, min_dimension=480, max_dimen
             # If height exceeds max, clamp it
             if new_height > max_dimension:
                 new_height = max_dimension
         return round_to(new_width, compatible_round), round_to(new_height, compatible_round)
@@ -64,6 +64,7 @@ def process_video(
     video_path,
     prompt,
     negative_prompt="",
     num_frames=81,
     auto_resize=True,
     manual_height=480,
@@ -74,12 +75,16 @@ def process_video(
     # Load and preprocess video
     progress(0.2, desc="Loading video...")
     # Get video dimensions
     temp_video = load_video(video_path)
     print(len(temp_video))
     if temp_video and len(temp_video) > 0:
         original_width, original_height = temp_video[0].size
         # Calculate dimensions
         if auto_resize:
             width, height = calculate_resolution(original_width, original_height)
@@ -87,7 +92,7 @@ def process_video(
             width, height = manual_width, manual_height
     else:
         raise gr.Error("Could not load video or video is empty")
     # Convert video function
     def convert_video(video: List[Image.Image]) -> List[Image.Image]:
         # Ensure we don't exceed the video length
@@ -96,14 +101,14 @@ def process_video(
         # Resize frames
         video_frames = [frame.resize((width, height)) for frame in video_frames]
         return video_frames
     # Load video from file path
     video = load_video(video_path, convert_method=convert_video)
     # Ensure we have the right number of frames
     if len(video) < num_frames:
         num_frames = len(video)
     # Generate edited video
     progress(0.5, desc="Generating edited video...")
     output = pipe(
@@ -115,14 +120,14 @@ def process_video(
         num_frames=num_frames,
         guidance_scale=guidance_scale,
     ).frames[0]
     # Export to temporary file
     progress(0.9, desc="Exporting video...")
     with tempfile.NamedTemporaryFile(delete=False, suffix=".mp4") as tmp_file:
         output_path = tmp_file.name
     export_to_video(output, output_path, fps=24)
     progress(1.0, desc="Complete!")
     return output_path
@@ -141,19 +146,21 @@ with gr.Blocks(title="Lucy Edit - Video Editing with Text", css=css) as demo:
   &nbsp;|&nbsp; 📑 <a href="#">arXiv (Coming soon)</a>
   &nbsp;|&nbsp; 💬 <a href="https://discord.gg/decart">Discord</a>
 </p>""")
     with gr.Row():
         with gr.Column(scale=1):
             # Input controls
             video_input = gr.Video(label="Input Video")
             prompt = gr.Textbox(
                 label="Edit Prompt",
                 placeholder="Describe what you want to change in the video...",
                 lines=3
             )
             with gr.Accordion("Advanced Settings", open=False):
                 negative_prompt = gr.Textbox(
                     label="Negative Prompt (optional)",
                     placeholder="Describe what you DON'T want in the video...",
@@ -164,7 +171,7 @@ with gr.Blocks(title="Lucy Edit - Video Editing with Text", css=css) as demo:
                     value=True,
                     info="Automatically calculate dimensions based on input video"
                 )
                 num_frames = gr.Slider(
                     label="Number of Frames",
                     minimum=1,
@@ -173,7 +180,7 @@ with gr.Blocks(title="Lucy Edit - Video Editing with Text", css=css) as demo:
                     step=1,
                     info="More frames = longer processing time"
                 )
                 with gr.Row():
                     manual_height = gr.Slider(
                         label="Height (when auto-resize is off)",
@@ -189,7 +196,7 @@ with gr.Blocks(title="Lucy Edit - Video Editing with Text", css=css) as demo:
                         value=832,
                         step=32
                     )
                 guidance_scale = gr.Slider(
                     label="Guidance Scale",
                     minimum=1.0,
@@ -198,23 +205,24 @@ with gr.Blocks(title="Lucy Edit - Video Editing with Text", css=css) as demo:
                     step=0.5,
                     info="Higher values follow the prompt more strictly"
                 )
             generate_btn = gr.Button("Edit Video", variant="primary")
         with gr.Column(scale=1):
-            video_output = gr.Video(label="Edited Video", autoplay=True)
     gr.Examples(
         examples=[
-            ["examples/neon.mp4", "Add a colorful scarlet macaw parrot perched on the man's left shoulder, bright red and blue wing feathers with yellow accents, curved black beak, intelligent dark eyes, talons gripping fabric naturally, long tail feathers extending downward, glossy plumage catching light, slight wing adjustment for balance, natural weight distribution, soft shadow beneath bird."],
-            ["examples/painter.mp4",  "Change the hair color to platinum blonde with natural highlights, subtle root shadowing, silky texture, gentle waves, soft shine, dimensional tones, strand definition, natural movement, professional color treatment, salon-quality finish, light-catching shimmer, varied blonde shades from honey to ash, realistic color gradation, healthy glossy appearance, volumetric lighting interaction."],
         ],
         inputs=[video_input, prompt],
         outputs=video_output,
         fn=process_video,
         cache_examples="lazy",
     )
     # Event handlers
     generate_btn.click(
         fn=process_video,
@@ -222,6 +230,7 @@ with gr.Blocks(title="Lucy Edit - Video Editing with Text", css=css) as demo:
             video_input,
             prompt,
             negative_prompt,
             num_frames,
             auto_resize,
             manual_height,
@@ -232,4 +241,4 @@ with gr.Blocks(title="Lucy Edit - Video Editing with Text", css=css) as demo:
     )
 if __name__ == "__main__":
-    demo.launch(share=True)

     # Ensure dimensions are multiples of the compatible rounding
     def round_to(x, compatible_round):
         return max(min_dimension, min(max_dimension, int(round(x / compatible_round) * compatible_round)))
     # Get aspect ratio
     aspect_ratio = input_width / input_height
     # Square videos (aspect ratio close to 1:1)
     if 0.98 <= aspect_ratio <= 1.02:
         return 640, 640
     # Landscape videos (width > height)
     elif aspect_ratio > 1:
         # Try to use max width
         new_width = max_dimension
         new_height = new_width / aspect_ratio
         # If height would be too small, use min height
         if new_height < min_dimension:
             new_height = min_dimension
             # If width exceeds max, clamp it
             if new_width > max_dimension:
                 new_width = max_dimension
         return round_to(new_width, compatible_round), round_to(new_height, compatible_round)
     # Portrait videos (height > width)
     else:
         # Try to use max height
         new_height = max_dimension
         new_width = new_height * aspect_ratio
         # If width would be too small, use min width
         if new_width < min_dimension:
             new_width = min_dimension
             # If height exceeds max, clamp it
             if new_height > max_dimension:
                 new_height = max_dimension
         return round_to(new_width, compatible_round), round_to(new_height, compatible_round)
     video_path,
     prompt,
     negative_prompt="",
+    enhance_prompt=True,
     num_frames=81,
     auto_resize=True,
     manual_height=480,
     # Load and preprocess video
     progress(0.2, desc="Loading video...")
+    if(enhance_prompt):
+        #add here the prompt enhancement API call
+        pass
     # Get video dimensions
     temp_video = load_video(video_path)
     print(len(temp_video))
     if temp_video and len(temp_video) > 0:
         original_width, original_height = temp_video[0].size
         # Calculate dimensions
         if auto_resize:
             width, height = calculate_resolution(original_width, original_height)
             width, height = manual_width, manual_height
     else:
         raise gr.Error("Could not load video or video is empty")
     # Convert video function
     def convert_video(video: List[Image.Image]) -> List[Image.Image]:
         # Ensure we don't exceed the video length
         # Resize frames
         video_frames = [frame.resize((width, height)) for frame in video_frames]
         return video_frames
     # Load video from file path
     video = load_video(video_path, convert_method=convert_video)
     # Ensure we have the right number of frames
     if len(video) < num_frames:
         num_frames = len(video)
     # Generate edited video
     progress(0.5, desc="Generating edited video...")
     output = pipe(
         num_frames=num_frames,
         guidance_scale=guidance_scale,
     ).frames[0]
     # Export to temporary file
     progress(0.9, desc="Exporting video...")
     with tempfile.NamedTemporaryFile(delete=False, suffix=".mp4") as tmp_file:
         output_path = tmp_file.name
     export_to_video(output, output_path, fps=24)
     progress(1.0, desc="Complete!")
     return output_path
   &nbsp;|&nbsp; 📑 <a href="#">arXiv (Coming soon)</a>
   &nbsp;|&nbsp; 💬 <a href="https://discord.gg/decart">Discord</a>
 </p>""")
     with gr.Row():
         with gr.Column(scale=1):
             # Input controls
             video_input = gr.Video(label="Input Video")
             prompt = gr.Textbox(
                 label="Edit Prompt",
                 placeholder="Describe what you want to change in the video...",
                 lines=3
             )
             with gr.Accordion("Advanced Settings", open=False):
+                enhance_prompt = gr.Checkbox(label="Enhance Prompt", value=True)
                 negative_prompt = gr.Textbox(
                     label="Negative Prompt (optional)",
                     placeholder="Describe what you DON'T want in the video...",
                     value=True,
                     info="Automatically calculate dimensions based on input video"
                 )
                 num_frames = gr.Slider(
                     label="Number of Frames",
                     minimum=1,
                     step=1,
                     info="More frames = longer processing time"
                 )
                 with gr.Row():
                     manual_height = gr.Slider(
                         label="Height (when auto-resize is off)",
                         value=832,
                         step=32
                     )
                 guidance_scale = gr.Slider(
                     label="Guidance Scale",
                     minimum=1.0,
                     step=0.5,
                     info="Higher values follow the prompt more strictly"
                 )
             generate_btn = gr.Button("Edit Video", variant="primary")
         with gr.Column(scale=1):
+            video_output = gr.Video(label="Edited Video")
     gr.Examples(
         examples=[
+            ["examples/man_walking.mp4", "make the man into an alien"],
+            ["examples/leopard.mp4",  "make the leopard into a lion"],
+            ["examples/woman.mp4", "make the woman's coat blue"],
         ],
         inputs=[video_input, prompt],
         outputs=video_output,
         fn=process_video,
         cache_examples="lazy",
     )
     # Event handlers
     generate_btn.click(
         fn=process_video,
             video_input,
             prompt,
             negative_prompt,
+            enhance_prompt,
             num_frames,
             auto_resize,
             manual_height,
     )
 if __name__ == "__main__":
+    demo.launch(share=True)

examples/neon.mp4 DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:e62dc89173956d4d22defac1d24f0835c8d8d0490f7969dd13b38429d69165ca
-size 3182890

examples/painter.mp4 DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:37b385068db4c25d8f29104580b3267a4fafc2afbd4235f57a206a587a16e56f
-size 2941421