Spaces:

alvinichi
/

imageToVideo

Running

App Files Community

alvinichi committed on Apr 17

Commit

da92cbc

1 Parent(s): dd1db02

update lib

Browse files

Files changed (2) hide show

app.py +79 -41
requirements.txt +1 -6

app.py CHANGED Viewed

@@ -1,19 +1,17 @@
 import gradio as gr
 import torch
-from transformers import pipeline
-from huggingface_hub import hf_hub_download
 import os
 from PIL import Image
 import numpy as np
-from moviepy.editor import ImageSequenceClip
 import time
-# Kiểm tra xem có GPU không
 device = "cuda" if torch.cuda.is_available() else "cpu"
 print(f"Using device: {device}")
-# Sử dụng mô hình text-to-video thay thế
-def generate_video(image, prompt, num_frames=16, guidance_scale=7.5):
     if image is None:
         return None, "Vui lòng tải lên một hình ảnh"
@@ -25,36 +23,72 @@ def generate_video(image, prompt, num_frames=16, guidance_scale=7.5):
     image = image.resize((512, 512))
     try:
-        # Lưu hình ảnh tạm thời
-        image_path = "input_image.jpg"
-        image.save(image_path)
-        # Tạo chuỗi khung hình đơn giản (hiệu ứng zoom-in)
         frames = []
-        for i in range(num_frames):
-            # Tạo hiệu ứng zoom
-            zoom_factor = 1.0 + (i / num_frames) * 0.2
-            img_copy = image.copy()
-            # Tính toán kích thước và vị trí crop
-            size = int(img_copy.width / zoom_factor)
-            left = (img_copy.width - size) // 2
-            top = (img_copy.height - size) // 2
-            right = left + size
-            bottom = top + size
-            # Cắt và resize lại hình ảnh
-            cropped = img_copy.crop((left, top, right, bottom))
-            frame = cropped.resize((512, 512))
-            # Thêm hiệu ứng màu dựa theo prompt
-            # (đơn giản hóa - trong thực tế sẽ sử dụng mô hình ML)
-            frames.append(np.array(frame))
         # Tạo video từ các khung hình
-        clip = ImageSequenceClip(frames, fps=8)
         output_path = f"output_video_{int(time.time())}.mp4"
-        clip.write_videofile(output_path, codec="libx264")
         return output_path, "Video đã được tạo thành công!"
     except Exception as e:
@@ -63,16 +97,18 @@ def generate_video(image, prompt, num_frames=16, guidance_scale=7.5):
 # Tạo giao diện Gradio
 with gr.Blocks(title="Ứng dụng tạo video từ hình ảnh") as demo:
     gr.Markdown("# Tạo video từ hình ảnh")
-    gr.Markdown("Tải lên một hình ảnh và nhập mô tả để tạo hiệu ứng chuyển động đơn giản.")
     with gr.Row():
         with gr.Column():
             image_input = gr.Image(type="pil", label="Tải lên hình ảnh")
-            prompt_input = gr.Textbox(label="Mô tả hiệu ứng",
-                                     placeholder="Hiệu ứng bạn muốn...",
-                                     value="Zoom in effect with cinematic lighting")
             num_frames = gr.Slider(minimum=10, maximum=30, value=16, step=2, label="Số khung hình")
-            guidance = gr.Slider(minimum=1.0, maximum=10.0, value=7.5, step=0.5, label="Độ mạnh của hiệu ứng")
             submit_btn = gr.Button("Tạo video")
         with gr.Column():
@@ -81,12 +117,14 @@ with gr.Blocks(title="Ứng dụng tạo video từ hình ảnh") as demo:
     submit_btn.click(
         fn=generate_video,
-        inputs=[image_input, prompt_input, num_frames, guidance],
         outputs=[output_video, output_message]
     )
-    gr.Markdown("### Lưu ý")
-    gr.Markdown("- Đây là phiên bản đơn giản tạo hiệu ứng zoom-in cơ bản")
-    gr.Markdown("- Kích thước hình ảnh sẽ được thay đổi về 512x512 pixel")
 demo.launch()

 import gradio as gr
 import torch
 import os
 from PIL import Image
 import numpy as np
+import imageio
 import time
+# Kiểm tra device
 device = "cuda" if torch.cuda.is_available() else "cpu"
 print(f"Using device: {device}")
+# Hàm tạo video đơn giản
+def generate_video(image, effect_type, num_frames=16, effect_strength=5.0):
     if image is None:
         return None, "Vui lòng tải lên một hình ảnh"
     image = image.resize((512, 512))
     try:
+        # Tạo chuỗi khung hình với hiệu ứng khác nhau
         frames = []
+        if effect_type == "zoom-in":
+            # Hiệu ứng zoom-in
+            for i in range(num_frames):
+                zoom_factor = 1.0 + (i / num_frames) * (effect_strength / 10)
+                img_copy = image.copy()
+                size = int(img_copy.width / zoom_factor)
+                left = (img_copy.width - size) // 2
+                top = (img_copy.height - size) // 2
+                right = left + size
+                bottom = top + size
+                cropped = img_copy.crop((left, top, right, bottom))
+                frame = cropped.resize((512, 512))
+                frames.append(np.array(frame))
+        elif effect_type == "pan-right":
+            # Hiệu ứng pan từ trái sang phải
+            width, height = image.size
+            for i in range(num_frames):
+                offset = int((i / num_frames) * width * (effect_strength / 10))
+                img_copy = image.copy()
+                # Tạo hiệu ứng pan
+                if offset > 0:
+                    # Lấy phần hình ảnh từ offset đến cuối
+                    right_part = img_copy.crop((offset, 0, width, height))
+                    # Lấy phần còn lại từ đầu
+                    left_part = img_copy.crop((0, 0, offset, height))
+                    # Tạo hình ảnh mới
+                    new_img = Image.new('RGB', (width, height))
+                    new_img.paste(right_part, (0, 0))
+                    new_img.paste(left_part, (width - offset, 0))
+                    frames.append(np.array(new_img))
+                else:
+                    frames.append(np.array(img_copy))
+        elif effect_type == "fade":
+            # Hiệu ứng fade in/out
+            base_frame = np.array(image)
+            for i in range(num_frames):
+                # Tính toán độ mờ
+                if i < num_frames / 2:
+                    # Fade in
+                    alpha = i / (num_frames / 2)
+                else:
+                    # Fade out
+                    alpha = 2.0 - (i / (num_frames / 2))
+                # Áp dụng độ mờ
+                frame = (base_frame * alpha * (effect_strength / 5)).astype(np.uint8)
+                frames.append(frame)
+        else:
+            # Mặc định, chỉ thêm hiệu ứng đơn giản
+            for i in range(num_frames):
+                brightness = 1.0 + (effect_strength / 10) * np.sin(2 * np.pi * i / num_frames)
+                frame = (np.array(image) * brightness).clip(0, 255).astype(np.uint8)
+                frames.append(frame)
         # Tạo video từ các khung hình
         output_path = f"output_video_{int(time.time())}.mp4"
+        imageio.mimsave(output_path, frames, fps=8)
         return output_path, "Video đã được tạo thành công!"
     except Exception as e:
 # Tạo giao diện Gradio
 with gr.Blocks(title="Ứng dụng tạo video từ hình ảnh") as demo:
     gr.Markdown("# Tạo video từ hình ảnh")
+    gr.Markdown("Tải lên một hình ảnh và chọn hiệu ứng để tạo video.")
     with gr.Row():
         with gr.Column():
             image_input = gr.Image(type="pil", label="Tải lên hình ảnh")
+            effect_input = gr.Radio(
+                ["zoom-in", "pan-right", "fade", "pulse"],
+                label="Chọn hiệu ứng",
+                value="zoom-in"
+            )
             num_frames = gr.Slider(minimum=10, maximum=30, value=16, step=2, label="Số khung hình")
+            effect_strength = gr.Slider(minimum=1.0, maximum=10.0, value=5.0, step=0.5, label="Độ mạnh của hiệu ứng")
             submit_btn = gr.Button("Tạo video")
         with gr.Column():
     submit_btn.click(
         fn=generate_video,
+        inputs=[image_input, effect_input, num_frames, effect_strength],
         outputs=[output_video, output_message]
     )
+    gr.Markdown("### Hướng dẫn")
+    gr.Markdown("- **Zoom-in**: Hiệu ứng phóng to hình ảnh")
+    gr.Markdown("- **Pan-right**: Hiệu ứng di chuyển từ trái sang phải")
+    gr.Markdown("- **Fade**: Hiệu ứng mờ dần rồi hiện dần")
+    gr.Markdown("- **Pulse**: Hiệu ứng thay đổi độ sáng theo nhịp")
 demo.launch()

requirements.txt CHANGED Viewed

@@ -4,9 +4,4 @@ torchvision
 pillow
 numpy
 imageio==2.31.1
-imageio-ffmpeg
-decorator>=4.0.2
-tqdm>=4.11.2
-proglog<=1.0.0
-requests
-moviepy==1.0.3

 pillow
 numpy
 imageio==2.31.1
+imageio-ffmpeg