Spaces:

alvinichi
/

imageToVideo

Running

App Files Community

alvinichi committed on Apr 17

Commit

5b61f28

1 Parent(s): 6be96f1

update

Browse files

Files changed (1) hide show

app.py +149 -76

app.py CHANGED Viewed

@@ -9,15 +9,16 @@ from skimage import img_as_ubyte
 import gradio as gr
 from PIL import Image
 import tempfile
-# Đảm bảo cài đặt các thư viện cần thiết trước khi import
 subprocess.check_call([sys.executable, "-m", "pip", "install", "scikit-learn"])
 subprocess.check_call([sys.executable, "-m", "pip", "install", "scikit-image==0.19.3"])
 subprocess.check_call([sys.executable, "-m", "pip", "install", "face-alignment==1.3.5"])
 subprocess.check_call([sys.executable, "-m", "pip", "install", "PyYAML==5.3.1"])
 subprocess.check_call([sys.executable, "-m", "pip", "install", "imageio-ffmpeg==0.4.5"])
-subprocess.check_call([sys.executable, "-m", "pip", "install", "gdown"])
-subprocess.check_call([sys.executable, "-m", "pip", "install", "huggingface_hub"])
 # Cài đặt ffmpeg trong môi trường Ubuntu
 os.system("apt-get update && apt-get install -y ffmpeg")
@@ -95,77 +96,100 @@ def normalize_kp(kp_source, kp_driving, kp_driving_initial,
 # Import hàm load_checkpoints từ file helper
 from load_helper import load_checkpoints, normalize_kp
-# Tải mô hình pre-trained với phương pháp cải tiến
 def download_model():
-    try:
-        # Thử phương pháp sử dụng gdown trước
-        model_path = 'checkpoints/vox-cpk.pth.tar'
-        if not os.path.exists('checkpoints'):
-            os.makedirs('checkpoints', exist_ok=True)
-        # Kiểm tra xem file đã tồn tại và đủ lớn chưa
-        if not os.path.exists(model_path) or os.path.getsize(model_path) < 1000000:
-            print("Đang tải mô hình từ Google Drive...")
-            import gdown
-            file_id = '1PyQJmkdCsAkOYwUyaj_l-l0as-iLDgeH'
-            gdown.download(f"https://drive.google.com/uc?id={file_id}", model_path, quiet=False)
-        config_path = 'first_order_model/config/vox-256.yaml'
-        if not os.path.exists('first_order_model/config'):
-            os.makedirs('first_order_model/config', exist_ok=True)
-        if not os.path.exists(config_path) or os.path.getsize(config_path) < 1000:
-            print("Đang tải file cấu hình từ Google Drive...")
-            import gdown
-            file_id = '1pZUMNRjkBiuBEM68oj9nskuWgJR-5QMn'
-            gdown.download(f"https://drive.google.com/uc?id={file_id}", config_path, quiet=False)
-        # Kiểm tra lại kích thước file
-        if os.path.exists(model_path) and os.path.getsize(model_path) > 1000000 and os.path.exists(config_path) and os.path.getsize(config_path) > 1000:
-            return config_path, model_path
-        # Nếu gdown không thành công, thử phương pháp sử dụng Hugging Face
-        raise Exception("Tải mô hình từ Google Drive không thành công. Chuyển sang sử dụng Hugging Face...")
-    except Exception as e:
-        print(f"Lỗi khi tải từ Google Drive: {str(e)}")
-        return download_model_alternative()
-def download_model_alternative():
-    try:
-        print("Đang tải mô hình từ Hugging Face...")
-        from huggingface_hub import hf_hub_download
-        model_path = hf_hub_download(
-            repo_id="ycyunwei/first-order-motion-model",
-            filename="vox-cpk.pth.tar"
-        )
-        config_path = hf_hub_download(
-            repo_id="ycyunwei/first-order-motion-model",
-            filename="vox-256.yaml"
-        )
-        return config_path, model_path
-    except Exception as e:
-        print(f"Lỗi khi tải từ Hugging Face: {str(e)}")
-        # Thử phương pháp cuối cùng - sử dụng direct link
-        model_path = 'checkpoints/vox-cpk.pth.tar'
-        if not os.path.exists('checkpoints'):
-            os.makedirs('checkpoints', exist_ok=True)
-        os.system(f'wget -O {model_path} https://github.com/AliaksandrSiarohin/first-order-model/releases/download/v1.0.0/vox-cpk.pth.tar')
-        config_path = 'first_order_model/config/vox-256.yaml'
-        if not os.path.exists('first_order_model/config'):
-            os.makedirs('first_order_model/config', exist_ok=True)
-        os.system(f'wget -O {config_path} https://raw.githubusercontent.com/AliaksandrSiarohin/first-order-model/master/config/vox-256.yaml')
-        if os.path.exists(model_path) and os.path.getsize(model_path) > 1000000 and os.path.exists(config_path) and os.path.getsize(config_path) > 1000:
-            return config_path, model_path
-        else:
-            raise Exception("Không thể tải mô hình bằng cả ba phương pháp. Vui lòng thử lại sau.")
 # Hàm tạo animation
 def make_animation(source_image, driving_video, relative=True, adapt_movement_scale=True):
@@ -233,6 +257,59 @@ def make_animation(source_image, driving_video, relative=True, adapt_movement_sc
     return output_path
 # Định nghĩa giao diện Gradio
 def animate_fomm(source_image, driving_video_file, relative=True, adapt_scale=True):
     if source_image is None:
@@ -252,11 +329,7 @@ def animate_fomm(source_image, driving_video_file, relative=True, adapt_scale=Tr
         # Kiểm tra nếu đã chọn sử dụng video mẫu
         if driving_video_file is None:
             # Tải và sử dụng video mẫu
-            sample_path = "sample_driving.mp4"
-            if not os.path.exists(sample_path) or os.path.getsize(sample_path) < 10000:
-                print("Đang tải video mẫu...")
-                os.system("wget -O sample_driving.mp4 https://github.com/AliaksandrSiarohin/first-order-model/raw/master/driving.mp4")
-            driving_path = sample_path
         else:
             # Xử lý video được tải lên
             if isinstance(driving_video_file, str):

 import gradio as gr
 from PIL import Image
 import tempfile
+import requests
+from io import BytesIO
+# Đảm bảo cài đặt các thư viện cần thiết
 subprocess.check_call([sys.executable, "-m", "pip", "install", "scikit-learn"])
 subprocess.check_call([sys.executable, "-m", "pip", "install", "scikit-image==0.19.3"])
 subprocess.check_call([sys.executable, "-m", "pip", "install", "face-alignment==1.3.5"])
 subprocess.check_call([sys.executable, "-m", "pip", "install", "PyYAML==5.3.1"])
 subprocess.check_call([sys.executable, "-m", "pip", "install", "imageio-ffmpeg==0.4.5"])
+subprocess.check_call([sys.executable, "-m", "pip", "install", "requests"])
 # Cài đặt ffmpeg trong môi trường Ubuntu
 os.system("apt-get update && apt-get install -y ffmpeg")
 # Import hàm load_checkpoints từ file helper
 from load_helper import load_checkpoints, normalize_kp
+# Tải mô hình từ GitHub hoặc mirrors của first-order-model
 def download_model():
+    # URLs trực tiếp từ sources khác
+    checkpoint_urls = [
+        "https://github.com/AliaksandrSiarohin/first-order-model/releases/download/v1.0.0/vox-cpk.pth.tar",
+        "https://raw.githubusercontent.com/jiupinjia/stylized-neural-painting/main/checkpoints/vox-cpk.pth.tar",
+        "https://github.com/snap-research/articulated-animation/raw/master/checkpoints/vox.pth.tar"
+    ]
+    config_urls = [
+        "https://raw.githubusercontent.com/AliaksandrSiarohin/first-order-model/master/config/vox-256.yaml",
+        "https://gist.githubusercontent.com/anonymous/raw/vox-256.yaml"
+    ]
+    # Tạo thư mục
+    model_path = 'checkpoints/vox-cpk.pth.tar'
+    if not os.path.exists('checkpoints'):
+        os.makedirs('checkpoints', exist_ok=True)
+    config_path = 'first_order_model/config/vox-256.yaml'
+    if not os.path.exists('first_order_model/config'):
+        os.makedirs('first_order_model/config', exist_ok=True)
+    # Tải model checkpoint
+    success = False
+    for url in checkpoint_urls:
+        try:
+            print(f"Đang thử tải mô hình từ: {url}")
+            response = requests.get(url, stream=True, timeout=30)
+            if response.status_code == 200:
+                with open(model_path, 'wb') as f:
+                    for chunk in response.iter_content(chunk_size=8192):
+                        f.write(chunk)
+                # Kiểm tra kích thước file (checkpoint mô hình thường > 100MB)
+                if os.path.getsize(model_path) > 100000000:
+                    success = True
+                    break
+        except Exception as e:
+            print(f"Lỗi khi tải từ {url}: {str(e)}")
+    if not success:
+        raise Exception("Không thể tải mô hình checkpoint từ bất kỳ nguồn nào")
+    # Tải file cấu hình
+    config_success = False
+    for url in config_urls:
+        try:
+            print(f"Đang thử tải file cấu hình từ: {url}")
+            response = requests.get(url, timeout=30)
+            if response.status_code == 200:
+                with open(config_path, 'wb') as f:
+                    f.write(response.content)
+                if os.path.getsize(config_path) > 1000:
+                    config_success = True
+                    break
+        except Exception as e:
+            print(f"Lỗi khi tải cấu hình từ {url}: {str(e)}")
+    if not config_success:
+        # Tạo file cấu hình đơn giản nếu không tải được
+        create_simple_config(config_path)
+    return config_path, model_path
+# Tạo file cấu hình đơn giản nếu không tải được
+def create_simple_config(config_path):
+    with open(config_path, 'w') as f:
+        f.write("""
+model_params:
+  common_params:
+    num_kp: 10
+    num_channels: 3
+    estimate_jacobian: true
+  kp_detector_params:
+     temperature: 0.1
+     block_expansion: 32
+     max_features: 1024
+     scale_factor: 0.25
+     num_blocks: 5
+  generator_params:
+    block_expansion: 64
+    max_features: 512
+    num_down_blocks: 2
+    num_bottleneck_blocks: 6
+    estimate_occlusion_map: true
+    dense_motion_params:
+      block_expansion: 64
+      max_features: 1024
+      num_blocks: 5
+      scale_factor: 0.25
+        """)
+    print("Đã tạo file cấu hình đơn giản")
 # Hàm tạo animation
 def make_animation(source_image, driving_video, relative=True, adapt_movement_scale=True):
     return output_path
+# Tải video mẫu
+def download_sample_video():
+    sample_urls = [
+        "https://github.com/AliaksandrSiarohin/first-order-model/raw/master/driving.mp4",
+        "https://raw.githubusercontent.com/jiupinjia/stylized-neural-painting/main/sample/driving.mp4"
+    ]
+    sample_path = "sample_driving.mp4"
+    for url in sample_urls:
+        try:
+            print(f"Đang thử tải video mẫu từ: {url}")
+            response = requests.get(url, timeout=30)
+            if response.status_code == 200:
+                with open(sample_path, 'wb') as f:
+                    f.write(response.content)
+                if os.path.getsize(sample_path) > 10000:  # Kiểm tra kích thước file
+                    return sample_path
+        except Exception as e:
+            print(f"Lỗi khi tải video mẫu từ {url}: {str(e)}")
+    # Nếu không tải được, tạo video đơn giản
+    create_simple_video(sample_path)
+    return sample_path
+# Tạo video đơn giản nếu không tải được video mẫu
+def create_simple_video(output_path):
+    import cv2
+    out = cv2.VideoWriter(output_path, cv2.VideoWriter_fourcc(*'mp4v'), 10, (256, 256))
+    # Tạo 100 khung hình với chuyển động đơn giản
+    for i in range(100):
+        frame = np.zeros((256, 256, 3), dtype=np.uint8)
+        # Vẽ khuôn mặt đơn giản chuyển động
+        x_center = 128 + int(np.sin(i/10) * 20)
+        y_center = 128 + int(np.cos(i/20) * 10)
+        # Vẽ khuôn mặt
+        cv2.circle(frame, (x_center, y_center), 60, (200, 200, 200), -1)  # Mặt
+        cv2.circle(frame, (x_center - 20, y_center - 15), 10, (0, 0, 0), -1)  # Mắt trái
+        cv2.circle(frame, (x_center + 20, y_center - 15), 10, (0, 0, 0), -1)  # Mắt phải
+        # Vẽ miệng
+        mouth_y = y_center + 20 + int(np.sin(i/5) * 5)
+        cv2.ellipse(frame, (x_center, mouth_y), (20, 10), 0, 0, 180, (0, 0, 0), -1)
+        out.write(frame)
+    out.release()
+    print("Đã tạo video đơn giản")
 # Định nghĩa giao diện Gradio
 def animate_fomm(source_image, driving_video_file, relative=True, adapt_scale=True):
     if source_image is None:
         # Kiểm tra nếu đã chọn sử dụng video mẫu
         if driving_video_file is None:
             # Tải và sử dụng video mẫu
+            driving_path = download_sample_video()
         else:
             # Xử lý video được tải lên
             if isinstance(driving_video_file, str):