gradio-app
diff --git a/gradio/routes.py b/gradio/routes.py
Lines changed: 1 addition & 1 deletion
diff --git a/gradio/screen_recording_utils.py b/gradio/screen_recording_utils.py
Lines changed: 53 additions & 150 deletions
@@ -1699,7 +1699,7 @@ async def process_recording(
                 "zoom_bottom_right_x": form.get("zoom_bottom_right_x"),
                 "zoom_bottom_right_y": form.get("zoom_bottom_right_y"),
                 "zoom_duration": form.get("zoom_duration"),
-                "zoom_timestamp": form.get("zoom_timestamp"),
+                "zoom_start_frame": form.get("zoom_start_frame"),
             }
 
             print("Zoom parameters in request:", {k: v for k, v in params.items() if k.startswith("zoom_")})
 
@@ -3,19 +3,14 @@
 import shutil
 import tempfile
 import traceback
-import json
+import subprocess
 
 
 async def process_video_with_ffmpeg(input_path, output_path, params):
-    """Process a video with ffmpeg based on the provided parameters."""
     current_input = input_path
     temp_files = [input_path]
 
     try:
-        # Debug: Print all parameters
-        print("Processing video with parameters:", params)
-        
-        # Handle segment removal
         if params.get("remove_segment_start") and params.get("remove_segment_end"):
             start = float(params["remove_segment_start"])
             end = float(params["remove_segment_end"])
@@ -53,9 +48,6 @@ async def process_video_with_ffmpeg(input_path, output_path, params):
                     )
                     stdout, stderr = await process.communicate()
 
-                    if process.returncode != 0:
-                        print(f"FFmpeg before segment error: {stderr.decode()}")
-
                 cmd_after = [
                     "ffmpeg",
                     "-y",
@@ -81,9 +73,6 @@ async def process_video_with_ffmpeg(input_path, output_path, params):
                 )
                 stdout, stderr = await process.communicate()
 
-                if process.returncode != 0:
-                    print(f"FFmpeg after segment error: {stderr.decode()}")
-
                 concat_file = tempfile.mktemp(suffix="_concat.txt")
                 temp_files.append(concat_file)
 
@@ -122,30 +111,18 @@ async def process_video_with_ffmpeg(input_path, output_path, params):
                     )
                     stdout, stderr = await process.communicate()
 
-                    if process.returncode != 0:
-                        print(f"FFmpeg concat error: {stderr.decode()}")
-                    else:
-                        current_input = segment_output
+                    current_input = segment_output
 
                 for file in [before_segment, after_segment, concat_file]:
                     try:
                         if os.path.exists(file):
                             os.unlink(file)
                     except:
                         pass
-
-        # Handle zoom effect with individual coordinates
-        print("Processing zoom effect....", 
-              params.get("zoom_top_left_x"), 
-              params.get("zoom_top_left_y"), 
-              params.get("zoom_bottom_right_x"), 
-              params.get("zoom_bottom_right_y"),
-              params.get("zoom_timestamp"))
 
         if (params.get("zoom_top_left_x") and params.get("zoom_top_left_y") and 
             params.get("zoom_bottom_right_x") and params.get("zoom_bottom_right_y")):
             try:
-                # Parse zoom parameters from individual coordinates
                 zoom_top_left = [
                     float(params.get("zoom_top_left_x")),
                     float(params.get("zoom_top_left_y"))
@@ -155,30 +132,23 @@ async def process_video_with_ffmpeg(input_path, output_path, params):
                     float(params.get("zoom_bottom_right_y"))
                 ]
                 zoom_duration = float(params.get("zoom_duration", 2.0))
-                zoom_timestamp = params.get("zoom_timestamp")
-                
-                print(f"Parsed zoom parameters: top_left={zoom_top_left}, bottom_right={zoom_bottom_right}, duration={zoom_duration}, timestamp={zoom_timestamp}")
+                zoom_start_frame = params.get("zoom_start_frame")
 
-                # Call zoom_in function with timestamp
                 zoom_output, zoom_temp_files = await zoom_in(
                     current_input, 
                     output_path,
                     zoom_top_left, 
                     zoom_bottom_right, 
                     zoom_duration,
-                    zoom_timestamp
+                    zoom_start_frame
                 )
 
-                # Update current input and temp files
                 if zoom_output and zoom_output != current_input:
                     current_input = zoom_output
                     temp_files.extend(zoom_temp_files)
             except Exception as e:
-                print(f"Error applying zoom effect: {str(e)}")
                 traceback.print_exc()
-                # Continue with processing without zoom effect
 
-        # For MP4 output, just ensure it's in compatible format
         final_mp4 = output_path
         cmd = [
             "ffmpeg",
@@ -204,198 +174,131 @@ async def process_video_with_ffmpeg(input_path, output_path, params):
         stdout, stderr = await process.communicate()
 
         if process.returncode != 0:
-            print(f"FFmpeg final MP4 conversion error: {stderr.decode()}")
             shutil.copy(current_input, final_mp4)
 
         current_input = final_mp4
         return current_input, temp_files
 
     except Exception as e:
-        print(f"Error in process_video_with_ffmpeg: {str(e)}")
         traceback.print_exc()
         return input_path, temp_files
 
-async def zoom_in(input_path, output_path, top_left=None, bottom_right=None, zoom_duration=2.0, zoom_timestamp=None):
+async def zoom_in(input_path, output_path, top_left=None, bottom_right=None, zoom_duration=2.0, zoom_start_frame=None):
+    from ffmpy import FFmpeg
     temp_files = []
 
     try:
-        # Validate inputs
         if not input_path or not os.path.exists(input_path):
-            print(f"Input file does not exist: {input_path}")
             return input_path, temp_files
 
-        # Get zoom timestamp (when to start the zoom effect)
-        if zoom_timestamp is None:
-            print("No zoom timestamp provided, defaulting to 2 seconds")
-            zoom_timestamp = 2.0
+        if zoom_start_frame is None:
+            zoom_start_frame = 60
         else:
             try:
-                zoom_timestamp = float(zoom_timestamp)
-                print(f"Using zoom timestamp: {zoom_timestamp} seconds")
+                zoom_start_frame = float(zoom_start_frame)
             except (ValueError, TypeError):
-                print("Invalid zoom timestamp, defaulting to 2 seconds")
-                zoom_timestamp = 2.0
+                zoom_start_frame = 60
 
-        # Default values if coordinates are None
         if top_left is None:
-            print("Using default top_left coordinates (0.25, 0.25)")
             top_left = [0.25, 0.25]
 
         if bottom_right is None:
-            print("Using default bottom_right coordinates (0.75, 0.75)")
             bottom_right = [0.75, 0.75]
 
-        # Print coordinates for debugging
-        print(f"Zoom coordinates: top_left={top_left}, bottom_right={bottom_right}")
-        
-        # Safely extract coordinates
         try:
             x1, y1 = float(top_left[0]), float(top_left[1])
             x2, y2 = float(bottom_right[0]), float(bottom_right[1])
         except (TypeError, ValueError, IndexError) as e:
-            print(f"Error converting coordinates to float: {e}")
-            print("Using default coordinates")
             x1, y1 = 0.25, 0.25
             x2, y2 = 0.75, 0.75
 
-        # Ensure coordinates are within valid range
         x1 = max(0.0, min(0.9, x1))
         y1 = max(0.0, min(0.9, y1))
         x2 = max(0.1, min(1.0, x2))
         y2 = max(0.1, min(1.0, y2))
 
-        # Ensure x2 > x1 and y2 > y1
         if x2 <= x1:
             x1, x2 = 0.25, 0.75
         if y2 <= y1:
             y1, y2 = 0.25, 0.75
 
-        # Get video dimensions
-        # cmd_dimensions = [
-        #     "ffprobe",
-        #     "-v", "error",
-        #     "-select_streams", "v:0",
-        #     "-show_entries", "stream=width,height",
-        #     "-of", "csv=s=x:p=0",
-        #     input_path
-        # ]
-        
-        # process = await asyncio.create_subprocess_exec(
-        #     *cmd_dimensions,
-        #     stdout=asyncio.subprocess.PIPE,
-        #     stderr=asyncio.subprocess.PIPE,
-        # )
-        # stdout, stderr = await process.communicate()
+        duration_cmd = f"ffprobe -v error -show_entries format=duration -of default=noprint_wrappers=1:nokey=1 \"{input_path}\""
 
-        # try:
-        #     dimensions = stdout.decode().strip().split('x')
-        #     width = int(dimensions[0])
-        #     height = int(dimensions[1])
-        #     print(f"Video dimensions: {width}x{height}")
-        # except (ValueError, IndexError):
-        #     print("Could not determine video dimensions, using defaults")
-        # width, height = 1920, 1080
-            
-        # Get video duration
-        cmd_duration = [
-            "ffprobe",
-            "-v", "error",
-            "-show_entries", "format=duration",
-            "-of", "default=noprint_wrappers=1:nokey=1",
-            input_path
-        ]
-
-        process = await asyncio.create_subprocess_exec(
-            *cmd_duration,
+        process = await asyncio.create_subprocess_shell(
+            duration_cmd,
             stdout=asyncio.subprocess.PIPE,
             stderr=asyncio.subprocess.PIPE,
         )
         stdout, stderr = await process.communicate()
 
         try:
-            video_duration = float(stdout.decode().strip())
-            print(f"Video duration: {video_duration} seconds")
-        except (ValueError, TypeError):
-            print(f"Could not determine video duration, using default")
+            output = stdout.decode().strip()
+            video_duration = float(output)
+        except (ValueError, TypeError) as e:
             video_duration = 10.0
 
         zoom_duration = min(float(zoom_duration), video_duration)
-        
-        # Apply the zoom pan effect directly without box
+
         zoom_output = tempfile.mktemp(suffix="_zoomed.mp4")
         temp_files.append(zoom_output)
 
-        # Calculate the center of the specified area
         center_x = (x1 + x2) / 2
         center_y = (y1 + y2) / 2
 
-        # Create a complex filter for the zoom pan effect
-        fps = 25
-        zoom_in_frames = int(0.3 * fps)
-        hold_frames = int(2 * fps)     # 2 seconds to hold
-        zoom_out_frames = int(0.3 * fps)
-        total_frames = zoom_in_frames + hold_frames + zoom_out_frames
+        # zoom_start_frame = 60  # *** TODO: causing issues when replaced with param
+        zoom_in_frames = 15    # Zoom in over 15 frames
+        zoom_out_frames = 15   # Zoom out over 15 frames
+        max_zoom = 2.0        # Maximum zoom level
+        hold_frames = 60
 
-        # Max zoom factor (reduced from 2.0 to 1.5)
-        max_zoom = 1.5
-
-        # Set fixed dimensions
         width, height = 1920, 1080
 
-        # Update the complex filter to remove padding/black bars
         complex_filter = (
-            f"[0:v]split=3[v1][v2][v3];"
-            f"[v1]trim=0:{zoom_timestamp},setpts=PTS-STARTPTS,scale={width}:{height}[intro];"  # Direct scaling
-            f"[v2]trim={zoom_timestamp}:{zoom_timestamp+zoom_duration},setpts=PTS-STARTPTS,"
-            f"scale={width}:{height},"  # Direct scaling without preserving aspect ratio
-            f"zoompan=z='if(lt(on,{zoom_in_frames})," 
-            f"     1+({max_zoom}-1)*on/{zoom_in_frames}," # zoom in phase
-            f"     if(lt(on,{zoom_in_frames+hold_frames}),"
-            f"        {max_zoom}," # hold phase
-            f"        {max_zoom}-({max_zoom}-1)*(on-{zoom_in_frames+hold_frames})/{zoom_out_frames}" # zoom out phase
-            f"     )"
-            f"  )':"
-            f"x='iw*{center_x}-iw/zoom*{center_x}':y='ih*{center_y}-ih/zoom*{center_y}':"
-            f"d={total_frames}:s={width}x{height}:fps={fps}[zoom];"
-            f"[v3]trim={zoom_timestamp+zoom_duration}:{video_duration},setpts=PTS-STARTPTS,scale={width}:{height}[outro];"  # Direct scaling
-            f"[intro][zoom][outro]concat=n=3:v=1:a=0[outv]"
+            f"[0:v]zoompan="
+            f"z='if(between(on,{zoom_start_frame},{zoom_start_frame + zoom_in_frames + hold_frames + zoom_out_frames}),"
+            f"if(lt(on-{zoom_start_frame},{zoom_in_frames}),"
+            f"1+(({max_zoom}-1)*(on-{zoom_start_frame})/{zoom_in_frames}),"
+            f"if(lt(on-{zoom_start_frame},{zoom_in_frames + hold_frames}),"
+            f"{max_zoom},"
+            f"{max_zoom}-(({max_zoom}-1)*((on-{zoom_start_frame}-{zoom_in_frames}-{hold_frames}))/{zoom_out_frames})"
+            f")),1)':"
+            f"x='iw*{center_x}-iw/zoom*{center_x}':"
+            f"y='ih*{center_y}-ih/zoom*{center_y}':"
+            f"d=0:"
+            f"s={width}x{height}[outv]"
         )
 
-        cmd_zoom = [
-            "ffmpeg",
-            "-y",
-            "-i", input_path,
-            "-filter_complex", complex_filter,
-            "-map", "[outv]",
-            "-map", "0:a?",  # Make audio mapping optional with ?
-            "-c:v", "libx264",
-            "-tag:v", "avc3",
-            "-profile:v", "baseline",
-            "-level", "3.0",
-            "-pix_fmt", "yuv420p",
-            "-preset", "fast",
-            "-c:a", "copy",
-            zoom_output,
-        ]
-
-        print(f"Running zoom pan effect command: {' '.join(cmd_zoom)}")
+        ff = FFmpeg(
+            inputs={input_path: None},
+            outputs={
+                zoom_output: (
+                    f"-filter_complex \"{complex_filter}\" "
+                    f"-map \"[outv]\" "
+                    f"-map 0:a? "
+                    f"-c:v libx264 " 
+                    f"-pix_fmt yuv420p "
+                    f"-movflags +faststart "
+                    f"-preset fast "
+                    f"-c:a aac "
+                    f"-y"
+                )
+            }
+        )
 
+        cmd_parts = ff.cmd.split()
         process = await asyncio.create_subprocess_exec(
-            *cmd_zoom,
+            *cmd_parts,
             stdout=asyncio.subprocess.PIPE,
             stderr=asyncio.subprocess.PIPE,
         )
         stdout, stderr = await process.communicate()
 
         if process.returncode != 0:
-            print(f"FFmpeg zoom pan effect error: {stderr.decode()}")
-            print(stderr.decode())
-            # Return the input if zoom fails
+            print("FFmpeg error:", stderr.decode())
             return input_path, temp_files
 
         return zoom_output, temp_files
 
     except Exception as e:
-        print(f"Error in zoom_in: {str(e)}")
         traceback.print_exc()
         return input_path, temp_files
Original file line number	Diff line number	Diff line change
`@@ -1699,7 +1699,7 @@ async def process_recording(`
`1699`	`1699`	`"zoom_bottom_right_x": form.get("zoom_bottom_right_x"),`
`1700`	`1700`	`"zoom_bottom_right_y": form.get("zoom_bottom_right_y"),`
`1701`	`1701`	`"zoom_duration": form.get("zoom_duration"),`
`1702`		`- "zoom_timestamp": form.get("zoom_timestamp"),`
	`1702`	`+ "zoom_start_frame": form.get("zoom_start_frame"),`
`1703`	`1703`	`}`
`1704`	`1704`
`1705`	`1705`	`print("Zoom parameters in request:", {k: v for k, v in params.items() if k.startswith("zoom_")})`