feat(main.py): enhance seeking and playback controls for improved user experience
This commit is contained in:
241
main.py
241
main.py
@@ -8,22 +8,26 @@ import time
|
||||
from pathlib import Path
|
||||
from typing import List, Tuple, Optional
|
||||
|
||||
|
||||
class MediaGrader:
|
||||
# Configuration constants
|
||||
DEFAULT_FPS = 30
|
||||
BASE_FRAME_DELAY_MS = 33 # ~30 FPS
|
||||
KEY_REPEAT_THRESHOLD_SEC = 0.5
|
||||
KEY_REPEAT_THRESHOLD_SEC = 0.2 # Faster detection for repeat
|
||||
FAST_SEEK_ACTIVATION_TIME = 0.5 # How long to hold before fast seek
|
||||
WINDOW_MAX_WIDTH = 1200
|
||||
WINDOW_MAX_HEIGHT = 800
|
||||
WINDOW_MAX_SCALE_UP = 2.0
|
||||
SPEED_INCREMENT = 0.1
|
||||
MIN_PLAYBACK_SPEED = 0.1
|
||||
MAX_PLAYBACK_SPEED = 100.0
|
||||
FAST_SEEK_MULTIPLIER = 500
|
||||
FAST_SEEK_MULTIPLIER = 5
|
||||
IFRAME_SNAP_INTERVAL = 30
|
||||
IMAGE_DISPLAY_DELAY_MS = 100
|
||||
|
||||
def __init__(self, directory: str, seek_frames: int = 30, snap_to_iframe: bool = False):
|
||||
def __init__(
|
||||
self, directory: str, seek_frames: int = 30, snap_to_iframe: bool = False
|
||||
):
|
||||
self.directory = Path(directory)
|
||||
self.seek_frames = seek_frames
|
||||
self.snap_to_iframe = snap_to_iframe
|
||||
@@ -38,6 +42,7 @@ class MediaGrader:
|
||||
# Key repeat tracking
|
||||
self.last_key_time = 0
|
||||
self.last_key = None
|
||||
self.key_first_press_time = 0
|
||||
|
||||
# Seeking modes
|
||||
self.fine_seek_frames = 1 # Frame-by-frame
|
||||
@@ -45,7 +50,16 @@ class MediaGrader:
|
||||
self.fast_seek_frames = self.seek_frames * self.FAST_SEEK_MULTIPLIER
|
||||
|
||||
# Supported media extensions
|
||||
self.extensions = ['*.png', '*.jpg', '*.jpeg', '*.gif', '*.mp4', '*.avi', '*.mov', '*.mkv']
|
||||
self.extensions = [
|
||||
"*.png",
|
||||
"*.jpg",
|
||||
"*.jpeg",
|
||||
"*.gif",
|
||||
"*.mp4",
|
||||
"*.avi",
|
||||
"*.mov",
|
||||
"*.mkv",
|
||||
]
|
||||
|
||||
# Create grade directories
|
||||
for i in range(1, 6):
|
||||
@@ -64,24 +78,32 @@ class MediaGrader:
|
||||
filtered_files = []
|
||||
for file in media_files:
|
||||
# Check if file is not in a grade directory (1-5)
|
||||
if not any(part in ['1', '2', '3', '4', '5'] for part in file.parts):
|
||||
if not any(part in ["1", "2", "3", "4", "5"] for part in file.parts):
|
||||
filtered_files.append(file)
|
||||
|
||||
return sorted(filtered_files)
|
||||
|
||||
def is_video(self, file_path: Path) -> bool:
|
||||
"""Check if file is a video"""
|
||||
return file_path.suffix.lower() in ['.mp4', '.avi', '.mov', '.mkv', '.gif']
|
||||
return file_path.suffix.lower() in [".mp4", ".avi", ".mov", ".mkv", ".gif"]
|
||||
|
||||
def calculate_frame_delay(self) -> int:
|
||||
"""Calculate frame delay in milliseconds based on playback speed"""
|
||||
if not self.is_playing:
|
||||
return 0 # No delay when paused
|
||||
|
||||
# Base delay for 30 FPS, adjusted by playback speed
|
||||
delay_ms = int(self.BASE_FRAME_DELAY_MS / self.playback_speed)
|
||||
return max(1, delay_ms) # Minimum 1ms delay
|
||||
|
||||
def calculate_frames_to_skip(self) -> int:
|
||||
"""Calculate how many frames to skip for high-speed playback"""
|
||||
if self.playback_speed <= 1.0:
|
||||
return 0
|
||||
elif self.playback_speed <= 2.0:
|
||||
return 0 # No skipping for moderate speeds
|
||||
elif self.playback_speed <= 5.0:
|
||||
return int(self.playback_speed - 1) # Skip some frames
|
||||
else:
|
||||
return int(self.playback_speed * 2) # Skip many frames for very high speeds
|
||||
|
||||
def load_media(self, file_path: Path) -> bool:
|
||||
"""Load media file for display"""
|
||||
if self.current_cap:
|
||||
@@ -107,6 +129,10 @@ class MediaGrader:
|
||||
if not self.current_cap:
|
||||
return None
|
||||
|
||||
# For high-speed playback, skip frames
|
||||
frames_to_skip = self.calculate_frames_to_skip()
|
||||
|
||||
for _ in range(frames_to_skip + 1): # +1 to read at least one frame
|
||||
ret, frame = self.current_cap.read()
|
||||
if not ret:
|
||||
return False, None
|
||||
@@ -125,8 +151,12 @@ class MediaGrader:
|
||||
height, width = frame.shape[:2]
|
||||
|
||||
# Calculate scaling factor to fit within max dimensions
|
||||
scale_w = self.WINDOW_MAX_WIDTH / width if width > self.WINDOW_MAX_WIDTH else 1.0
|
||||
scale_h = self.WINDOW_MAX_HEIGHT / height if height > self.WINDOW_MAX_HEIGHT else 1.0
|
||||
scale_w = (
|
||||
self.WINDOW_MAX_WIDTH / width if width > self.WINDOW_MAX_WIDTH else 1.0
|
||||
)
|
||||
scale_h = (
|
||||
self.WINDOW_MAX_HEIGHT / height if height > self.WINDOW_MAX_HEIGHT else 1.0
|
||||
)
|
||||
scale = min(scale_w, scale_h)
|
||||
|
||||
# Don't scale up small images too much
|
||||
@@ -136,14 +166,18 @@ class MediaGrader:
|
||||
new_width = int(width * scale)
|
||||
new_height = int(height * scale)
|
||||
|
||||
cv2.resizeWindow('Media Grader', new_width, new_height)
|
||||
cv2.resizeWindow("Media Grader", new_width, new_height)
|
||||
|
||||
def seek_video(self, frames_delta: int):
|
||||
"""Seek video by specified number of frames"""
|
||||
if not self.current_cap or not self.is_video(self.media_files[self.current_index]):
|
||||
if not self.current_cap or not self.is_video(
|
||||
self.media_files[self.current_index]
|
||||
):
|
||||
return
|
||||
|
||||
new_frame = max(0, min(self.current_frame + frames_delta, self.total_frames - 1))
|
||||
new_frame = max(
|
||||
0, min(self.current_frame + frames_delta, self.total_frames - 1)
|
||||
)
|
||||
|
||||
if self.snap_to_iframe and frames_delta < 0:
|
||||
# Find previous I-frame (approximation)
|
||||
@@ -151,6 +185,7 @@ class MediaGrader:
|
||||
|
||||
self.current_cap.set(cv2.CAP_PROP_POS_FRAMES, new_frame)
|
||||
self.current_frame = new_frame
|
||||
print(f"Seeked by {frames_delta} frames to frame {new_frame}")
|
||||
|
||||
def handle_seeking_key(self, key: int) -> bool:
|
||||
"""Handle seeking keys with different granularities. Returns True if key was handled."""
|
||||
@@ -158,30 +193,53 @@ class MediaGrader:
|
||||
|
||||
# Determine seek amount based on key and timing
|
||||
seek_amount = 0
|
||||
is_arrow_key = False
|
||||
|
||||
# Try different arrow key detection methods
|
||||
if key == 2424832 or key == 81: # Left arrow (different systems)
|
||||
if self.last_key == key and (current_time - self.last_key_time) < self.KEY_REPEAT_THRESHOLD_SEC:
|
||||
seek_amount = -self.fast_seek_frames
|
||||
else:
|
||||
seek_amount = -self.coarse_seek_frames
|
||||
elif key == 2555904 or key == 83: # Right arrow (different systems)
|
||||
if self.last_key == key and (current_time - self.last_key_time) < self.KEY_REPEAT_THRESHOLD_SEC:
|
||||
seek_amount = self.fast_seek_frames
|
||||
else:
|
||||
seek_amount = self.coarse_seek_frames
|
||||
elif key == ord(','): # Comma - fine seek backward
|
||||
if key == ord("a"): # Left arrow (various systems)
|
||||
is_arrow_key = True
|
||||
direction = -1
|
||||
elif key == ord("d"): # Right arrow (various systems)
|
||||
is_arrow_key = True
|
||||
direction = 1
|
||||
elif key == ord(","): # Comma - fine seek backward
|
||||
seek_amount = -self.fine_seek_frames
|
||||
elif key == ord('.'): # Period - fine seek forward
|
||||
elif key == ord("."): # Period - fine seek forward
|
||||
seek_amount = self.fine_seek_frames
|
||||
else:
|
||||
return False
|
||||
|
||||
self.seek_video(seek_amount)
|
||||
if is_arrow_key:
|
||||
# Track key press timing for fast seek detection
|
||||
if self.last_key != key:
|
||||
# New key press
|
||||
self.key_first_press_time = current_time
|
||||
self.last_key = key
|
||||
seek_amount = direction * self.coarse_seek_frames
|
||||
else:
|
||||
# Repeated key press
|
||||
time_held = current_time - self.key_first_press_time
|
||||
time_since_last = current_time - self.last_key_time
|
||||
|
||||
print(
|
||||
f"Key held for {time_held:.2f}s, since last: {time_since_last:.2f}s"
|
||||
)
|
||||
|
||||
if time_held > self.FAST_SEEK_ACTIVATION_TIME:
|
||||
# Fast seek mode
|
||||
seek_amount = direction * self.fast_seek_frames
|
||||
print(f"FAST SEEK: {seek_amount} frames")
|
||||
else:
|
||||
# Normal seek
|
||||
seek_amount = direction * self.coarse_seek_frames
|
||||
|
||||
if seek_amount != 0:
|
||||
self.seek_video(seek_amount)
|
||||
self.last_key_time = current_time
|
||||
return True
|
||||
|
||||
return False
|
||||
|
||||
def grade_media(self, grade: int):
|
||||
"""Move current media file to grade directory"""
|
||||
if not self.media_files or grade < 1 or grade > 5:
|
||||
@@ -230,7 +288,7 @@ class MediaGrader:
|
||||
print(f"Found {len(self.media_files)} media files")
|
||||
print("Controls:")
|
||||
print(" Space: Pause/Play")
|
||||
print(" Left/Right: Seek backward/forward (accelerates on repeat)")
|
||||
print(" Left/Right: Seek backward/forward (hold for FAST seek)")
|
||||
print(" , / . : Frame-by-frame seek (fine control)")
|
||||
print(" A/D: Decrease/Increase playback speed")
|
||||
print(" 1-5: Grade and move file")
|
||||
@@ -238,7 +296,7 @@ class MediaGrader:
|
||||
print(" P: Previous file")
|
||||
print(" Q/ESC: Quit")
|
||||
|
||||
cv2.namedWindow('Media Grader', cv2.WINDOW_NORMAL)
|
||||
cv2.namedWindow("Media Grader", cv2.WINDOW_NORMAL)
|
||||
|
||||
while self.media_files and self.current_index < len(self.media_files):
|
||||
current_file = self.media_files[self.current_index]
|
||||
@@ -249,13 +307,12 @@ class MediaGrader:
|
||||
continue
|
||||
|
||||
window_title = f"Media Grader - {current_file.name} ({self.current_index + 1}/{len(self.media_files)})"
|
||||
cv2.setWindowTitle('Media Grader', window_title)
|
||||
cv2.setWindowTitle("Media Grader", window_title)
|
||||
|
||||
window_resized = False
|
||||
|
||||
while True:
|
||||
# Only advance frame if playing (for videos)
|
||||
if self.is_playing or not self.is_video(current_file):
|
||||
# Always try to get and display a frame (for seeking while paused)
|
||||
result = self.display_media(current_file)
|
||||
if result is None or not result[0]:
|
||||
break
|
||||
@@ -269,18 +326,58 @@ class MediaGrader:
|
||||
|
||||
# Add info overlay
|
||||
info_text = f"Speed: {self.playback_speed:.1f}x | Frame: {self.current_frame}/{self.total_frames} | File: {self.current_index + 1}/{len(self.media_files)}"
|
||||
help_text = "Seek: ←→ (accel) ,. (fine) | A/D speed | 1-5 grade | Space pause | Q quit"
|
||||
help_text = "Seek: ←→ (hold=FAST) ,. (fine) | A/D speed | 1-5 grade | Space pause | Q quit"
|
||||
|
||||
# White background for text visibility
|
||||
cv2.putText(frame, info_text, (10, 30), cv2.FONT_HERSHEY_SIMPLEX, 0.7, (255, 255, 255), 2)
|
||||
cv2.putText(frame, info_text, (10, 30), cv2.FONT_HERSHEY_SIMPLEX, 0.7, (0, 0, 0), 1)
|
||||
cv2.putText(frame, help_text, (10, 60), cv2.FONT_HERSHEY_SIMPLEX, 0.5, (255, 255, 255), 2)
|
||||
cv2.putText(frame, help_text, (10, 60), cv2.FONT_HERSHEY_SIMPLEX, 0.5, (0, 0, 0), 1)
|
||||
cv2.putText(
|
||||
frame,
|
||||
info_text,
|
||||
(10, 30),
|
||||
cv2.FONT_HERSHEY_SIMPLEX,
|
||||
0.7,
|
||||
(255, 255, 255),
|
||||
2,
|
||||
)
|
||||
cv2.putText(
|
||||
frame,
|
||||
info_text,
|
||||
(10, 30),
|
||||
cv2.FONT_HERSHEY_SIMPLEX,
|
||||
0.7,
|
||||
(0, 0, 0),
|
||||
1,
|
||||
)
|
||||
cv2.putText(
|
||||
frame,
|
||||
help_text,
|
||||
(10, 60),
|
||||
cv2.FONT_HERSHEY_SIMPLEX,
|
||||
0.5,
|
||||
(255, 255, 255),
|
||||
2,
|
||||
)
|
||||
cv2.putText(
|
||||
frame,
|
||||
help_text,
|
||||
(10, 60),
|
||||
cv2.FONT_HERSHEY_SIMPLEX,
|
||||
0.5,
|
||||
(0, 0, 0),
|
||||
1,
|
||||
)
|
||||
|
||||
cv2.imshow('Media Grader', frame)
|
||||
cv2.imshow("Media Grader", frame)
|
||||
|
||||
# Calculate appropriate delay
|
||||
delay = self.calculate_frame_delay() if self.is_video(current_file) else self.IMAGE_DISPLAY_DELAY_MS
|
||||
# Calculate appropriate delay - shorter for paused videos to enable seeking
|
||||
if self.is_video(current_file):
|
||||
if self.is_playing:
|
||||
delay = self.calculate_frame_delay()
|
||||
else:
|
||||
delay = (
|
||||
30 # Short delay when paused to enable responsive seeking
|
||||
)
|
||||
else:
|
||||
delay = self.IMAGE_DISPLAY_DELAY_MS
|
||||
|
||||
key = cv2.waitKey(delay) & 0xFF
|
||||
|
||||
@@ -288,29 +385,49 @@ class MediaGrader:
|
||||
if key != 255: # 255 means no key pressed
|
||||
print(f"Key pressed: {key}")
|
||||
|
||||
if key == ord('q') or key == 27: # Q or ESC
|
||||
if key == ord("q") or key == 27: # Q or ESC
|
||||
return
|
||||
elif key == ord(' '): # Space - pause/play
|
||||
elif key == ord(" "): # Space - pause/play
|
||||
self.is_playing = not self.is_playing
|
||||
elif key == ord('a'): # A - decrease speed
|
||||
self.playback_speed = max(self.MIN_PLAYBACK_SPEED, self.playback_speed - self.SPEED_INCREMENT)
|
||||
elif key == ord('d'): # D - increase speed
|
||||
self.playback_speed = min(self.MAX_PLAYBACK_SPEED, self.playback_speed + self.SPEED_INCREMENT)
|
||||
print(f"{'Playing' if self.is_playing else 'Paused'}")
|
||||
elif key == ord("w"): # A - decrease speed
|
||||
self.playback_speed = max(
|
||||
self.MIN_PLAYBACK_SPEED,
|
||||
self.playback_speed - self.SPEED_INCREMENT,
|
||||
)
|
||||
print(f"Speed: {self.playback_speed:.1f}x")
|
||||
elif key == ord("s"): # D - increase speed
|
||||
self.playback_speed = min(
|
||||
self.MAX_PLAYBACK_SPEED,
|
||||
self.playback_speed + self.SPEED_INCREMENT,
|
||||
)
|
||||
print(f"Speed: {self.playback_speed:.1f}x")
|
||||
elif self.handle_seeking_key(key):
|
||||
# Seeking was handled
|
||||
pass
|
||||
elif key == ord('n'): # Next file
|
||||
elif key == ord("n"): # Next file
|
||||
break
|
||||
elif key == ord('p'): # Previous file
|
||||
elif key == ord("p"): # Previous file
|
||||
self.current_index = max(0, self.current_index - 1)
|
||||
break
|
||||
elif key in [ord('1'), ord('2'), ord('3'), ord('4'), ord('5')]: # Grade
|
||||
elif key in [ord("1"), ord("2"), ord("3"), ord("4"), ord("5")]: # Grade
|
||||
grade = int(chr(key))
|
||||
if not self.grade_media(grade):
|
||||
return
|
||||
break
|
||||
elif key == 255: # No key pressed
|
||||
# Reset key tracking if no key is pressed
|
||||
if self.last_key is not None:
|
||||
self.last_key = None
|
||||
print("Key released")
|
||||
|
||||
if key not in [ord('p')]: # Don't increment for previous
|
||||
# Only advance to next frame if playing AND it's a video
|
||||
if not self.is_playing and self.is_video(current_file):
|
||||
# When paused, seek back one frame to stay on current frame
|
||||
# (since display_media already advanced us)
|
||||
continue
|
||||
|
||||
if key not in [ord("p")]: # Don't increment for previous
|
||||
self.current_index += 1
|
||||
|
||||
if self.current_cap:
|
||||
@@ -321,10 +438,26 @@ class MediaGrader:
|
||||
|
||||
|
||||
def main():
|
||||
parser = argparse.ArgumentParser(description='Media Grader - Grade media files by moving them to numbered folders')
|
||||
parser.add_argument('directory', nargs='?', default='.', help='Directory to scan for media files (default: current directory)')
|
||||
parser.add_argument('--seek-frames', type=int, default=30, help='Number of frames to seek when using arrow keys (default: 30)')
|
||||
parser.add_argument('--snap-to-iframe', action='store_true', help='Snap to I-frames when seeking backward for better performance')
|
||||
parser = argparse.ArgumentParser(
|
||||
description="Media Grader - Grade media files by moving them to numbered folders"
|
||||
)
|
||||
parser.add_argument(
|
||||
"directory",
|
||||
nargs="?",
|
||||
default=".",
|
||||
help="Directory to scan for media files (default: current directory)",
|
||||
)
|
||||
parser.add_argument(
|
||||
"--seek-frames",
|
||||
type=int,
|
||||
default=30,
|
||||
help="Number of frames to seek when using arrow keys (default: 30)",
|
||||
)
|
||||
parser.add_argument(
|
||||
"--snap-to-iframe",
|
||||
action="store_true",
|
||||
help="Snap to I-frames when seeking backward for better performance",
|
||||
)
|
||||
|
||||
args = parser.parse_args()
|
||||
|
||||
|
Reference in New Issue
Block a user