feat(main.py): enhance seeking and playback controls for improved user experience

This commit is contained in:
2025-08-18 16:33:50 +02:00
parent 0a048d3078
commit e2758b5390

241
main.py
View File

@@ -8,22 +8,26 @@ import time
from pathlib import Path
from typing import List, Tuple, Optional
class MediaGrader:
# Configuration constants
DEFAULT_FPS = 30
BASE_FRAME_DELAY_MS = 33 # ~30 FPS
KEY_REPEAT_THRESHOLD_SEC = 0.5
KEY_REPEAT_THRESHOLD_SEC = 0.2 # Faster detection for repeat
FAST_SEEK_ACTIVATION_TIME = 0.5 # How long to hold before fast seek
WINDOW_MAX_WIDTH = 1200
WINDOW_MAX_HEIGHT = 800
WINDOW_MAX_SCALE_UP = 2.0
SPEED_INCREMENT = 0.1
MIN_PLAYBACK_SPEED = 0.1
MAX_PLAYBACK_SPEED = 100.0
FAST_SEEK_MULTIPLIER = 500
FAST_SEEK_MULTIPLIER = 5
IFRAME_SNAP_INTERVAL = 30
IMAGE_DISPLAY_DELAY_MS = 100
def __init__(self, directory: str, seek_frames: int = 30, snap_to_iframe: bool = False):
def __init__(
self, directory: str, seek_frames: int = 30, snap_to_iframe: bool = False
):
self.directory = Path(directory)
self.seek_frames = seek_frames
self.snap_to_iframe = snap_to_iframe
@@ -38,6 +42,7 @@ class MediaGrader:
# Key repeat tracking
self.last_key_time = 0
self.last_key = None
self.key_first_press_time = 0
# Seeking modes
self.fine_seek_frames = 1 # Frame-by-frame
@@ -45,7 +50,16 @@ class MediaGrader:
self.fast_seek_frames = self.seek_frames * self.FAST_SEEK_MULTIPLIER
# Supported media extensions
self.extensions = ['*.png', '*.jpg', '*.jpeg', '*.gif', '*.mp4', '*.avi', '*.mov', '*.mkv']
self.extensions = [
"*.png",
"*.jpg",
"*.jpeg",
"*.gif",
"*.mp4",
"*.avi",
"*.mov",
"*.mkv",
]
# Create grade directories
for i in range(1, 6):
@@ -64,24 +78,32 @@ class MediaGrader:
filtered_files = []
for file in media_files:
# Check if file is not in a grade directory (1-5)
if not any(part in ['1', '2', '3', '4', '5'] for part in file.parts):
if not any(part in ["1", "2", "3", "4", "5"] for part in file.parts):
filtered_files.append(file)
return sorted(filtered_files)
def is_video(self, file_path: Path) -> bool:
    """Report whether ``file_path`` has one of the video extensions.

    The suffix is lower-cased before comparison, so the check is
    case-insensitive. ``.gif`` is counted as a video here.

    Args:
        file_path: Path whose suffix is inspected.

    Returns:
        True if the suffix is .mp4, .avi, .mov, .mkv or .gif; False otherwise.
    """
    video_suffixes = (".mp4", ".avi", ".mov", ".mkv", ".gif")
    return file_path.suffix.lower() in video_suffixes
def calculate_frame_delay(self) -> int:
    """Return the per-frame wait in milliseconds for the current state.

    Returns:
        0 while paused. While playing, ``BASE_FRAME_DELAY_MS`` divided by
        ``playback_speed``, truncated to an int and never less than 1.
    """
    if self.is_playing:
        # Higher playback speed means a proportionally shorter wait.
        scaled_ms = int(self.BASE_FRAME_DELAY_MS / self.playback_speed)
        # Clamp so very high speeds never produce a zero delay.
        return scaled_ms if scaled_ms > 1 else 1
    # NOTE(review): if this value is passed to cv2.waitKey, 0 means
    # "wait indefinitely for a key" rather than "no delay" - confirm callers.
    return 0
def calculate_frames_to_skip(self) -> int:
    """Return how many frames to drop per displayed frame at the current speed.

    Returns:
        0 for speeds up to and including 2.0;
        ``int(speed - 1)`` for speeds above 2.0 up to and including 5.0;
        ``int(speed * 2)`` for anything faster.
    """
    speed = self.playback_speed
    if speed <= 2.0:
        # Normal and moderate speeds show every frame.
        return 0
    if speed <= 5.0:
        # Drop a few frames per displayed frame.
        return int(speed - 1)
    # Very high speeds drop frames aggressively.
    return int(speed * 2)
def load_media(self, file_path: Path) -> bool:
"""Load media file for display"""
if self.current_cap:
@@ -107,6 +129,10 @@ class MediaGrader:
if not self.current_cap:
return None
# For high-speed playback, skip frames
frames_to_skip = self.calculate_frames_to_skip()
for _ in range(frames_to_skip + 1): # +1 to read at least one frame
ret, frame = self.current_cap.read()
if not ret:
return False, None
@@ -125,8 +151,12 @@ class MediaGrader:
height, width = frame.shape[:2]
# Calculate scaling factor to fit within max dimensions
scale_w = self.WINDOW_MAX_WIDTH / width if width > self.WINDOW_MAX_WIDTH else 1.0
scale_h = self.WINDOW_MAX_HEIGHT / height if height > self.WINDOW_MAX_HEIGHT else 1.0
scale_w = (
self.WINDOW_MAX_WIDTH / width if width > self.WINDOW_MAX_WIDTH else 1.0
)
scale_h = (
self.WINDOW_MAX_HEIGHT / height if height > self.WINDOW_MAX_HEIGHT else 1.0
)
scale = min(scale_w, scale_h)
# Don't scale up small images too much
@@ -136,14 +166,18 @@ class MediaGrader:
new_width = int(width * scale)
new_height = int(height * scale)
cv2.resizeWindow('Media Grader', new_width, new_height)
cv2.resizeWindow("Media Grader", new_width, new_height)
def seek_video(self, frames_delta: int):
"""Seek video by specified number of frames"""
if not self.current_cap or not self.is_video(self.media_files[self.current_index]):
if not self.current_cap or not self.is_video(
self.media_files[self.current_index]
):
return
new_frame = max(0, min(self.current_frame + frames_delta, self.total_frames - 1))
new_frame = max(
0, min(self.current_frame + frames_delta, self.total_frames - 1)
)
if self.snap_to_iframe and frames_delta < 0:
# Find previous I-frame (approximation)
@@ -151,6 +185,7 @@ class MediaGrader:
self.current_cap.set(cv2.CAP_PROP_POS_FRAMES, new_frame)
self.current_frame = new_frame
print(f"Seeked by {frames_delta} frames to frame {new_frame}")
def handle_seeking_key(self, key: int) -> bool:
"""Handle seeking keys with different granularities. Returns True if key was handled."""
@@ -158,30 +193,53 @@ class MediaGrader:
# Determine seek amount based on key and timing
seek_amount = 0
is_arrow_key = False
# Try different arrow key detection methods
if key == 2424832 or key == 81: # Left arrow (different systems)
if self.last_key == key and (current_time - self.last_key_time) < self.KEY_REPEAT_THRESHOLD_SEC:
seek_amount = -self.fast_seek_frames
else:
seek_amount = -self.coarse_seek_frames
elif key == 2555904 or key == 83: # Right arrow (different systems)
if self.last_key == key and (current_time - self.last_key_time) < self.KEY_REPEAT_THRESHOLD_SEC:
seek_amount = self.fast_seek_frames
else:
seek_amount = self.coarse_seek_frames
elif key == ord(','): # Comma - fine seek backward
if key == ord("a"): # A key - seek backward (hold for fast seek)
is_arrow_key = True
direction = -1
elif key == ord("d"): # D key - seek forward (hold for fast seek)
is_arrow_key = True
direction = 1
elif key == ord(","): # Comma - fine seek backward
seek_amount = -self.fine_seek_frames
elif key == ord('.'): # Period - fine seek forward
elif key == ord("."): # Period - fine seek forward
seek_amount = self.fine_seek_frames
else:
return False
self.seek_video(seek_amount)
if is_arrow_key:
# Track key press timing for fast seek detection
if self.last_key != key:
# New key press
self.key_first_press_time = current_time
self.last_key = key
seek_amount = direction * self.coarse_seek_frames
else:
# Repeated key press
time_held = current_time - self.key_first_press_time
time_since_last = current_time - self.last_key_time
print(
f"Key held for {time_held:.2f}s, since last: {time_since_last:.2f}s"
)
if time_held > self.FAST_SEEK_ACTIVATION_TIME:
# Fast seek mode
seek_amount = direction * self.fast_seek_frames
print(f"FAST SEEK: {seek_amount} frames")
else:
# Normal seek
seek_amount = direction * self.coarse_seek_frames
if seek_amount != 0:
self.seek_video(seek_amount)
self.last_key_time = current_time
return True
return False
def grade_media(self, grade: int):
"""Move current media file to grade directory"""
if not self.media_files or grade < 1 or grade > 5:
@@ -230,7 +288,7 @@ class MediaGrader:
print(f"Found {len(self.media_files)} media files")
print("Controls:")
print(" Space: Pause/Play")
print(" Left/Right: Seek backward/forward (accelerates on repeat)")
print(" Left/Right: Seek backward/forward (hold for FAST seek)")
print(" , / . : Frame-by-frame seek (fine control)")
print(" A/D: Decrease/Increase playback speed")
print(" 1-5: Grade and move file")
@@ -238,7 +296,7 @@ class MediaGrader:
print(" P: Previous file")
print(" Q/ESC: Quit")
cv2.namedWindow('Media Grader', cv2.WINDOW_NORMAL)
cv2.namedWindow("Media Grader", cv2.WINDOW_NORMAL)
while self.media_files and self.current_index < len(self.media_files):
current_file = self.media_files[self.current_index]
@@ -249,13 +307,12 @@ class MediaGrader:
continue
window_title = f"Media Grader - {current_file.name} ({self.current_index + 1}/{len(self.media_files)})"
cv2.setWindowTitle('Media Grader', window_title)
cv2.setWindowTitle("Media Grader", window_title)
window_resized = False
while True:
# Only advance frame if playing (for videos)
if self.is_playing or not self.is_video(current_file):
# Always try to get and display a frame (for seeking while paused)
result = self.display_media(current_file)
if result is None or not result[0]:
break
@@ -269,18 +326,58 @@ class MediaGrader:
# Add info overlay
info_text = f"Speed: {self.playback_speed:.1f}x | Frame: {self.current_frame}/{self.total_frames} | File: {self.current_index + 1}/{len(self.media_files)}"
help_text = "Seek: ←→ (accel) ,. (fine) | A/D speed | 1-5 grade | Space pause | Q quit"
help_text = "Seek: ←→ (hold=FAST) ,. (fine) | A/D speed | 1-5 grade | Space pause | Q quit"
# White background for text visibility
cv2.putText(frame, info_text, (10, 30), cv2.FONT_HERSHEY_SIMPLEX, 0.7, (255, 255, 255), 2)
cv2.putText(frame, info_text, (10, 30), cv2.FONT_HERSHEY_SIMPLEX, 0.7, (0, 0, 0), 1)
cv2.putText(frame, help_text, (10, 60), cv2.FONT_HERSHEY_SIMPLEX, 0.5, (255, 255, 255), 2)
cv2.putText(frame, help_text, (10, 60), cv2.FONT_HERSHEY_SIMPLEX, 0.5, (0, 0, 0), 1)
cv2.putText(
frame,
info_text,
(10, 30),
cv2.FONT_HERSHEY_SIMPLEX,
0.7,
(255, 255, 255),
2,
)
cv2.putText(
frame,
info_text,
(10, 30),
cv2.FONT_HERSHEY_SIMPLEX,
0.7,
(0, 0, 0),
1,
)
cv2.putText(
frame,
help_text,
(10, 60),
cv2.FONT_HERSHEY_SIMPLEX,
0.5,
(255, 255, 255),
2,
)
cv2.putText(
frame,
help_text,
(10, 60),
cv2.FONT_HERSHEY_SIMPLEX,
0.5,
(0, 0, 0),
1,
)
cv2.imshow('Media Grader', frame)
cv2.imshow("Media Grader", frame)
# Calculate appropriate delay
delay = self.calculate_frame_delay() if self.is_video(current_file) else self.IMAGE_DISPLAY_DELAY_MS
# Calculate appropriate delay - shorter for paused videos to enable seeking
if self.is_video(current_file):
if self.is_playing:
delay = self.calculate_frame_delay()
else:
delay = (
30 # Short delay when paused to enable responsive seeking
)
else:
delay = self.IMAGE_DISPLAY_DELAY_MS
key = cv2.waitKey(delay) & 0xFF
@@ -288,29 +385,49 @@ class MediaGrader:
if key != 255: # 255 means no key pressed
print(f"Key pressed: {key}")
if key == ord('q') or key == 27: # Q or ESC
if key == ord("q") or key == 27: # Q or ESC
return
elif key == ord(' '): # Space - pause/play
elif key == ord(" "): # Space - pause/play
self.is_playing = not self.is_playing
elif key == ord('a'): # A - decrease speed
self.playback_speed = max(self.MIN_PLAYBACK_SPEED, self.playback_speed - self.SPEED_INCREMENT)
elif key == ord('d'): # D - increase speed
self.playback_speed = min(self.MAX_PLAYBACK_SPEED, self.playback_speed + self.SPEED_INCREMENT)
print(f"{'Playing' if self.is_playing else 'Paused'}")
elif key == ord("w"): # W - decrease speed
self.playback_speed = max(
self.MIN_PLAYBACK_SPEED,
self.playback_speed - self.SPEED_INCREMENT,
)
print(f"Speed: {self.playback_speed:.1f}x")
elif key == ord("s"): # S - increase speed
self.playback_speed = min(
self.MAX_PLAYBACK_SPEED,
self.playback_speed + self.SPEED_INCREMENT,
)
print(f"Speed: {self.playback_speed:.1f}x")
elif self.handle_seeking_key(key):
# Seeking was handled
pass
elif key == ord('n'): # Next file
elif key == ord("n"): # Next file
break
elif key == ord('p'): # Previous file
elif key == ord("p"): # Previous file
self.current_index = max(0, self.current_index - 1)
break
elif key in [ord('1'), ord('2'), ord('3'), ord('4'), ord('5')]: # Grade
elif key in [ord("1"), ord("2"), ord("3"), ord("4"), ord("5")]: # Grade
grade = int(chr(key))
if not self.grade_media(grade):
return
break
elif key == 255: # No key pressed
# Reset key tracking if no key is pressed
if self.last_key is not None:
self.last_key = None
print("Key released")
if key not in [ord('p')]: # Don't increment for previous
# Only advance to next frame if playing AND it's a video
if not self.is_playing and self.is_video(current_file):
# When paused, seek back one frame to stay on current frame
# (since display_media already advanced us)
continue
if key not in [ord("p")]: # Don't increment for previous
self.current_index += 1
if self.current_cap:
@@ -321,10 +438,26 @@ class MediaGrader:
def main():
parser = argparse.ArgumentParser(description='Media Grader - Grade media files by moving them to numbered folders')
parser.add_argument('directory', nargs='?', default='.', help='Directory to scan for media files (default: current directory)')
parser.add_argument('--seek-frames', type=int, default=30, help='Number of frames to seek when using arrow keys (default: 30)')
parser.add_argument('--snap-to-iframe', action='store_true', help='Snap to I-frames when seeking backward for better performance')
parser = argparse.ArgumentParser(
description="Media Grader - Grade media files by moving them to numbered folders"
)
parser.add_argument(
"directory",
nargs="?",
default=".",
help="Directory to scan for media files (default: current directory)",
)
parser.add_argument(
"--seek-frames",
type=int,
default=30,
help="Number of frames to seek when using arrow keys (default: 30)",
)
parser.add_argument(
"--snap-to-iframe",
action="store_true",
help="Snap to I-frames when seeking backward for better performance",
)
args = parser.parse_args()