Update transcode_bench.py

This commit is contained in:
2025-10-12 20:17:52 +13:00
parent 4b245ee5bd
commit 084f3d381e

View File

@@ -19,37 +19,100 @@ class HardwareAcceleration:
"""Detect and configure hardware acceleration."""
@staticmethod
def detect() -> Tuple[str, str, str]:
def detect(debug=False) -> Tuple[str, str, str, bool]:
"""
Detect available hardware acceleration.
Returns: (name, encoder, hwaccel_args)
Returns: (name, encoder, hwaccel_args, hw_decode_supported)
"""
warnings = []
if debug:
print("\n=== Hardware Detection Debug ===")
# Check NVIDIA NVENC
if HardwareAcceleration._test_hardware('h264_nvenc', '-hwaccel cuda -hwaccel_output_format cuda'):
return ('NVIDIA NVENC', 'h264_nvenc', '-hwaccel cuda -hwaccel_output_format cuda')
if debug:
print("Testing NVIDIA NVENC...", end=' ')
result = HardwareAcceleration._test_hardware('h264_nvenc', '-hwaccel cuda -hwaccel_output_format cuda', debug)
if result[0]:
if debug:
print("")
return ('NVIDIA NVENC', 'h264_nvenc', '-hwaccel cuda -hwaccel_output_format cuda', True)
if debug:
print("" if result[1] else "not available")
if result[1]:
warnings.append(result[1])
# Check Intel QSV
if HardwareAcceleration._test_hardware('h264_qsv', '-hwaccel qsv -hwaccel_output_format qsv'):
return ('Intel Quick Sync', 'h264_qsv', '-hwaccel qsv -hwaccel_output_format qsv')
if debug:
print("Testing Intel QSV...", end=' ')
result = HardwareAcceleration._test_hardware('h264_qsv', '-hwaccel qsv -hwaccel_output_format qsv', debug)
if result[0]:
if debug:
print("")
return ('Intel Quick Sync', 'h264_qsv', '-hwaccel qsv -hwaccel_output_format qsv', True)
if debug:
print("" if result[1] else "not available")
if result[1]:
warnings.append(result[1])
# Check AMD AMF (Windows/Linux)
if HardwareAcceleration._test_hardware('h264_amf', ''):
return ('AMD AMF', 'h264_amf', '')
if debug:
print("Testing AMD AMF...", end=' ')
result = HardwareAcceleration._test_hardware('h264_amf', '', debug)
if result[0]:
if debug:
print("")
return ('AMD AMF', 'h264_amf', '', True)
if debug:
print("" if result[1] else "not available")
if result[1]:
warnings.append(result[1])
# Check VideoToolbox (macOS/iOS - ARM)
if HardwareAcceleration._test_hardware('h264_videotoolbox', '-hwaccel videotoolbox'):
return ('VideoToolbox', 'h264_videotoolbox', '-hwaccel videotoolbox')
if debug:
print("Testing VideoToolbox...", end=' ')
result = HardwareAcceleration._test_hardware('h264_videotoolbox', '-hwaccel videotoolbox', debug)
if result[0]:
if debug:
print("")
return ('VideoToolbox', 'h264_videotoolbox', '-hwaccel videotoolbox', True)
if debug:
print("" if result[1] else "not available")
if result[1]:
warnings.append(result[1])
# Check VA-API (Linux Intel/AMD)
if HardwareAcceleration._test_hardware('h264_vaapi', '-hwaccel vaapi -hwaccel_output_format vaapi -hwaccel_device /dev/dri/renderD128'):
return ('VA-API', 'h264_vaapi', '-hwaccel vaapi -hwaccel_output_format vaapi -hwaccel_device /dev/dri/renderD128')
if debug:
print("Testing VA-API...", end=' ')
result = HardwareAcceleration._test_vaapi(debug)
if result[0]:
if debug:
print("")
return (result[1], result[2], result[3], result[4]) # return (name, encoder, hwaccel_args, hw_decode)
if debug:
print("" if result[1] else "not available")
if result[1]:
warnings.append(result[1])
if debug:
print("=== End Debug ===\n")
# Print warnings if we fell back to software
if warnings:
print("\nNote: Hardware acceleration not available:")
for warning in warnings:
print(f" - {warning}")
print()
# Fallback to software
return ('Software (libx264)', 'libx264', '')
return ('Software (libx264)', 'libx264', '', False)
@staticmethod
def _test_hardware(encoder: str, hwaccel_args: str) -> bool:
"""Test if hardware encoder is actually available by attempting to use it."""
def _test_hardware(encoder: str, hwaccel_args: str, debug=False) -> Tuple[bool, Optional[str]]:
"""
Test if hardware encoder is actually available by attempting to use it.
Returns: (success, warning_message)
"""
try:
# Build a quick test encode command
cmd = ['ffmpeg', '-y', '-hide_banner', '-loglevel', 'error']
@@ -73,9 +136,155 @@ class HardwareAcceleration:
capture_output=True,
timeout=10
)
return result.returncode == 0
except (subprocess.TimeoutExpired, FileNotFoundError, Exception):
return False
if debug and result.returncode != 0:
print(f"\n Error: {result.stderr.decode() if result.stderr else 'Unknown error'}")
return (result.returncode == 0, None)
except (subprocess.TimeoutExpired, FileNotFoundError, Exception) as e:
if debug:
print(f"\n Exception: {e}")
return (False, None)
@staticmethod
def _test_vaapi(debug=False) -> Tuple:
"""
Test VA-API with better error handling and permission checks.
Returns: (name, encoder, hwaccel_args) if success or (False, warning, '')
"""
# Check if VA-API encoder is available in FFmpeg
try:
result = subprocess.run(
['ffmpeg', '-hide_banner', '-encoders'],
capture_output=True,
text=True,
timeout=5
)
if 'h264_vaapi' not in result.stdout:
if debug:
print("\n h264_vaapi encoder not found in FFmpeg")
return (False, None, '')
except Exception as e:
if debug:
print(f"\n Error checking encoders: {e}")
return (False, None, '')
# Check for /dev/dri devices
dri_devices = []
try:
dri_path = Path('/dev/dri')
if dri_path.exists():
dri_devices = sorted([str(d) for d in dri_path.glob('renderD*')])
except Exception as e:
if debug:
print(f"\n Error checking /dev/dri: {e}")
pass
if not dri_devices:
if debug:
print("\n No /dev/dri/renderD* devices found")
return (False, None, '')
# Check permissions on first device
device = dri_devices[0]
if debug:
print(f"\n Found device: {device}")
print(f" Can read: {os.access(device, os.R_OK)}")
print(f" Can write: {os.access(device, os.W_OK)}")
print(f" Process groups: {os.getgroups()}")
if not os.access(device, os.R_OK | os.W_OK):
return (False,
f"VA-API device {device} exists but not accessible. Run: sudo usermod -a -G render $USER (then logout/login)",
'')
# Test VA-API for both encoding and decoding
try:
with tempfile.NamedTemporaryFile(suffix='.mp4', delete=False) as f:
test_video = f.name
if debug:
print(f" Creating test video for VA-API...")
# First create a small H.264 test video using software encoding
cmd1 = [
'ffmpeg', '-y', '-hide_banner', '-loglevel', 'error',
'-f', 'lavfi',
'-i', 'testsrc2=size=1920x1080:duration=0.1:rate=1',
'-frames:v', '2',
'-c:v', 'libx264',
'-preset', 'ultrafast',
test_video
]
result1 = subprocess.run(cmd1, capture_output=True, timeout=5)
if debug:
print(f" Test video creation: {'success' if result1.returncode == 0 else 'failed'}")
if result1.returncode != 0:
print(f" Error: {result1.stderr.decode() if result1.stderr else 'Unknown'}")
if result1.returncode == 0:
# Test 1: HW decode + HW encode
if debug:
print(f" Testing VA-API HW decode + HW encode...")
cmd2 = [
'ffmpeg', '-y', '-hide_banner', '-loglevel', 'error',
'-vaapi_device', device,
'-hwaccel', 'vaapi',
'-hwaccel_output_format', 'vaapi',
'-i', test_video,
'-frames:v', '1',
'-c:v', 'h264_vaapi',
'-f', 'null',
'-' if os.name != 'nt' else 'NUL'
]
result2 = subprocess.run(cmd2, capture_output=True, timeout=5)
if debug:
print(f" HW decode + HW encode: {'success' if result2.returncode == 0 else 'failed'}")
if result2.returncode != 0:
print(f" Error: {result2.stderr.decode() if result2.stderr else 'Unknown'}")
# Test 2: SW decode + HW encode (fallback if HW decode doesn't work)
hw_decode_works = result2.returncode == 0
if not hw_decode_works:
if debug:
print(f" Testing VA-API SW decode + HW encode...")
cmd3 = [
'ffmpeg', '-y', '-hide_banner', '-loglevel', 'error',
'-vaapi_device', device,
'-i', test_video,
'-vf', 'format=nv12,hwupload',
'-frames:v', '1',
'-c:v', 'h264_vaapi',
'-f', 'null',
'-' if os.name != 'nt' else 'NUL'
]
result3 = subprocess.run(cmd3, capture_output=True, timeout=5)
if debug:
print(f" SW decode + HW encode: {'success' if result3.returncode == 0 else 'failed'}")
if result3.returncode != 0:
print(f" Error: {result3.stderr.decode() if result3.stderr else 'Unknown'}")
if result3.returncode == 0:
os.unlink(test_video)
return (True, 'VA-API (Intel/AMD) [SW decode + HW encode]', 'h264_vaapi',
f'-vaapi_device {device}', False)
os.unlink(test_video)
if hw_decode_works:
return (True, 'VA-API (Intel/AMD) [HW decode + HW encode]', 'h264_vaapi',
f'-vaapi_device {device} -hwaccel vaapi -hwaccel_output_format vaapi', True)
if os.path.exists(test_video):
os.unlink(test_video)
except Exception as e:
if debug:
print(f" Exception during VA-API test: {e}")
pass
return (False, None, '', '', False)
class TestVideo:
@@ -108,11 +317,12 @@ class TestVideo:
class TranscodeJob:
"""Represents a single transcode job."""
def __init__(self, input_file: str, output_file: str, encoder: str, hwaccel_args: str):
def __init__(self, input_file: str, output_file: str, encoder: str, hwaccel_args: str, hw_decode: bool):
self.input_file = input_file
self.output_file = output_file
self.encoder = encoder
self.hwaccel_args = hwaccel_args
self.hw_decode = hw_decode
self.process = None
self.start_time = None
self.end_time = None
@@ -125,12 +335,17 @@ class TranscodeJob:
# Build FFmpeg command
cmd = ['ffmpeg', '-y']
# Add hardware acceleration args
# Add hardware acceleration args (before input)
if self.hwaccel_args:
cmd.extend(self.hwaccel_args.split())
cmd.extend(['-i', self.input_file])
# For VA-API without HW decode, we need to upload to hardware
if 'vaapi' in self.encoder and not self.hw_decode:
cmd.extend(['-vf', 'format=nv12,hwupload'])
cmd.extend([
'-i', self.input_file,
'-c:v', self.encoder,
'-b:v', '4M',
'-c:a', 'aac',
@@ -175,11 +390,12 @@ class TranscodeJob:
class Benchmark:
"""Main benchmark orchestrator."""
def __init__(self, test_video: str, encoder: str, hwaccel_args: str, accel_name: str):
def __init__(self, test_video: str, encoder: str, hwaccel_args: str, accel_name: str, hw_decode: bool):
self.test_video = test_video
self.encoder = encoder
self.hwaccel_args = hwaccel_args
self.accel_name = accel_name
self.hw_decode = hw_decode
def run_parallel_transcodes(self, num_streams: int, timeout: int = 60) -> Tuple[bool, float]:
"""
@@ -192,7 +408,7 @@ class Benchmark:
# Create jobs
for i in range(num_streams):
output_file = f'/dev/null' if os.name != 'nt' else 'NUL'
job = TranscodeJob(self.test_video, output_file, self.encoder, self.hwaccel_args)
job = TranscodeJob(self.test_video, output_file, self.encoder, self.hwaccel_args, self.hw_decode)
jobs.append(job)
# Start all jobs in parallel
@@ -272,6 +488,11 @@ def main():
default=30.0,
help='Minimum FPS to consider real-time (default: 30.0)'
)
parser.add_argument(
'--debug',
action='store_true',
help='Enable debug output for hardware detection'
)
args = parser.parse_args()
@@ -287,7 +508,7 @@ def main():
print("=" * 60)
# Detect hardware acceleration
accel_name, encoder, hwaccel_args = HardwareAcceleration.detect()
accel_name, encoder, hwaccel_args, hw_decode = HardwareAcceleration.detect(debug=args.debug)
print(f"Detected acceleration: {accel_name}")
print(f"Encoder: {encoder}")