McRogueFace/tests/run_tests.py

268 lines
9 KiB
Python

#!/usr/bin/env python3
"""
McRogueFace Test Runner
Runs all headless tests and reports results.
Usage:
python3 tests/run_tests.py # Run all tests
python3 tests/run_tests.py unit # Run only unit tests
python3 tests/run_tests.py -v # Verbose output (show failure details)
python3 tests/run_tests.py --checksums # Show screenshot checksums
python3 tests/run_tests.py --timeout=30 # Custom timeout
python3 tests/run_tests.py --sanitizer # Detect ASan/UBSan errors in output
python3 tests/run_tests.py --valgrind # Run tests under Valgrind memcheck
Environment variables:
MCRF_BUILD_DIR Build directory (default: ../build)
MCRF_LIB_DIR Library directory for LD_LIBRARY_PATH (default: ../__lib)
MCRF_TIMEOUT_MULTIPLIER Multiply per-test timeout (default: 1, use 50 for valgrind)
"""
import os
import subprocess
import sys
import time
import hashlib
import re
from pathlib import Path
# Configuration — respect environment overrides for debug/sanitizer builds
TESTS_DIR = Path(__file__).parent
BUILD_DIR = Path(os.environ.get('MCRF_BUILD_DIR', str(TESTS_DIR.parent / "build")))
LIB_DIR = Path(os.environ.get('MCRF_LIB_DIR', str(TESTS_DIR.parent / "__lib")))
MCROGUEFACE = BUILD_DIR / "mcrogueface"
DEFAULT_TIMEOUT = 10 # seconds per test
# Sanitizer error patterns to scan for in stderr
SANITIZER_PATTERNS = [
re.compile(r'ERROR: AddressSanitizer'),
re.compile(r'ERROR: LeakSanitizer'),
re.compile(r'runtime error:'), # UBSan
re.compile(r'ERROR: ThreadSanitizer'),
]
# Test directories to run (in order)
TEST_DIRS = ['unit', 'integration', 'regression']
# ANSI colors
GREEN = '\033[92m'
RED = '\033[91m'
YELLOW = '\033[93m'
RESET = '\033[0m'
BOLD = '\033[1m'
def get_screenshot_checksum(test_dir):
"""Get checksums of test-generated PNG files in build directory."""
checksums = {}
for png in BUILD_DIR.glob("test_*.png"):
with open(png, 'rb') as f:
checksums[png.name] = hashlib.md5(f.read()).hexdigest()[:8]
return checksums
def check_sanitizer_output(output):
"""Check output for sanitizer error messages. Returns list of matches."""
errors = []
for pattern in SANITIZER_PATTERNS:
matches = pattern.findall(output)
if matches:
errors.extend(matches)
return errors
def run_test(test_path, verbose=False, timeout=DEFAULT_TIMEOUT,
sanitizer_mode=False, valgrind_mode=False):
"""Run a single test and return (passed, duration, output, sanitizer_errors)."""
start = time.time()
# Clean any existing screenshots
for png in BUILD_DIR.glob("test_*.png"):
png.unlink()
# Set up environment with library path
env = os.environ.copy()
existing_ld = env.get('LD_LIBRARY_PATH', '')
env['LD_LIBRARY_PATH'] = f"{LIB_DIR}:{existing_ld}" if existing_ld else str(LIB_DIR)
# Build the command
cmd = []
valgrind_log = None
if valgrind_mode:
valgrind_log = BUILD_DIR / f"valgrind-{test_path.stem}.log"
supp_file = TESTS_DIR.parent / "sanitizers" / "valgrind-mcrf.supp"
cmd.extend([
'valgrind',
'--tool=memcheck',
'--leak-check=full',
'--error-exitcode=42',
f'--log-file={valgrind_log}',
])
if supp_file.exists():
cmd.append(f'--suppressions={supp_file}')
cmd.extend([str(MCROGUEFACE), '--headless', '--exec', str(test_path)])
try:
result = subprocess.run(
cmd,
capture_output=True,
text=True,
timeout=timeout,
cwd=str(BUILD_DIR),
env=env
)
duration = time.time() - start
passed = result.returncode == 0
output = result.stdout + result.stderr
# Check for PASS/FAIL in output
if 'FAIL' in output and 'PASS' not in output.split('FAIL')[-1]:
passed = False
# Check for sanitizer errors in output
sanitizer_errors = []
if sanitizer_mode:
sanitizer_errors = check_sanitizer_output(output)
if sanitizer_errors:
passed = False
# Check valgrind results
if valgrind_mode:
if result.returncode == 42:
passed = False
if valgrind_log and valgrind_log.exists():
vg_output = valgrind_log.read_text()
# Extract error summary
error_lines = [l for l in vg_output.split('\n')
if 'ERROR SUMMARY' in l or 'definitely lost' in l
or 'Invalid' in l]
sanitizer_errors.extend(error_lines[:5])
output += f"\n--- Valgrind log: {valgrind_log} ---\n"
output += '\n'.join(error_lines)
return passed, duration, output, sanitizer_errors
except subprocess.TimeoutExpired:
return False, timeout, "TIMEOUT", []
except Exception as e:
return False, 0, str(e), []
def find_tests(directory):
"""Find all test files in a directory."""
test_dir = TESTS_DIR / directory
if not test_dir.exists():
return []
return sorted(test_dir.glob("*.py"))
def main():
verbose = '-v' in sys.argv or '--verbose' in sys.argv
show_checksums = '--checksums' in sys.argv
sanitizer_mode = '--sanitizer' in sys.argv
valgrind_mode = '--valgrind' in sys.argv
# Parse --timeout=N
timeout = DEFAULT_TIMEOUT
for arg in sys.argv[1:]:
if arg.startswith('--timeout='):
try:
timeout = int(arg.split('=')[1])
except ValueError:
pass
# Apply timeout multiplier from environment
timeout_multiplier = float(os.environ.get('MCRF_TIMEOUT_MULTIPLIER', '1'))
effective_timeout = timeout * timeout_multiplier
# Determine which directories to test
dirs_to_test = []
for arg in sys.argv[1:]:
if arg in TEST_DIRS:
dirs_to_test.append(arg)
if not dirs_to_test:
dirs_to_test = TEST_DIRS
# Header
mode_str = ""
if sanitizer_mode:
mode_str = f" {YELLOW}[ASan/UBSan]{RESET}"
elif valgrind_mode:
mode_str = f" {YELLOW}[Valgrind]{RESET}"
print(f"{BOLD}McRogueFace Test Runner{RESET}{mode_str}")
print(f"Build: {BUILD_DIR}")
print(f"Testing: {', '.join(dirs_to_test)} (timeout: {effective_timeout:.0f}s)")
print("=" * 60)
results = {'pass': 0, 'fail': 0, 'total_time': 0}
failures = []
for test_dir in dirs_to_test:
tests = find_tests(test_dir)
if not tests:
continue
print(f"\n{BOLD}{test_dir}/{RESET} ({len(tests)} tests)")
for test_path in tests:
test_name = test_path.name
passed, duration, output, san_errors = run_test(
test_path, verbose, effective_timeout,
sanitizer_mode=sanitizer_mode,
valgrind_mode=valgrind_mode
)
results['total_time'] += duration
if passed:
results['pass'] += 1
status = f"{GREEN}PASS{RESET}"
else:
results['fail'] += 1
status = f"{RED}FAIL{RESET}"
failures.append((test_dir, test_name, output, san_errors))
# Get screenshot checksums if any were generated
checksum_str = ""
if show_checksums:
checksums = get_screenshot_checksum(BUILD_DIR)
if checksums:
checksum_str = f" [{', '.join(f'{k}:{v}' for k,v in checksums.items())}]"
# Show sanitizer error indicator
san_str = ""
if san_errors:
san_str = f" {RED}[SANITIZER]{RESET}"
print(f" {status} {test_name} ({duration:.2f}s){checksum_str}{san_str}")
if verbose and not passed:
print(f" Output: {output[:200]}...")
if san_errors:
for err in san_errors[:3]:
print(f" {RED}>> {err}{RESET}")
# Summary
print("\n" + "=" * 60)
total = results['pass'] + results['fail']
pass_rate = (results['pass'] / total * 100) if total > 0 else 0
print(f"{BOLD}Results:{RESET} {results['pass']}/{total} passed ({pass_rate:.1f}%)")
print(f"{BOLD}Time:{RESET} {results['total_time']:.2f}s")
if valgrind_mode:
print(f"{BOLD}Valgrind logs:{RESET} {BUILD_DIR}/valgrind-*.log")
if failures:
print(f"\n{RED}{BOLD}Failures:{RESET}")
for test_dir, test_name, output, san_errors in failures:
print(f" {test_dir}/{test_name}")
if san_errors:
for err in san_errors[:3]:
print(f" {RED}>> {err}{RESET}")
if verbose:
# Show last few lines of output
lines = output.strip().split('\n')[-5:]
for line in lines:
print(f" {line}")
sys.exit(0 if results['fail'] == 0 else 1)
if __name__ == '__main__':
main()