refactor: clear, consistent output for verify and generate_pack

Both tools now count by unique destination (what the user sees on
disk) rather than by YAML entry or internal check. A file shared by
multiple systems is counted once. A file checked against multiple
inner ROMs is also counted once, with the worst-case status winning
(missing > wrong hash > OK).

Output format:
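  verify:  "Platform: X/Y files OK, N wrong hash, M missing [mode]"
  pack:    "pack.zip: P files packed[, E extras], X/Y files OK, N wrong hash, M missing [mode]"

The "N wrong hash" and "M missing" parts are omitted when their count
is zero; ", E extras" appears only when emulator extras were packed.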

X/Y is the same in both tools for the same platform.
The "files packed" count (P) can differ from the verified file count
(Y) when data_directories or EmuDeck MD5-only entries are involved —
this is expected and visible in the numbers (e.g. 34 packed but 161
verified for EmuDeck).
This commit is contained in:
Abdessamad Derraz
2026-03-19 09:06:00 +01:00
parent 866ee40209
commit a88a452469
2 changed files with 80 additions and 72 deletions

View File

@@ -288,24 +288,25 @@ def generate_pack(
os.makedirs(output_dir, exist_ok=True)
total_files = 0
total_checks = 0
verified_checks = 0
missing_files = []
untested_files = []
user_provided = []
seen_destinations = set()
# Per-file status: worst status wins (missing > wrong_hash > ok)
file_status: dict[str, str] = {}
file_reasons: dict[str, str] = {}
with zipfile.ZipFile(zip_path, "w", zipfile.ZIP_DEFLATED) as zf:
for sys_id, system in sorted(config.get("systems", {}).items()):
for file_entry in system.get("files", []):
total_checks += 1
dest = _sanitize_path(file_entry.get("destination", file_entry["name"]))
if not dest:
# EmuDeck-style entries (system:md5 whitelist, no filename).
# Count as verified if file exists in DB by MD5.
fkey = f"{sys_id}/{file_entry.get('name', '')}"
md5 = file_entry.get("md5", "")
if md5 and md5 in db.get("indexes", {}).get("by_md5", {}):
verified_checks += 1
file_status.setdefault(fkey, "ok")
else:
file_status[fkey] = "missing"
continue
if base_dest:
full_dest = f"{base_dest}/{dest}"
@@ -321,7 +322,7 @@ def generate_pack(
if already_packed:
continue
seen_destinations.add(dedup_key)
verified_checks += 1
file_status.setdefault(dedup_key, "ok")
instructions = file_entry.get("instructions", "Please provide this file manually.")
instr_name = f"INSTRUCTIONS_{file_entry['name']}.txt"
instr_path = f"{base_dest}/{instr_name}" if base_dest else instr_name
@@ -355,24 +356,26 @@ def generate_pack(
if status == "not_found":
if not already_packed:
missing_files.append(file_entry["name"])
file_status[dedup_key] = "missing"
continue
check_passed = True
if status == "hash_mismatch":
if verification_mode != "existence":
zf_name = file_entry.get("zipped_file")
if zf_name and local_path:
from verify import check_inside_zip
inner_md5 = file_entry.get("md5", "")
result = check_inside_zip(local_path, zf_name, inner_md5)
if result != "ok":
untested_files.append(file_entry["name"])
check_passed = False
if status == "hash_mismatch" and verification_mode != "existence":
zf_name = file_entry.get("zipped_file")
if zf_name and local_path:
from verify import check_inside_zip
inner_md5 = file_entry.get("md5", "")
inner_result = check_inside_zip(local_path, zf_name, inner_md5)
if inner_result != "ok":
file_status[dedup_key] = "wrong_hash"
reason = f"{zf_name} hash mismatch inside ZIP"
file_reasons[dedup_key] = reason
else:
untested_files.append(file_entry["name"])
check_passed = False
if check_passed:
verified_checks += 1
file_status.setdefault(dedup_key, "ok")
else:
file_status[dedup_key] = "wrong_hash"
file_reasons[dedup_key] = "container hash mismatch"
else:
file_status.setdefault(dedup_key, "ok")
if already_packed:
continue
@@ -436,27 +439,23 @@ def generate_pack(
zf.write(src, full)
total_files += 1
if missing_files:
print(f" Missing ({len(missing_files)}): {', '.join(missing_files[:10])}")
if len(missing_files) > 10:
print(f" ... and {len(missing_files) - 10} more")
files_ok = sum(1 for s in file_status.values() if s == "ok")
files_wrong = sum(1 for s in file_status.values() if s == "wrong_hash")
files_miss = sum(1 for s in file_status.values() if s == "missing")
total_checked = len(file_status)
if untested_files:
print(f" Untested ({len(untested_files)}): {', '.join(untested_files[:10])}")
if len(untested_files) > 10:
print(f" ... and {len(untested_files) - 10} more")
parts = [f"{files_ok}/{total_checked} files OK"]
if files_wrong:
parts.append(f"{files_wrong} wrong hash")
if files_miss:
parts.append(f"{files_miss} missing")
extras_msg = f", {extra_count} extras" if extra_count else ""
print(f" {zip_path}: {total_files} files packed{extras_msg}, {', '.join(parts)} [{verification_mode}]")
if user_provided:
print(f" User-provided ({len(user_provided)}): {', '.join(user_provided)}")
extras_msg = f" + {extra_count} emulator extras" if extra_count else ""
if verification_mode == "existence":
print(f" Generated {zip_path}: {total_files} files ({total_files - extra_count} platform{extras_msg}, {len(missing_files)} missing) [verification: existence]")
else:
checks_detail = ""
if total_checks != total_files:
checks_detail = f" ({total_checks - total_files} duplicate/inner checks)"
print(f" Generated {zip_path}: {total_files} files, {verified_checks}/{total_checks} checks verified{checks_detail}, {len(untested_files)} untested, {len(missing_files)} missing [verification: {verification_mode}]")
for key, reason in file_reasons.items():
print(f" WRONG HASH: {key} {reason}")
for name in missing_files:
print(f" MISSING: {name}")
return zip_path

View File

@@ -203,6 +203,7 @@ def verify_platform(config: dict, db: dict) -> dict:
zip_contents = _build_zip_contents_index(db) if has_zipped else {}
results = []
file_status: dict[str, str] = {}
for sys_id, system in config.get("systems", {}).items():
for file_entry in system.get("files", []):
local_path, resolve_status = resolve_to_local_path(
@@ -215,24 +216,30 @@ def verify_platform(config: dict, db: dict) -> dict:
result["system"] = sys_id
results.append(result)
ok = sum(1 for r in results if r["status"] == Status.OK)
untested = sum(1 for r in results if r["status"] == Status.UNTESTED)
missing = sum(1 for r in results if r["status"] == Status.MISSING)
# Aggregate by destination (what the user sees on disk)
dest = file_entry.get("destination", file_entry.get("name", ""))
if not dest:
dest = f"{sys_id}/{file_entry.get('name', '')}"
cur = result["status"]
prev = file_status.get(dest)
if prev is None:
file_status[dest] = cur
elif cur == Status.MISSING:
file_status[dest] = Status.MISSING
elif cur == Status.UNTESTED and prev != Status.MISSING:
file_status[dest] = Status.UNTESTED
# Count unique files (by system/destination) for reporting
unique_files = set()
for r in results:
dest = r.get("path") or r["name"]
unique_files.add(dest)
files_ok = sum(1 for s in file_status.values() if s == Status.OK)
files_mismatch = sum(1 for s in file_status.values() if s == Status.UNTESTED)
files_missing = sum(1 for s in file_status.values() if s == Status.MISSING)
return {
"platform": platform,
"verification_mode": mode,
"total": len(results),
"unique_files": len(unique_files),
"ok": ok,
"untested": untested,
"missing": missing,
"total_files": len(file_status),
"files_ok": files_ok,
"files_mismatch": files_mismatch,
"files_missing": files_missing,
"details": results,
}
@@ -266,26 +273,28 @@ def main():
if not args.json:
mode = result["verification_mode"]
uf = result["unique_files"]
total = result["total"]
checks_detail = f" ({total - uf} duplicate/inner checks)" if total != uf else ""
if mode == "existence":
print(f"{result['platform']}: {uf} files, {result['ok']}/{total} checks present{checks_detail}, "
f"{result['missing']} missing [verification: {mode}]")
else:
print(f"{result['platform']}: {uf} files, {result['ok']}/{total} checks verified{checks_detail}, "
f"{result['untested']} untested, {result['missing']} missing [verification: {mode}]")
total = result["total_files"]
ok = result["files_ok"]
mismatch = result["files_mismatch"]
miss = result["files_missing"]
for d in result["details"]:
if d["status"] == Status.UNTESTED:
reason = d.get("reason", "")
if not reason and "expected_md5" in d:
reason = f"expected={d['expected_md5'][:16]}... got={d['actual_md5'][:16]}..."
print(f" UNTESTED: {d['system']}/{d['name']} - {reason}")
parts = [f"{ok}/{total} files OK"]
if mismatch:
parts.append(f"{mismatch} wrong hash")
if miss:
parts.append(f"{miss} missing")
print(f"{result['platform']}: {', '.join(parts)} [{mode}]")
for d in result["details"]:
if d["status"] == Status.MISSING:
print(f" MISSING: {d['system']}/{d['name']}")
for d in result["details"]:
if d["status"] == Status.UNTESTED:
reason = d.get("reason", "")
if not reason and "expected_md5" in d:
reason = f"expected {d['expected_md5'][:12]}… got {d['actual_md5'][:12]}"
print(f" WRONG HASH: {d['system']}/{d['name']}{reason}")
for d in result["details"]:
if d["status"] == Status.MISSING:
print(f" MISSING: {d['system']}/{d['name']}")
if args.json:
for r in all_results.values():