"""8-point Blackboard ULTRA import recipe audit.

Run after extracting your CXP package to a directory containing:
    imsmanifest.xml
    res00001.dat ... resNNNNNN.dat
    csfiles/...

Usage:
    python audit_8point.py /path/to/extracted/package

Prints PASS/FAIL for each of the 8 defect classes catalogued in the
2026-05-04 fix marathon. Exit code 0 if all PASS, 1 otherwise
(2 when the script is not given exactly one argument).
"""
import re
import os
import sys


# NOTE(review): this copy of the script appears to be extraction-damaged.
# Line breaks were collapsed and text that sat between angle brackets seems
# to have been stripped out of several string/regex literals. The damaged
# spans are marked "DAMAGED SPAN" below and are reproduced exactly as found;
# they are not valid Python and must be restored from an undamaged copy.
# Indentation inside those spans is a best guess.
def main(target_dir):
    # Run the audit checks against the extracted package in `target_dir`,
    # print one PASS/FAIL line plus a detail line per check, and return
    # 0 if every recorded check passed, otherwise 1.

    # Resource ids: every entry named res*.dat, with the 4-character
    # extension dropped, in sorted order.
    files = sorted(p[:-4] for p in os.listdir(target_dir) if p.startswith('res') and p.endswith('.dat'))
    # NOTE(review): the file object is never closed explicitly here or in
    # read() below.
    manifest = open(os.path.join(target_dir, 'imsmanifest.xml'), encoding='utf-8').read()

    def read(f):
        # Return the text of resource `f` (an id without ".dat");
        # undecodable bytes are replaced rather than raising.
        return open(os.path.join(target_dir, f + '.dat'), encoding='utf-8', errors='replace').read()

    # Each entry is a (label, passed, detail) tuple, printed at the end.
    results = []

    # Defect 1: orphan manifest declarations
    # decls   = distinct res<digits> identifiers found in the manifest
    # missing = declared ids that have no .dat file
    # orphan  = .dat files that are not declared in the manifest
    decls = sorted(set(re.findall(r'identifier="(res[0-9]+)"', manifest)))
    file_set = set(files)
    missing = [r for r in decls if r not in file_set]
    orphan = [f for f in files if f not in decls]
    results.append((
        '1. Orphan manifest decls',
        not missing and not orphan,
        f'decls={len(decls)} files={len(files)} missing={len(missing)} orphan={len(orphan)}',
    ))

    # Defect 2: retired-tool handlers (journal/blog/wiki) in actual content
    retired = ['x-bb-journallink', 'x-bb-bloglink', 'x-bb-wikilink']
    hits = []
    for f in files:
        # res00010 (or equivalent) is the content-handler registry; skip
        # (the code skips both res00009 and res00010)
        if f in ('res00009', 'res00010'):
            continue
        c = read(f)
        for h in retired:
            # NOTE(review): DAMAGED SPAN. The rest of this condition, the
            # remainder of the Defect 2 check (including its
            # results.append), and the start of the Defect 3 check
            # (presumably `type_violations = []`, the loop header, and how
            # `declared` and `nc` are derived) are missing. Restore from an
            # undamaged copy.
            if h in c and '', '', nc).lstrip()
        # Capture the leading tag name of `nc` when it is all-uppercase or
        # all-lowercase letters; skip the resource when there is none.
        root_match = re.match(r'<([A-Z]+|[a-z]+)\b', nc)
        if not root_match:
            continue
        root = root_match.group(1)
        # A declared handler type must come with the matching root element.
        if declared == 'course/x-bb-coursemessagefolder' and root != 'COURSEMESSAGEFOLDERS':
            type_violations.append((f, declared, root))
        if declared == 'resource/x-bb-blog' and root != 'BLOG':
            type_violations.append((f, declared, root))
    results.append((
        '3. Wrong-type substitution',
        not type_violations,
        f'violations={len(type_violations)} {type_violations}',
    ))

    # Defect 4: empty leaf content items (refined to skip legitimate empty wrappers)
    # NOTE(review): the place where this set is consulted is not visible in
    # the surviving text.
    intentionally_empty_handlers = {
        'resource/x-bb-folder',
        'resource/x-bb-lesson',
        'resource/x-bb-asmt-test-link',
        'resource/x-bb-asmt-survey-link',
        'resource/x-bb-forumlink',
        'resource/x-bb-courselink',
        'resource/x-bb-externallink',
        'resource/x-bb-blti-link',
    }
    empty_leaves = []
    for f in files:
        c = read(f)
        # NOTE(review): DAMAGED SPAN. From here to the ISAVAILABLE comment
        # below, the string and regex literals have lost their contents and
        # whole statements are missing. This span appears to hold the
        # remains of the Defect 4 check through the start of the Defect 8
        # check; the results.append calls for checks 4-7 and the
        # initialisation of `multiline_misses` are not present. Restore
        # from an undamaged copy.
        if '' not in c:
            continue
        if 'ISFOLDER value="true"' in c:
            continue
        if ']', c):
            continue
        if 'REFERRER' not in c:
            continue
        nc = re.sub(r'\s+', ' ', c)
        rf = re.search(r']', c):
            continue
        if 'REFERRER' not in c:
            continue
        nc = re.sub(r'\s+', ' ', c)
        if not re.search(r'', nc):
            continue
        rf_m = re.search(r']*>.*?]', c):
            continue
        # Find ISAVAILABLE that the literal-string replace would NOT hit
        # but the regex would.
        # NOTE(review): both patterns below were stripped to empty strings.
        literal_count = c.count('')
        regex_count = len(re.findall(r'', c))
        if regex_count > literal_count:
            multiline_misses += (regex_count - literal_count)
    results.append((
        '8. Whitespace-tolerant ISAVAILABLE coverage',
        multiline_misses == 0,
        f'multiline_misses={multiline_misses}',
    ))

    # Report: banner, then one flag line and one detail line per check.
    print('=' * 70)
    print(f'8-Point Blackboard ULTRA Import Recipe Audit -- {target_dir}')
    print('=' * 70)
    all_pass = True
    for label, ok, detail in results:
        flag = 'PASS' if ok else 'FAIL'
        print(f' [{flag}] {label}')
        print(f' {detail}')
        if not ok:
            all_pass = False
    print()
    print('Overall:', 'ALL PASS' if all_pass else 'NEEDS WORK')
    # The return value is used as the process exit code by the guard below.
    return 0 if all_pass else 1


if __name__ == '__main__':
    # Exactly one argument (the package directory) is required; otherwise
    # print the usage line and exit with status 2.
    if len(sys.argv) != 2:
        print('Usage: python audit_8point.py /path/to/extracted/package')
        sys.exit(2)
    sys.exit(main(sys.argv[1]))