ModelHawk/modelhawk.py at main · Pyhroff/ModelHawk · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
#!/usr/bin/env python3
"""
ModelHawk - static malware scanner for serialized ML models.

Detects three attack vectors without executing any payload:

  1. Pickle RCE  (.pkl / .pt / .pth / .ckpt / .bin / .joblib* / .dill)
     PyTorch / sklearn / joblib save with pickle; unpickling executes code.
     ModelHawk disassembles the opcode stream and flags dangerous GLOBAL /
     STACK_GLOBAL imports plus REDUCE / INST invocations.
     * joblib files compressed with zlib/lz4 are reported MEDIUM (opaque
       stream) rather than CRITICAL - decompress manually to confirm.

  2. Unsafe YAML  (.yaml / .yml)
     yaml.load() without SafeLoader executes !!python/object/apply: tags.
     ModelHawk regex-scans for PyYAML Python tags - no yaml library needed.

  3. Numpy object arrays  (.npy / inside .npz)
     np.load(..., allow_pickle=True) on an object-dtype array unpickles each
     element. ModelHawk parses the .npy header; if dtype is object it
     disassembles the embedded pickle.

SAFETY
    ModelHawk only *parses* - it never deserializes or executes anything.
    (Verified by the self-test in tests/.)

Stdlib only. MIT-style use. Built as a portfolio project on AI x security.
"""
from __future__ import annotations

import argparse
import ast
import json
import os
import re
import sys
import zipfile
from dataclasses import dataclass, field
from io import StringIO

import pickletools  # static opcode parser - does NOT deserialize / execute

__version__ = "1.1.0"

SEVERITY_ORDER = {"SAFE": 0, "INFO": 1, "LOW": 2, "MEDIUM": 3, "HIGH": 4, "CRITICAL": 5}

# --------------------------------------------------------------------------- #
# Detection tables
# --------------------------------------------------------------------------- #
# Modules with no legitimate place in a serialized model: they grant code,
# process, or filesystem control. Any reference -> CRITICAL.
# Note: os.system serializes as `nt.system` on Windows and `posix.system` on
# Linux, so the whole os/nt/posix family must be covered.
CRITICAL_MODULES = {
    "os", "nt", "posix",
    "subprocess", "pty", "commands",
    "ctypes", "_ctypes",
    "runpy", "webbrowser", "pdb", "bdb", "code", "timeit",
}
# Capability that is occasionally legitimate but a strong red flag in a model.
HIGH_MODULES = {
    "socket", "shutil", "sys", "importlib", "marshal", "multiprocessing",
    "urllib", "urllib2", "http", "httplib", "ftplib", "telnetlib", "smtplib",
    "requests", "asyncio", "_pickle", "cPickle",
}
# Encoding / indirection helpers - commonly used to *hide* a payload.
MEDIUM_MODULES = {
    "base64", "binascii", "zlib", "bz2", "lzma", "gzip", "codecs",
    "tempfile", "glob", "pathlib", "operator", "functools",
}
# Specific callables that are CRITICAL regardless of their module bucket.
CRITICAL_GLOBALS = {
    "builtins.eval", "builtins.exec", "builtins.compile", "builtins.__import__",
    "builtins.getattr", "builtins.setattr", "builtins.open", "builtins.breakpoint",
    "__builtin__.eval", "__builtin__.exec", "__builtin__.execfile",
    "__builtin__.compile", "__builtin__.__import__", "__builtin__.getattr",
    "__builtin__.open", "__builtin__.apply", "__builtin__.file",
    "importlib.import_module", "importlib._bootstrap._load",
    "operator.attrgetter", "operator.methodcaller",
    "code.InteractiveInterpreter", "code.interact",
}
# Globals that are *expected* in legitimate model pickles -> benign (INFO).
BENIGN_GLOBALS = {
    "collections.OrderedDict", "collections.defaultdict", "collections.Counter",
    "builtins.bytearray", "builtins.bytes", "builtins.complex", "builtins.set",
    "builtins.frozenset", "builtins.slice", "builtins.list", "builtins.dict",
    "builtins.tuple", "builtins.int", "builtins.float", "builtins.str",
    "_codecs.encode", "_codecs.decode",
}
# Module prefixes that are normal ML machinery -> INFO (expected, not alarming).
BENIGN_MODULE_PREFIXES = (
    "torch", "numpy", "collections", "sklearn", "pandas", "scipy", "_codecs",
)

# Opcodes that push a string constant (candidate module/qualname for STACK_GLOBAL).
STRING_PUSH_OPS = {
    "SHORT_BINUNICODE", "BINUNICODE", "BINUNICODE8", "UNICODE",
    "STRING", "SHORT_BINSTRING", "BINSTRING",
}
# Opcodes that invoke a callable / build an object - the execution triggers.
TRIGGER_OPS = {"REDUCE", "INST", "OBJ", "NEWOBJ", "NEWOBJ_EX", "BUILD"}

# Pickle protocol signatures (PROTO opcode 0x80 + protocol byte 2..6).
_PROTO_SIGS = (b"\x80\x02", b"\x80\x03", b"\x80\x04", b"\x80\x05", b"\x80\x06")
_PICKLEISH_NAMES = (".pkl", ".pickle", ".bin", ".pt", ".pth", ".ckpt",
                    ".data", ".joblib", ".dill", ".model")

MODEL_EXTS = {".pkl", ".pickle", ".pt", ".pth", ".bin", ".ckpt", ".joblib",
              ".dill", ".model", ".npz", ".npy", ".yaml", ".yml",
              ".safetensors", ".zip"}

# --------------------------------------------------------------------------- #
# YAML scanning constants
# --------------------------------------------------------------------------- #
# Patterns ordered by severity (most dangerous first). We break after the first
# match per line so a line can produce only one finding.
_YAML_PATTERNS: list[tuple] = [
    (re.compile(rb"!!\s*python/object/apply\s*:([^\s\n]*)"), "CRITICAL",
     "!!python/object/apply executes arbitrary Python callable on yaml.load()"),
    (re.compile(rb"!!\s*python/object/new\s*:([^\s\n]*)"), "CRITICAL",
     "!!python/object/new constructs arbitrary Python class on yaml.load()"),
    (re.compile(rb"!!\s*python/object\s*:([^\s\n]*)"), "HIGH",
     "!!python/object reconstructs Python object on yaml.load()"),
    (re.compile(rb"!!\s*python/module\s*:([^\s\n]*)"), "HIGH",
     "!!python/module imports arbitrary Python module on yaml.load()"),
    (re.compile(rb"!!\s*python/name\s*:([^\s\n]*)"), "MEDIUM",
     "!!python/name resolves arbitrary Python name on yaml.load()"),
    (re.compile(rb"!!\s*python/[a-z]"), "LOW",
     "PyYAML Python tag present — dangerous if loaded without SafeLoader"),
]

# --------------------------------------------------------------------------- #
# Numpy .npy scanning constants
# --------------------------------------------------------------------------- #
_NPY_MAGIC = b"\x93NUMPY"
# All representations of the object dtype in numpy .npy headers.
_NPY_OBJECT_DTYPES = {"|O", "O", "<O", ">O", "=O"}


def classify_global(module: str, name: str):
    """Return (severity, human-readable reason) for an imported global."""
    full = f"{module}.{name}"
    if full in CRITICAL_GLOBALS:
        return "CRITICAL", f"invokes dangerous callable {full}()"
    if module in CRITICAL_MODULES:
        return "CRITICAL", f"imports {full} from '{module}' (code / process / file execution)"
    if full in BENIGN_GLOBALS:
        return "INFO", f"benign constructor {full}"
    if module in HIGH_MODULES:
        return "HIGH", f"imports {full} from '{module}' (network / io / dynamic import)"
    if module in MEDIUM_MODULES:
        return "MEDIUM", f"imports {full} from '{module}' (often used to obfuscate a payload)"
    for prefix in BENIGN_MODULE_PREFIXES:
        if module == prefix or module.startswith(prefix + "."):
            return "INFO", f"expected ML global {full}"
    return "MEDIUM", f"unrecognized import {full} (manual review recommended)"


@dataclass
class Finding:
    severity: str
    opcode: str
    target: str
    reason: str
    pos: int


@dataclass
class StreamReport:
    label: str
    findings: list = field(default_factory=list)
    counts: dict = field(default_factory=dict)
    error: str = None
    data: bytes = field(default=None, repr=False)

    @property
    def severity(self) -> str:
        worst = "SAFE"
        for f in self.findings:
            if SEVERITY_ORDER[f.severity] > SEVERITY_ORDER[worst]:
                worst = f.severity
        # A pickle that won't fully parse may be obfuscated/truncated -> suspicious.
        if self.error and SEVERITY_ORDER[worst] < SEVERITY_ORDER["MEDIUM"]:
            worst = "MEDIUM"
        return "SAFE" if worst == "INFO" else worst


@dataclass
class FileReport:
    path: str
    verdict: str
    streams: list = field(default_factory=list)
    note: str = None


def scan_pickle_bytes(data: bytes, label: str = "<pickle>") -> StreamReport:
    """Disassemble one pickle stream and flag dangerous opcodes. No execution."""
    findings = []
    counts = {"GLOBAL": 0, "STACK_GLOBAL": 0, "REDUCE": 0, "INST": 0,
              "OBJ": 0, "NEWOBJ": 0, "NEWOBJ_EX": 0, "BUILD": 0}
    recent_strings = []  # rolling buffer to resolve STACK_GLOBAL's (module, qualname)
    error = None
    try:
        for opcode, arg, pos in pickletools.genops(data):
            nm = opcode.name

            if nm in STRING_PUSH_OPS and isinstance(arg, str):
                recent_strings.append(arg)
                if len(recent_strings) > 8:
                    recent_strings.pop(0)

            if nm == "GLOBAL":
                counts["GLOBAL"] += 1
                module, _, gname = (arg or "").partition(" ")
                sev, reason = classify_global(module, gname)
                findings.append(Finding(sev, "GLOBAL", f"{module}.{gname}", reason, pos))

            elif nm == "STACK_GLOBAL":
                counts["STACK_GLOBAL"] += 1
                if len(recent_strings) >= 2:
                    module, gname = recent_strings[-2], recent_strings[-1]
                else:
                    module, gname = "<unknown>", "<unknown>"
                sev, reason = classify_global(module, gname)
                findings.append(Finding(sev, "STACK_GLOBAL", f"{module}.{gname}", reason, pos))

            elif nm == "INST" and arg:
                counts["INST"] += 1
                module, _, gname = arg.partition(" ")
                sev, reason = classify_global(module, gname)
                findings.append(Finding(sev, "INST", f"{module}.{gname}", reason, pos))

            elif nm in counts:
                counts[nm] += 1
    except Exception as exc:  # truncated / obfuscated / not actually a pickle
        error = f"{type(exc).__name__}: {exc}"
    return StreamReport(label, findings, counts, error, data)


def _looks_like_pickle(head: bytes) -> bool:
    return head[:2] in _PROTO_SIGS


def _is_safetensors(path: str) -> bool:
    """safetensors = <u64 little-endian header length><JSON header><tensor bytes>."""
    try:
        with open(path, "rb") as f:
            head = f.read(9)
        if len(head) < 9:
            return False
        n = int.from_bytes(head[:8], "little")
        size = os.path.getsize(path)
        return 0 < n < size and head[8:9] == b"{"
    except OSError:
        return False


# --------------------------------------------------------------------------- #
# YAML scanning
# --------------------------------------------------------------------------- #

def scan_yaml_bytes(data: bytes, label: str = "<yaml>") -> "StreamReport":
    """Scan YAML content for dangerous PyYAML tags. Regex only — no execution."""
    findings = []
    counts: dict[str, int] = {"YAML_TAG": 0}
    error = None
    try:
        for lineno, line in enumerate(data.splitlines(), 1):
            for pattern, severity, reason in _YAML_PATTERNS:
                m = pattern.search(line)
                if m:
                    target_b = m.group(1) if m.lastindex else b""
                    target = target_b.decode("utf-8", errors="replace").strip() or "<tag>"
                    findings.append(Finding(severity, "YAML_TAG", target, reason, lineno))
                    counts["YAML_TAG"] += 1
                    break  # one finding per line; highest-severity first
    except Exception as exc:
        error = f"{type(exc).__name__}: {exc}"
    return StreamReport(label, findings, counts, error, data)


# --------------------------------------------------------------------------- #
# Numpy .npy scanning
# --------------------------------------------------------------------------- #

def _parse_npy_header(data: bytes) -> tuple[str, int]:
    """Return (dtype_str, data_start_offset). Raises ValueError on bad files."""
    if not data.startswith(_NPY_MAGIC):
        raise ValueError("missing numpy .npy magic bytes")
    major = data[6]
    if major == 1:
        header_len = int.from_bytes(data[8:10], "little")
        hdr_start, data_start = 10, 10 + header_len
    else:  # v2+: 4-byte header length field
        header_len = int.from_bytes(data[8:12], "little")
        hdr_start, data_start = 12, 12 + header_len
    raw_hdr = data[hdr_start:data_start]
    header = ast.literal_eval(raw_hdr.decode("latin-1").strip().rstrip("\x00").rstrip())
    return header.get("descr", ""), data_start


def _npy_extract_pickle(data: bytes):
    """Return embedded pickle bytes if .npy has object dtype, else None."""
    try:
        dtype_str, data_start = _parse_npy_header(data)
        if dtype_str in _NPY_OBJECT_DTYPES:
            return data[data_start:]
    except Exception:
        pass
    return None


def scan_npy_bytes(data: bytes, label: str = "<npy>") -> "StreamReport":
    """Scan a .npy file. Object-dtype arrays embed pickle elements; we scan them."""
    try:
        dtype_str, data_start = _parse_npy_header(data)
    except Exception as exc:
        return StreamReport(label, [], {}, f"npy header parse error: {exc}", data)

    if dtype_str not in _NPY_OBJECT_DTYPES:
        return StreamReport(label, [
            Finding("INFO", "NPY_DTYPE", dtype_str,
                    f"numeric array (dtype={dtype_str}) — no pickle, no code-execution path", 0)
        ], {"NPY_DTYPE": 1}, None, None)

    pickle_data = data[data_start:]
    if not pickle_data:
        return StreamReport(label, [
            Finding("INFO", "NPY_OBJECT", dtype_str,
                    "object array with no data — nothing to scan", 0)
        ], {}, None, data)

    stream = scan_pickle_bytes(pickle_data, f"{label}[object-array]")
    if not stream.findings:
        stream.findings.append(
            Finding("INFO", "NPY_OBJECT", dtype_str,
                    f"object array (dtype={dtype_str}) uses pickle — benign content", 0)
        )
    return stream


def iter_pickle_streams(path: str):
    """Yield (label, bytes) for each pickle stream in a file or zip container."""
    if zipfile.is_zipfile(path):
        try:
            with zipfile.ZipFile(path) as z:
                for info in z.infolist():
                    if info.is_dir():
                        continue
                    raw = z.read(info)
                    name_lower = info.filename.lower()
                    if name_lower.endswith(_PICKLEISH_NAMES) or _looks_like_pickle(raw):
                        yield info.filename, raw
                    elif name_lower.endswith(".npy") and raw.startswith(_NPY_MAGIC):
                        # .npy inside .npz: extract pickle if object dtype
                        pkl = _npy_extract_pickle(raw)
                        if pkl is not None:
                            yield f"{info.filename}[object-array]", pkl
        except zipfile.BadZipFile:
            return
        return
    with open(path, "rb") as f:
        yield "<pickle>", f.read()


def scan_file(path: str) -> FileReport:
    ext = os.path.splitext(path)[1].lower()
    if ext == ".safetensors" or _is_safetensors(path):
        return FileReport(path, "SAFE", [],
                          note="safetensors format — no pickle, no code-execution path")
    if ext in (".yaml", ".yml"):
        try:
            with open(path, "rb") as f:
                stream = scan_yaml_bytes(f.read())
            return FileReport(path, stream.severity, [stream])
        except OSError as exc:
            return FileReport(path, "UNKNOWN", [], note=str(exc))
    if ext == ".npy":
        try:
            with open(path, "rb") as f:
                stream = scan_npy_bytes(f.read())
            return FileReport(path, stream.severity, [stream])
        except OSError as exc:
            return FileReport(path, "UNKNOWN", [], note=str(exc))
    streams = [scan_pickle_bytes(data, label) for label, data in iter_pickle_streams(path)]
    if not streams:
        return FileReport(path, "UNKNOWN", [], note="no pickle stream found")
    verdict = "SAFE"
    for s in streams:
        if SEVERITY_ORDER[s.severity] > SEVERITY_ORDER[verdict]:
            verdict = s.severity
    return FileReport(path, verdict, streams)


def gather_paths(paths):
    out = []
    for p in paths:
        if os.path.isdir(p):
            for root, _dirs, files in os.walk(p):
                for fn in files:
                    if os.path.splitext(fn)[1].lower() in MODEL_EXTS:
                        out.append(os.path.join(root, fn))
        elif os.path.isfile(p):
            out.append(p)
        else:
            print(f"warning: path not found: {p}", file=sys.stderr)
    return sorted(out)


# --------------------------------------------------------------------------- #
# Reporting
# --------------------------------------------------------------------------- #
COLORS = {
    "SAFE": "\033[32m", "INFO": "\033[36m", "LOW": "\033[36m", "MEDIUM": "\033[33m",
    "HIGH": "\033[35m", "CRITICAL": "\033[31;1m", "UNKNOWN": "\033[90m",
    "RESET": "\033[0m", "DIM": "\033[2m",
}
ICONS = {
    "SAFE": "[ OK ]", "INFO": "[INFO]", "LOW": "[ LOW]", "MEDIUM": "[WARN]",
    "HIGH": "[HIGH]", "CRITICAL": "[!!!!]", "UNKNOWN": "[ ?? ]",
}


def _enable_windows_ansi():
    if os.name != "nt":
        return
    try:
        import ctypes
        kernel32 = ctypes.windll.kernel32
        # ENABLE_PROCESSED_OUTPUT | ENABLE_WRAP_AT_EOL_OUTPUT | ENABLE_VIRTUAL_TERMINAL_PROCESSING
        kernel32.SetConsoleMode(kernel32.GetStdHandle(-11), 7)
    except Exception:
        pass


def _paint(text, sev, use_color):
    if not use_color:
        return text
    return f"{COLORS.get(sev, '')}{text}{COLORS['RESET']}"


def _worst_finding(rep: FileReport):
    worst = None
    for s in rep.streams:
        for f in s.findings:
            if worst is None or SEVERITY_ORDER[f.severity] > SEVERITY_ORDER[worst.severity]:
                worst = f
    return worst


def _triggers(rep: FileReport):
    trig = set()
    for s in rep.streams:
        for op, c in s.counts.items():
            if c and op in TRIGGER_OPS:
                trig.add(op)
    return trig


def file_headline(rep: FileReport) -> str:
    worst = _worst_finding(rep)
    if worst is None:
        return rep.note or "no findings"
    trig = _triggers(rep)
    if trig and SEVERITY_ORDER[worst.severity] >= SEVERITY_ORDER["HIGH"]:
        return f"{'/'.join(sorted(trig))} -> {worst.target}   ({worst.reason})"
    return worst.reason


def _banner(use_color):
    art = (
        "  __  __         _     _ _  _              _    \n"
        " |  \\/  |___  __| |___| | || |__ ___ __ __| |__ \n"
        " | |\\/| / _ \\/ _` / -_) | __ / _` \\ V  V / / /  \n"
        " |_|  |_\\___/\\__,_\\___|_|_||_\\__,_|\\_/\\_/|_\\_\\  \n"
        "        static pickle-RCE scanner for ML models\n"
    )
    print(_paint(art, "CRITICAL", use_color))


def print_reports(reports, use_color=True, disasm=False, quiet=False):
    for rep in reports:
        flagged = rep.verdict not in ("SAFE", "UNKNOWN")
        if quiet and not flagged:
            continue
        icon = ICONS.get(rep.verdict, "[ ?? ]")
        print(_paint(f"{icon} {rep.verdict:8} {rep.path}", rep.verdict, use_color))
        if flagged:
            print(_paint(f"        |- {file_headline(rep)}", rep.verdict, use_color))
            for s in rep.streams:
                evidence = "  ".join(f"{k}x{v}" for k, v in s.counts.items() if v)
                if evidence:
                    label = "" if s.label == "<pickle>" else f" [{s.label}]"
                    print(_paint(f"           opcodes{label}: {evidence}", "DIM", use_color))
                if s.error:
                    print(_paint(f"           parse error: {s.error}", "DIM", use_color))
            if disasm:
                for s in rep.streams:
                    if s.data is None:
                        continue
                    print(_paint(f"        -- opcode disassembly [{s.label}] --", "DIM", use_color))
                    out = StringIO()
                    try:
                        pickletools.dis(s.data, out)  # static; does not execute
                        print(out.getvalue())
                    except Exception as exc:
                        print(f"           (disasm failed: {exc})")
        elif rep.note:
            print(_paint(f"        |- {rep.note}", rep.verdict, use_color))


def _summary(reports, use_color):
    tally = {}
    for r in reports:
        tally[r.verdict] = tally.get(r.verdict, 0) + 1
    parts = [f"{k}:{v}" for k, v in sorted(tally.items(), key=lambda kv: -SEVERITY_ORDER.get(kv[0], 0))]
    print(_paint(f"\nscanned {len(reports)} file(s)  ->  " + "  ".join(parts), "DIM", use_color))


def report_to_dict(rep: FileReport):
    return {
        "path": rep.path,
        "verdict": rep.verdict,
        "note": rep.note,
        "streams": [
            {
                "label": s.label,
                "severity": s.severity,
                "error": s.error,
                "counts": {k: v for k, v in s.counts.items() if v},
                "findings": [
                    {"severity": f.severity, "opcode": f.opcode,
                     "target": f.target, "reason": f.reason, "pos": f.pos}
                    for f in s.findings
                ],
            }
            for s in rep.streams
        ],
    }


def main(argv=None):
    ap = argparse.ArgumentParser(
        prog="modelhawk",
        description="Static scanner for malicious ML model files (pickle RCE). "
                    "Disassembles pickle opcodes - never executes the model.",
    )
    ap.add_argument("paths", nargs="+", help="model file(s) or directory(ies) to scan")
    ap.add_argument("--json", action="store_true", help="machine-readable JSON output")
    ap.add_argument("--disasm", action="store_true",
                    help="print the pickle opcode disassembly for flagged files")
    ap.add_argument("--no-color", action="store_true", help="disable ANSI colors")
    ap.add_argument("-q", "--quiet", action="store_true", help="only print flagged files")
    ap.add_argument("--fail-on", default="HIGH", choices=list(SEVERITY_ORDER),
                    help="exit non-zero if any file is at/above this severity (default: HIGH)")
    ap.add_argument("--version", action="version", version=f"ModelHawk {__version__}")
    args = ap.parse_args(argv)

    use_color = (not args.no_color) and sys.stdout.isatty() and not args.json
    if use_color:
        _enable_windows_ansi()

    files = gather_paths(args.paths)
    reports = [scan_file(p) for p in files]

    if args.json:
        print(json.dumps([report_to_dict(r) for r in reports], indent=2))
    else:
        if not args.quiet:
            _banner(use_color)
        print_reports(reports, use_color=use_color, disasm=args.disasm, quiet=args.quiet)
        _summary(reports, use_color)

    threshold = SEVERITY_ORDER[args.fail_on]
    worst = max((SEVERITY_ORDER[r.verdict] for r in reports if r.verdict in SEVERITY_ORDER),
                default=0)
    return 1 if worst >= threshold else 0


if __name__ == "__main__":
    sys.exit(main())