Four-part fix for the collection bottleneck that was blocking the dev loop: 1. Lazy mitreattack.stix20 import in attack_stix.py — deferred to first _load() call (TYPE_CHECKING guard at top level) 2. Lazy misp_stix_converter import in both MISP export routers — moved from module level into the route handler body 3. Lazy attack_catalog / attack_stix in ttp.py repo mixin — thin wrapper functions so the import chain never fires at module load time 4. tests/api/conftest.py — `from decnet.web.api import app` moved inside the `client()` fixture; `pytest_ignore_collect` broadened to skip all test_schemathesis*.py variants (not just test_schemathesis.py), which were launching a subprocess server at module-import time 5. pyproject.toml — `norecursedirs` for tests/live, tests/stress, tests/service_testing, tests/docker, tests/perf so these directories are never entered; `-m` filter removed from addopts (now redundant); `--dist loadscope` → `--dist load` to unblock workers immediately 6. behave_core / behave_shell rename — BEHAVE packages dropped the `decnet_` prefix; reinstalled editable installs and updated all 14 import sites across profiler, ttp, bus, and correlation modules
219 lines
7.4 KiB
Python
219 lines
7.4 KiB
Python
"""``operational.*`` feature functions (Phase G).
|
|
|
|
Step G.1: ``operational.objective``.
|
|
Step G.2: ``operational.opsec_discipline`` (lands later).
|
|
Step G.3: ``operational.cleanup_behavior`` (lands later).
|
|
Step G.4: ``operational.multi_actor_indicators`` (lands later).
|
|
"""
|
|
from __future__ import annotations
|
|
|
|
import collections
|
|
import statistics
|
|
from typing import Iterator
|
|
|
|
from behave_core.spec.envelope import Observation
|
|
|
|
from decnet.profiler.behave_shell._ctx import SessionContext
|
|
from decnet.profiler.behave_shell._features._emit import make_observation
|
|
from decnet.profiler.behave_shell._features.temporal import (
|
|
_CLEANUP_TOKEN_HASHES,
|
|
)
|
|
from decnet.profiler.behave_shell._intent import (
|
|
OPSEC_HISTORY_TOKENS,
|
|
classify_intent,
|
|
)
|
|
from decnet.profiler.behave_shell._thresholds import (
|
|
CLEANUP_TAIL_K,
|
|
CLEANUP_THOROUGH_MIN_DISTINCT,
|
|
EXIT_BEHAVIOR_LOOKBACK_K,
|
|
INTENT_FULL_CONFIDENCE_MIN,
|
|
INTENT_MIN_COMMANDS,
|
|
MIN_COMMANDS_FOR_FULL_CONFIDENCE,
|
|
MULTI_ACTOR_HALF_MIN_COMMANDS,
|
|
MULTI_ACTOR_HANDOFF_DELTA,
|
|
MULTI_ACTOR_MIN_COMMANDS,
|
|
)
|
|
|
|
|
|
def objective(ctx: SessionContext) -> Iterator[Observation]:
|
|
"""Emit ``operational.objective`` ∈ {recon, exfil, persistence,
|
|
lateral, destructive}.
|
|
|
|
Walk every command's ``first_token_hash`` through
|
|
:func:`classify_intent` (fixed precedence:
|
|
``destructive > persistence > exfil > lateral > recon``).
|
|
Commands that don't classify (token not in any set) are skipped —
|
|
the registry has no ``unknown`` value here, so a session of pure
|
|
``vim`` / ``ls`` operations is allowed to fall through and emit
|
|
``recon`` only if at least :data:`INTENT_MIN_COMMANDS` commands
|
|
actually classify.
|
|
|
|
Skip emission when fewer than ``INTENT_MIN_COMMANDS`` classified
|
|
hits — too thin to call. Otherwise majority vote (ties broken by
|
|
precedence order via ``most_common(1)``-stable sort over the
|
|
insertion order, which mirrors the precedence walk).
|
|
|
|
Confidence: 0.40 below :data:`INTENT_FULL_CONFIDENCE_MIN`; 0.60
|
|
above. v0.1 lexicon — corpus tuning revisits in v0.2.
|
|
"""
|
|
if not ctx.commands:
|
|
return
|
|
counter: collections.Counter[str] = collections.Counter()
|
|
for cmd in ctx.commands:
|
|
label = classify_intent(cmd.first_token_hash)
|
|
if label is not None:
|
|
counter[label] += 1
|
|
n_classified = sum(counter.values())
|
|
if n_classified < INTENT_MIN_COMMANDS:
|
|
return
|
|
value = counter.most_common(1)[0][0]
|
|
confidence = 0.60 if n_classified >= INTENT_FULL_CONFIDENCE_MIN else 0.40
|
|
yield make_observation(
|
|
ctx,
|
|
primitive="operational.objective",
|
|
value=value,
|
|
confidence=confidence,
|
|
)
|
|
|
|
|
|
def opsec_discipline(ctx: SessionContext) -> Iterator[Observation]:
|
|
"""Emit ``operational.opsec_discipline`` ∈ {careful, careless, learning}.
|
|
|
|
* ``careful`` — operator hits ``OPSEC_HISTORY_TOKENS`` AND the
|
|
tail-K (=``EXIT_BEHAVIOR_LOOKBACK_K``) commands include cleanup
|
|
vocabulary (locally re-derived; we do **not** read prior
|
|
observations).
|
|
* ``learning`` — operator hits ``OPSEC_HISTORY_TOKENS`` but does
|
|
NOT close with cleanup tokens. Half-discipline.
|
|
* ``careless`` — no ``OPSEC_HISTORY_TOKENS`` hits at all.
|
|
|
|
Skip emission when no commands. Confidence 0.45 (small lexicon,
|
|
soft); 0.30 below ``MIN_COMMANDS_FOR_FULL_CONFIDENCE`` (=5).
|
|
"""
|
|
if not ctx.commands:
|
|
return
|
|
has_history = any(
|
|
c.first_token_hash in OPSEC_HISTORY_TOKENS for c in ctx.commands
|
|
)
|
|
tail = ctx.commands[-EXIT_BEHAVIOR_LOOKBACK_K:]
|
|
has_cleanup_tail = any(
|
|
c.first_token_hash in _CLEANUP_TOKEN_HASHES for c in tail
|
|
)
|
|
if not has_history:
|
|
value = "careless"
|
|
elif has_cleanup_tail:
|
|
value = "careful"
|
|
else:
|
|
value = "learning"
|
|
if len(ctx.commands) < MIN_COMMANDS_FOR_FULL_CONFIDENCE:
|
|
confidence = 0.30
|
|
else:
|
|
confidence = 0.45
|
|
yield make_observation(
|
|
ctx,
|
|
primitive="operational.opsec_discipline",
|
|
value=value,
|
|
confidence=confidence,
|
|
)
|
|
|
|
|
|
def cleanup_behavior(ctx: SessionContext) -> Iterator[Observation]:
|
|
"""Emit ``operational.cleanup_behavior`` ∈ {thorough, partial, none}.
|
|
|
|
Inspect the last ``CLEANUP_TAIL_K`` (=5) commands. Count distinct
|
|
cleanup-family hashes (``history`` / ``unset`` / ``rm`` / ``shred``
|
|
/ ``clear`` / ``kill``) in that window:
|
|
|
|
* ``thorough`` — ≥ ``CLEANUP_THOROUGH_MIN_DISTINCT`` (3) distinct
|
|
cleanup tokens.
|
|
* ``partial`` — 1-2 distinct cleanup tokens.
|
|
* ``none`` — zero hits.
|
|
|
|
Adjacent to E.4's ``exit_behavior=cleanup`` emission — E.4 is
|
|
binary "did it happen", G.3 graduates intensity. Both ride.
|
|
|
|
Skip emission when no commands. Confidence 0.55 when commands ≥ 8;
|
|
0.35 below.
|
|
"""
|
|
if not ctx.commands:
|
|
return
|
|
tail = ctx.commands[-CLEANUP_TAIL_K:]
|
|
distinct = {
|
|
c.first_token_hash for c in tail
|
|
if c.first_token_hash in _CLEANUP_TOKEN_HASHES
|
|
}
|
|
if len(distinct) >= CLEANUP_THOROUGH_MIN_DISTINCT:
|
|
value = "thorough"
|
|
elif len(distinct) >= 1:
|
|
value = "partial"
|
|
else:
|
|
value = "none"
|
|
confidence = 0.55 if len(ctx.commands) >= 8 else 0.35
|
|
yield make_observation(
|
|
ctx,
|
|
primitive="operational.cleanup_behavior",
|
|
value=value,
|
|
confidence=confidence,
|
|
)
|
|
|
|
|
|
def multi_actor_indicators(ctx: SessionContext) -> Iterator[Observation]:
|
|
"""Emit ``operational.multi_actor_indicators`` ∈ {solo, handoff_detected}.
|
|
|
|
Compare first-half vs second-half typing rhythm. ``team_coordinated``
|
|
is **never** emitted from a single session — it's Tier B and lands
|
|
in the attribution engine.
|
|
|
|
Algorithm:
|
|
* Split commands at the temporal midpoint
|
|
(``t_start + duration_s / 2``).
|
|
* Flatten ``ctx.intra_command_iats`` per half.
|
|
* If both halves have ≥ ``MULTI_ACTOR_HALF_MIN_COMMANDS`` (4)
|
|
commands AND
|
|
``abs(median_a - median_b) / max(median_a, median_b)`` >
|
|
``MULTI_ACTOR_HANDOFF_DELTA`` (0.5) → ``handoff_detected``.
|
|
* Else → ``solo``.
|
|
|
|
Skip emission when fewer than ``MULTI_ACTOR_MIN_COMMANDS`` (8)
|
|
total. Confidence 0.40 (single-session is a weak handoff signal);
|
|
0.55 when both halves are ≥ 8 commands.
|
|
"""
|
|
n = len(ctx.commands)
|
|
if n < MULTI_ACTOR_MIN_COMMANDS:
|
|
return
|
|
midpoint = ctx.t_start + ctx.duration_s / 2.0
|
|
a_iats: list[float] = []
|
|
b_iats: list[float] = []
|
|
a_count = 0
|
|
b_count = 0
|
|
for cmd, iats in zip(ctx.commands, ctx.intra_command_iats):
|
|
if cmd.start_ts < midpoint:
|
|
a_iats.extend(iats)
|
|
a_count += 1
|
|
else:
|
|
b_iats.extend(iats)
|
|
b_count += 1
|
|
if a_count < MULTI_ACTOR_HALF_MIN_COMMANDS or b_count < MULTI_ACTOR_HALF_MIN_COMMANDS:
|
|
value = "solo"
|
|
elif not a_iats or not b_iats:
|
|
value = "solo"
|
|
else:
|
|
median_a = statistics.median(a_iats)
|
|
median_b = statistics.median(b_iats)
|
|
denom = max(median_a, median_b)
|
|
if denom > 0.0:
|
|
delta = abs(median_a - median_b) / denom
|
|
value = "handoff_detected" if delta > MULTI_ACTOR_HANDOFF_DELTA else "solo"
|
|
else:
|
|
value = "solo"
|
|
if a_count >= 8 and b_count >= 8:
|
|
confidence = 0.55
|
|
else:
|
|
confidence = 0.40
|
|
yield make_observation(
|
|
ctx,
|
|
primitive="operational.multi_actor_indicators",
|
|
value=value,
|
|
confidence=confidence,
|
|
)
|