Files
DECNET/tests/intel/test_worker_publish.py
anti 9a7b03700c refactor(intel): migrate AttackerIntel JSON-string columns to native SQLAlchemy JSON
Five list columns (greynoise_tags, abuseipdb_categories, threatfox_threat_types,
threatfox_ioc_types, threatfox_malware_families) and four dict columns
(*_raw) are now Column(JSON) with list/dict type annotations and
default_factory=list/dict. Providers return native Python objects; the
application-layer json.dumps/json.loads round-trip and _decode_json_list
helpers are gone. to_intel_event_payload() reads columns directly.

Also caps pytest xdist at -n 4 and excludes tests/api via norecursedirs
to prevent schemathesis workers from OOM-killing the dev loop.
2026-05-10 09:17:15 -04:00

140 lines
4.4 KiB
Python

"""Intel worker publishes ``attacker.intel.enriched`` per enriched row.
Pins the producer wiring. The worker drains
``repo.get_unenriched_attackers``, calls the providers' ``lookup``,
upserts via ``repo.upsert_attacker_intel``, and publishes
``attacker.intel.enriched`` per row.
"""
from __future__ import annotations
import asyncio
import os
from typing import Any
import pytest
from decnet.bus import topics as _topics
from decnet.bus.fake import FakeBus
from decnet.intel import worker as _iw
from decnet.intel.base import IntelProvider, IntelResult
class _FakeProvider(IntelProvider):
    """Stand-in intel provider that reports every IP as malicious.

    ``lookup`` ignores the address it is given and always returns the
    same ``IntelResult``, so tests get a deterministic verdict.
    """

    name = "fake"

    async def lookup(self, ip: str) -> IntelResult:
        """Return a fixed ``malicious`` result; *ip* is not consulted."""
        canned_columns = {"fake_classification": "malicious"}
        result = IntelResult(
            verdict="malicious",
            column_updates=canned_columns,
            provider="fake",
        )
        return result
class _RepoStub:
    """In-memory repository double for driving the intel worker loop.

    The first ``get_unenriched_attackers`` call returns a copy of the rows
    supplied at construction; every later call returns an empty list.
    Rows passed to ``upsert_attacker_intel`` are collected in ``upserts``
    so a test can inspect them afterwards.
    """

    def __init__(self, pending: list[dict[str, Any]]) -> None:
        self.upserts: list[dict[str, Any]] = []
        self._yielded = False
        self._pending = pending

    async def get_unenriched_attackers(
        self, *, limit: int = 100,
    ) -> list[dict[str, Any]]:
        """Hand out the pending rows once, then nothing.

        ``limit`` is accepted for signature compatibility but not applied.
        """
        if self._yielded:
            return []
        self._yielded = True
        # Return a shallow copy so callers cannot mutate the stub's list.
        return [*self._pending]

    async def upsert_attacker_intel(self, row: dict[str, Any]) -> None:
        """Record *row* for later assertions."""
        self.upserts.append(row)
@pytest.mark.asyncio
async def test_intel_worker_publishes_intel_enriched(
    monkeypatch: pytest.MonkeyPatch,
) -> None:
    """One unenriched row yields one upsert and one bus event.

    Runs ``run_intel_loop`` against a ``FakeBus`` and a ``_RepoStub``
    holding a single attacker, then checks that exactly one
    ``ATTACKER_INTEL_ENRICHED`` event was published and that its payload
    carries the attacker uuid, ip, aggregate verdict and provider name.
    """
    bus = FakeBus()
    await bus.connect()
    # Route the worker's bus lookup to the in-process fake.
    monkeypatch.setattr(_iw, "get_bus", lambda *_a, **_kw: bus)

    captured: list[tuple[str, dict[str, Any]]] = []
    sub = bus.subscribe(_topics.attacker(_topics.ATTACKER_INTEL_ENRICHED))

    async def drain() -> None:
        """Collect every event delivered to ``sub`` until cancelled."""
        try:
            async with sub:
                async for ev in sub:
                    captured.append((ev.topic, ev.payload))
        except Exception:
            # Deliberate best-effort: a subscriber-side error must not mask
            # the assertions below.  asyncio.CancelledError derives from
            # BaseException (Python 3.8+), so cancellation still propagates.
            pass

    drain_task = asyncio.create_task(drain())
    # Yield once so drain() is running before the worker starts publishing.
    await asyncio.sleep(0)

    repo = _RepoStub([
        {"uuid": "att-1", "ip": "192.168.1.5"},
    ])
    shutdown = asyncio.Event()
    loop_task = asyncio.create_task(_iw.run_intel_loop(
        repo,  # type: ignore[arg-type]
        poll_interval_secs=0.05, ttl_hours=24,
        providers=[_FakeProvider()],
        shutdown=shutdown,
    ))
    try:
        # Give the loop a few poll intervals to process the pending row.
        await asyncio.sleep(0.2)
        shutdown.set()
        await asyncio.wait_for(loop_task, timeout=2.0)
    finally:
        # Always tear down, even when the loop fails or times out, so no
        # task outlives the test and the bus is closed.
        if not loop_task.done():
            loop_task.cancel()
        drain_task.cancel()
        # Reap the cancelled tasks; return_exceptions=True turns their
        # CancelledError (or any other error) into a result instead of
        # raising here.
        await asyncio.gather(loop_task, drain_task, return_exceptions=True)
        await bus.close()

    assert len(repo.upserts) == 1
    assert len(captured) == 1
    topic, payload = captured[0]
    assert topic == _topics.attacker(_topics.ATTACKER_INTEL_ENRICHED)
    assert payload["attacker_uuid"] == "att-1"
    assert payload["attacker_ip"] == "192.168.1.5"
    assert payload["aggregate_verdict"] == "malicious"
    assert "fake" in payload["providers"]
def test_build_intel_event_payload_projects_taxonomy_fields() -> None:
    """Taxonomy columns on the row are projected into the bus payload.

    The per-provider fields the IntelLifter needs (categories, tags,
    threat types and the related names) must come out equal to the
    values stored on the row, with list columns as native lists.
    """
    enriched_row = {
        "aggregate_verdict": "malicious",
        "abuseipdb_score": 87,
        "abuseipdb_categories": [14, 18, 22],
        "greynoise_classification": "malicious",
        "greynoise_name": "Mirai",
        "greynoise_tags": ["ssh_bruteforcer"],
        "feodo_listed": True,
        "feodo_malware_family": "Emotet",
        "threatfox_listed": True,
        "threatfox_threat_types": ["botnet_cc"],
        "threatfox_ioc_types": ["ip:port"],
        "threatfox_malware_families": ["Sliver"],
    }
    providers = [_FakeProvider()]

    payload = _iw._build_intel_event_payload(
        "att-2", "203.0.113.7", enriched_row, providers,
    )

    # Only the taxonomy fields are pinned; the remaining row keys are
    # present as input but not asserted on.
    expected_projection = {
        "abuseipdb_categories": [14, 18, 22],
        "greynoise_tags": ["ssh_bruteforcer"],
        "greynoise_name": "Mirai",
        "feodo_malware_family": "Emotet",
        "threatfox_threat_types": ["botnet_cc"],
        "threatfox_ioc_types": ["ip:port"],
        "threatfox_malware_families": ["Sliver"],
    }
    for field, wanted in expected_projection.items():
        assert payload[field] == wanted, field
def test_build_intel_event_payload_tolerates_absent_columns() -> None:
    """An empty (pre-enrichment) row yields empty lists, not an error.

    The IntelLifter contract is to absorb absence silently, so building
    a payload from a row with no columns and no providers must succeed.
    """
    empty_row: dict = {}
    payload = _iw._build_intel_event_payload(
        "att-3", "10.0.0.1", empty_row, [],
    )

    list_fields = (
        "abuseipdb_categories",
        "greynoise_tags",
        "threatfox_threat_types",
    )
    for field in list_fields:
        assert payload[field] == [], field