Five list columns (greynoise_tags, abuseipdb_categories, threatfox_threat_types, threatfox_ioc_types, threatfox_malware_families) and four dict columns (*_raw) are now Column(JSON) with list/dict type annotations and default_factory=list/dict. Providers return native Python objects; the application-layer json.dumps/json.loads round-trip and the _decode_json_list helpers are gone. to_intel_event_payload() reads the columns directly. Also caps pytest xdist at -n 4 and excludes tests/api from collection via norecursedirs to prevent schemathesis workers from OOM-killing the dev loop.
140 lines
4.4 KiB
Python
140 lines
4.4 KiB
Python
"""Intel worker publishes ``attacker.intel.enriched`` per enriched row.

Pins the producer wiring. The worker drains
``repo.get_unenriched_attackers``, calls the providers' ``lookup``,
upserts via ``repo.upsert_attacker_intel``, and publishes
``attacker.intel.enriched`` per row.
"""
|
|
from __future__ import annotations
|
|
|
|
import asyncio
|
|
import os
|
|
from typing import Any
|
|
|
|
import pytest
|
|
|
|
from decnet.bus import topics as _topics
|
|
from decnet.bus.fake import FakeBus
|
|
from decnet.intel import worker as _iw
|
|
from decnet.intel.base import IntelProvider, IntelResult
|
|
|
|
|
|
class _FakeProvider(IntelProvider):
    """Canned intel provider used by the tests in this module.

    Every lookup yields the same ``malicious`` result, so the tests can
    assert on the worker's output without any network access.
    """

    name = "fake"

    async def lookup(self, ip: str) -> IntelResult:
        """Return a fixed ``malicious`` result; *ip* is not inspected."""
        canned_updates = {"fake_classification": "malicious"}
        result = IntelResult(
            provider="fake",
            column_updates=canned_updates,
            verdict="malicious",
        )
        return result
|
|
|
|
|
|
class _RepoStub:
    """In-memory stand-in for the repository the intel worker talks to.

    Only the two coroutines exercised by the tests in this module are
    provided: ``get_unenriched_attackers`` and ``upsert_attacker_intel``.
    """

    def __init__(self, pending: list[dict[str, Any]]) -> None:
        """Store *pending* rows and start with an empty upsert log.

        Args:
            pending: Rows to hand out from ``get_unenriched_attackers``.
        """
        self._pending = pending
        # Index of the first row that has not been handed out yet.
        self._cursor = 0
        # Every row passed to ``upsert_attacker_intel``, in call order.
        self.upserts: list[dict[str, Any]] = []

    async def get_unenriched_attackers(
        self, *, limit: int = 100,
    ) -> list[dict[str, Any]]:
        """Return the next batch of pending rows, at most *limit* long.

        Each row is handed out exactly once; once every row has been
        returned, further calls yield an empty list. When the pending
        rows fit in a single batch this is "everything on the first
        call, nothing afterwards".

        Args:
            limit: Maximum number of rows to return. A non-positive
                value returns an empty list without consuming rows.

        Returns:
            A new list holding the next batch of rows.
        """
        if limit <= 0:
            return []
        start = self._cursor
        batch = self._pending[start:start + limit]
        self._cursor = start + len(batch)
        return batch

    async def upsert_attacker_intel(self, row: dict[str, Any]) -> None:
        """Record *row* in ``self.upserts`` so tests can inspect it."""
        self.upserts.append(row)
|
|
|
|
|
|
@pytest.mark.asyncio
async def test_intel_worker_publishes_intel_enriched(
    monkeypatch: pytest.MonkeyPatch,
) -> None:
    """One pending attacker yields one upsert and one bus event.

    Runs ``run_intel_loop`` against a ``FakeBus`` and a stub repo holding
    a single row, then checks that the row was upserted once and that a
    single ``attacker.intel.enriched`` event with the expected payload
    fields was captured by a subscriber.
    """
    bus = FakeBus()
    await bus.connect()
    # Make the worker pick up the in-process bus instead of a real one.
    monkeypatch.setattr(_iw, "get_bus", lambda *_a, **_kw: bus)

    captured: list[tuple[str, dict[str, Any]]] = []
    sub = bus.subscribe(_topics.attacker(_topics.ATTACKER_INTEL_ENRICHED))

    async def drain() -> None:
        """Collect every event delivered to ``sub`` into ``captured``."""
        try:
            async with sub:
                async for ev in sub:
                    captured.append((ev.topic, ev.payload))
        except Exception:
            # Best-effort collector: a subscriber failure shows up as a
            # failed ``len(captured)`` assertion below.
            pass

    drain_task = asyncio.create_task(drain())
    # Yield once so the drain task starts before the worker runs.
    await asyncio.sleep(0)

    repo = _RepoStub([
        {"uuid": "att-1", "ip": "192.168.1.5"},
    ])
    shutdown = asyncio.Event()

    loop_task = asyncio.create_task(_iw.run_intel_loop(
        repo,  # type: ignore[arg-type]
        poll_interval_secs=0.05, ttl_hours=24,
        providers=[_FakeProvider()],
        shutdown=shutdown,
    ))
    try:
        # Give the loop time for at least one poll before stopping it.
        await asyncio.sleep(0.2)
        shutdown.set()
        await asyncio.wait_for(loop_task, timeout=2.0)
    finally:
        # cancel() only requests cancellation; awaiting the task lets it
        # actually finish so no pending task is left behind at teardown.
        drain_task.cancel()
        await asyncio.gather(drain_task, return_exceptions=True)
        await bus.close()

    assert len(repo.upserts) == 1
    assert len(captured) == 1
    topic, payload = captured[0]
    assert topic == _topics.attacker(_topics.ATTACKER_INTEL_ENRICHED)
    assert payload["attacker_uuid"] == "att-1"
    assert payload["attacker_ip"] == "192.168.1.5"
    assert payload["aggregate_verdict"] == "malicious"
    assert "fake" in payload["providers"]
|
|
|
|
|
|
def test_build_intel_event_payload_projects_taxonomy_fields() -> None:
    """Per-provider taxonomy fields reach the bus payload as native values.

    The IntelLifter needs categories, tags and threat types; this checks
    that each one is carried over from the row unchanged.
    """
    row = {
        "aggregate_verdict": "malicious",
        "abuseipdb_score": 87,
        "abuseipdb_categories": [14, 18, 22],
        "greynoise_classification": "malicious",
        "greynoise_name": "Mirai",
        "greynoise_tags": ["ssh_bruteforcer"],
        "feodo_listed": True,
        "feodo_malware_family": "Emotet",
        "threatfox_listed": True,
        "threatfox_threat_types": ["botnet_cc"],
        "threatfox_ioc_types": ["ip:port"],
        "threatfox_malware_families": ["Sliver"],
    }
    # Expected payload values, listed in the order they are checked.
    expected = {
        "abuseipdb_categories": [14, 18, 22],
        "greynoise_tags": ["ssh_bruteforcer"],
        "greynoise_name": "Mirai",
        "feodo_malware_family": "Emotet",
        "threatfox_threat_types": ["botnet_cc"],
        "threatfox_ioc_types": ["ip:port"],
        "threatfox_malware_families": ["Sliver"],
    }

    providers = [_FakeProvider()]
    payload = _iw._build_intel_event_payload(
        "att-2", "203.0.113.7", row, providers,
    )

    for field, want in expected.items():
        assert payload[field] == want
|
|
|
|
|
|
def test_build_intel_event_payload_tolerates_absent_columns() -> None:
    """An empty row yields empty lists instead of raising.

    A pre-enrichment row has none of the taxonomy columns; the
    IntelLifter contract is to absorb that absence silently.
    """
    empty_row: dict[str, Any] = {}
    no_providers: list[Any] = []
    payload = _iw._build_intel_event_payload(
        "att-3", "10.0.0.1", empty_row, no_providers,
    )

    list_fields = (
        "abuseipdb_categories",
        "greynoise_tags",
        "threatfox_threat_types",
    )
    for field in list_fields:
        assert payload[field] == []
|