feat(profiler/behave_shell): G.5 emotional_valence.valence

Soft primitive — pure ratio over G.0 lexical counters:

* positive — positive_lex_hits > negative + obscenity, ≥ VALENCE_MIN_HITS
* negative — (negative + obscenity) > positive, sum ≥ VALENCE_MIN_HITS
* neutral  — fall-through

Skip below VALENCE_MIN_TYPED_CHARS (80). Confidence hard-capped at
EMOTIONAL_VALENCE_CONFIDENCE_CAP (0.5) inside the feature function;
0.30 below VALENCE_FULL_CONFIDENCE_MIN (200). Cap is registry
convention.
This commit is contained in:
2026-05-08 16:34:27 -04:00
parent acf8382bcf
commit 3ba7e22b71
3 changed files with 137 additions and 0 deletions

View File

@@ -0,0 +1,68 @@
"""Step G.5: ``emotional_valence.valence`` ∈ {positive, neutral, negative}.
Hard 0.5 confidence cap.
"""
from __future__ import annotations
from decnet.profiler.behave_shell import extract_session
from decnet.profiler.behave_shell._parse import AsciinemaEvent
PRIMITIVE = "emotional_valence.valence"
def _of(observations: list, primitive: str):
obs = [o for o in observations if o.primitive == primitive]
assert len(obs) == 1, f"expected exactly one {primitive}, got {len(obs)}"
return obs[0]
def _typed(text: str, t0: float = 0.0, dt: float = 0.05) -> list[AsciinemaEvent]:
return [(t0 + i * dt, "i", c) for i, c in enumerate(text)]
def test_too_little_text_no_emission() -> None:
out = list(extract_session(_typed("hi"), sid="g5-thin"))
assert [o for o in out if o.primitive == PRIMITIVE] == []
def test_positive_valence() -> None:
text = (
"thanks great nice perfect awesome love thanks great nice perfect "
"this is going perfectly well today thanks "
)
obs = _of(list(extract_session(_typed(text), sid="g5-pos")), PRIMITIVE)
assert obs.value == "positive"
assert obs.confidence <= 0.50
def test_negative_valence_via_obscenity_and_negatives() -> None:
text = (
"fuck this is broken damn it stuck here wtf fuck shit "
"everything is broken and stupid today again broken again "
"wrong wrong wrong total disaster here and now "
)
obs = _of(list(extract_session(_typed(text), sid="g5-neg")), PRIMITIVE)
assert obs.value == "negative"
assert obs.confidence <= 0.50
def test_neutral_valence_when_no_lexicon_hits() -> None:
text = (
"running command for inspection of remote system today "
"checking files and verifying things look correct overall "
)
obs = _of(list(extract_session(_typed(text), sid="g5-neutral")), PRIMITIVE)
assert obs.value == "neutral"
def test_confidence_hard_capped_at_05() -> None:
text = "thanks " * 50 # plenty positive, plenty long
obs = _of(list(extract_session(_typed(text), sid="g5-cap")), PRIMITIVE)
assert obs.confidence <= 0.50
def test_low_text_count_lower_confidence() -> None:
text = "thanks great nice perfect awesome love " * 3
obs = _of(list(extract_session(_typed(text), sid="g5-lowconf")), PRIMITIVE)
assert obs.confidence == 0.30