feat(profiler/behave_shell): G.5 emotional_valence.valence
Soft primitive — pure ratio over G.0 lexical counters:
* positive — positive_lex_hits > negative + obscenity, ≥ VALENCE_MIN_HITS
* negative — (negative + obscenity) > positive, sum ≥ VALENCE_MIN_HITS
* neutral — fall-through

Skip below VALENCE_MIN_TYPED_CHARS (80). Confidence is hard-capped at EMOTIONAL_VALENCE_CONFIDENCE_CAP (0.5) inside the feature function, and is 0.30 below VALENCE_FULL_CONFIDENCE_MIN (200). The cap is a registry convention.
This commit is contained in:
@@ -0,0 +1,68 @@
|
||||
"""Step G.5: ``emotional_valence.valence`` ∈ {positive, neutral, negative}.
|
||||
|
||||
Hard 0.5 confidence cap.
|
||||
"""
|
||||
from __future__ import annotations
|
||||
|
||||
from decnet.profiler.behave_shell import extract_session
|
||||
from decnet.profiler.behave_shell._parse import AsciinemaEvent
|
||||
|
||||
|
||||
PRIMITIVE = "emotional_valence.valence"
|
||||
|
||||
|
||||
def _of(observations: list, primitive: str):
|
||||
obs = [o for o in observations if o.primitive == primitive]
|
||||
assert len(obs) == 1, f"expected exactly one {primitive}, got {len(obs)}"
|
||||
return obs[0]
|
||||
|
||||
|
||||
def _typed(text: str, t0: float = 0.0, dt: float = 0.05) -> list[AsciinemaEvent]:
|
||||
return [(t0 + i * dt, "i", c) for i, c in enumerate(text)]
|
||||
|
||||
|
||||
def test_too_little_text_no_emission() -> None:
    """A session that types only ``"hi"`` must not emit the valence primitive."""
    observations = extract_session(_typed("hi"), sid="g5-thin")
    valence_hits = [item for item in observations if item.primitive == PRIMITIVE]
    assert valence_hits == []
|
||||
|
||||
|
||||
def test_positive_valence() -> None:
    """Expect ``positive`` valence, with confidence at most 0.50, for the praise-heavy sample."""
    sample = "".join(
        [
            "thanks great nice perfect awesome love thanks great nice perfect ",
            "this is going perfectly well today thanks ",
        ]
    )
    session = extract_session(_typed(sample), sid="g5-pos")
    observation = _of(list(session), PRIMITIVE)
    assert observation.value == "positive"
    assert observation.confidence <= 0.50
|
||||
|
||||
|
||||
def test_negative_valence_via_obscenity_and_negatives() -> None:
    """Expect ``negative`` valence, with confidence at most 0.50, for the profanity/complaint sample."""
    sample = "".join(
        [
            "fuck this is broken damn it stuck here wtf fuck shit ",
            "everything is broken and stupid today again broken again ",
            "wrong wrong wrong total disaster here and now ",
        ]
    )
    session = extract_session(_typed(sample), sid="g5-neg")
    observation = _of(list(session), PRIMITIVE)
    assert observation.value == "negative"
    assert observation.confidence <= 0.50
|
||||
|
||||
|
||||
def test_neutral_valence_when_no_lexicon_hits() -> None:
    """Expect ``neutral`` valence for a sample meant to contain no lexicon hits."""
    sample = "".join(
        [
            "running command for inspection of remote system today ",
            "checking files and verifying things look correct overall ",
        ]
    )
    session = extract_session(_typed(sample), sid="g5-neutral")
    observation = _of(list(session), PRIMITIVE)
    assert observation.value == "neutral"
|
||||
|
||||
|
||||
def test_confidence_hard_capped_at_05() -> None:
    """Confidence must not exceed 0.50 even for a long, uniformly positive sample."""
    repetitions = 50
    # Long run of a single positive word: plenty of hits and plenty of typed text.
    sample = "thanks " * repetitions
    session = extract_session(_typed(sample), sid="g5-cap")
    observation = _of(list(session), PRIMITIVE)
    assert observation.confidence <= 0.50
|
||||
|
||||
|
||||
def test_low_text_count_lower_confidence() -> None:
    """A shorter positive sample (one phrase repeated three times) yields confidence 0.30."""
    phrase = "thanks great nice perfect awesome love "
    sample = phrase * 3
    session = extract_session(_typed(sample), sid="g5-lowconf")
    observation = _of(list(session), PRIMITIVE)
    assert observation.confidence == 0.30
|
||||
Reference in New Issue
Block a user