lisihan
/
content-find-agent-new


			
							123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130
							"""config x case matrix (V2-M0E).

Replays the same captured case under different configurations to prove the
"foolproof config" safety net: changing config changes the case outcome,
visibly (snapshot diff), without breaking the pipeline. Variants that depend on
later modules (M3 per-entity dispatch) are xfail until then.
"""

from __future__ import annotations

import json
import shutil
from pathlib import Path

import pytest

from content_agent.integrations.policy_json import JsonPolicyBundleStore
from tests.replay_harness import replay_case
from tests.snapshot import assert_matches

ROOT = Path(__file__).resolve().parents[1]
_RULE_PACK_REL = "product_documents/规则包/douyin_rule_packs.v1.json"
_WALK_REL = "product_documents/抖音游走策略/douyin_walk_strategy.v1.json"


def _senior_block_store(root: Path) -> JsonPolicyBundleStore:
    """M3 config variant: flip the not_fit_senior gate to fire on fit_senior_50plus == true.

    The captured case's mock Gemini judgment marks every item fit (fit_senior_50plus=true),
    so inverting the gate's expected value blocks the whole batch by config alone — a clean
    counterproof that the hard gate (and the downstream walk) is config-driven, not hardcoded.
    """
    (root / _RULE_PACK_REL).parent.mkdir(parents=True, exist_ok=True)
    (root / _WALK_REL).parent.mkdir(parents=True, exist_ok=True)
    shutil.copy(ROOT / _WALK_REL, root / _WALK_REL)
    package = json.loads((ROOT / _RULE_PACK_REL).read_text(encoding="utf-8"))
    for pack in package.get("rule_packs", []):
        for gate in pack.get("hard_gates", []):
            if gate.get("gate_id") == "not_fit_senior":
                gate["when"]["value"] = True
    (root / _RULE_PACK_REL).write_text(json.dumps(package, ensure_ascii=False, indent=2), encoding="utf-8")
    return JsonPolicyBundleStore(root)


def _outcome(artifacts) -> dict:
    return {
        "reasons": sorted(d.get("decision_reason_code") for d in artifacts.decisions),
        "effect_status_counts": artifacts.summary.get("effect_status_counts"),
        "pooled": artifacts.summary.get("pooled_content_count"),
        "rejected": artifacts.summary.get("rejected_content_count"),
    }


def _variant_overrides(variant: str, cfg_dir: Path):
    if variant == "default":
        return None
    if variant == "senior_block":
        return {"policy_store": _senior_block_store(cfg_dir)}
    raise ValueError(variant)


@pytest.mark.parametrize("variant", ["default", "senior_block"])
def test_matrix_real_id45(variant, tmp_path):
    overrides = _variant_overrides(variant, tmp_path / "cfg")
    artifacts = replay_case("real_id45", runtime_root=tmp_path / "rt", config_overrides=overrides)
    assert artifacts.state["status"] == "success"  # config change must not break the chain
    assert_matches(f"matrix/real_id45__{variant}", _outcome(artifacts))


def test_senior_block_changes_outcome(tmp_path):
    base = _outcome(replay_case("real_id45", runtime_root=tmp_path / "rt0"))
    blocked = _outcome(
        replay_case(
            "real_id45",
            runtime_root=tmp_path / "rt1",
            config_overrides={"policy_store": _senior_block_store(tmp_path / "cfg")},
        )
    )
    # Decoupling proof: one config edit on the not_fit_senior gate visibly moves the outcome.
    assert base != blocked
    # Default: no item is blocked by the senior-fit gate; items flow into pool / review.
    assert "content_not_fit_senior" not in base["reasons"]
    assert base["effect_status_counts"]["rule_blocked"] == 0
    # R3 第二步: 四字段热度复合后 real_id45 默认 3 进池(原 2)。
    assert base["pooled"] == 3
    # Blocked variant: every item trips the (config-inverted) hard gate -> rule_blocked reject.
    assert blocked["reasons"] == ["content_not_fit_senior"] * 4
    assert blocked["effect_status_counts"]["rule_blocked"] == 4
    assert blocked["pooled"] == 0
    assert blocked["rejected"] == 4


def test_matrix_query_profile_variant():
    from scripts.validate_query_prompts_config import validate_query_prompts_config

    config = json.loads((ROOT / "product_documents/配置/query_prompts.v1.json").read_text(encoding="utf-8"))
    assert validate_query_prompts_config(config) == []


def test_decoupling_counterproof():
    # M3A removed the Content hardcode: dispatch is parametrized by target_entity,
    # so a non-Content (e.g. Author) pack can be routed without falling back.
    source = (ROOT / "content_agent/integrations/policy_json.py").read_text(encoding="utf-8")
    assert 'target_entity") == "Content"' not in source


def test_senior_block_blocks_all_walk_expansion(tmp_path):
    # M4 受控变化: 全拦截(rule_blocked)时翻页/作者/tag 全停;砍包后 path_stop 戳=内容包。
    artifacts = replay_case(
        "real_id45",
        runtime_root=tmp_path / "rt",
        config_overrides={"policy_store": _senior_block_store(tmp_path / "cfg")},
    )
    walk_actions = artifacts.files["walk_actions.jsonl"]

    assert not [row for row in walk_actions if row["edge_id"] == "query_next_page"]
    expansions = [
        row for row in walk_actions if row["edge_id"] in {"author_to_works", "hashtag_to_query"}
    ]
    assert expansions
    assert all(row["walk_status"] == "skipped" for row in expansions)
    assert all(row["reason_code"] == "blocked_by_rule_decision" for row in expansions)

    path_stops = [row for row in walk_actions if row["edge_id"] == "path_stop"]
    assert len(path_stops) == 4
    for row in path_stops:
        assert row["rule_pack_id"] == "douyin_content_discovery_rule_pack_v1"
        assert row["raw_payload"]["rule_pack_execution"]["executed_rule_pack_id"] == (
            "douyin_content_discovery_rule_pack_v1"
        )