|
| 1 | +import uuid |
| 2 | + |
| 3 | +from opentelemetry.sdk.trace import ReadableSpan |
| 4 | + |
| 5 | +from uipath.eval.evaluators import LegacyTrajectoryEvaluator |
| 6 | +from uipath.eval.evaluators.base_legacy_evaluator import LegacyEvaluationCriteria |
| 7 | +from uipath.eval.evaluators.legacy_trajectory_evaluator import ( |
| 8 | + LegacyTrajectoryEvaluatorConfig, |
| 9 | +) |
| 10 | +from uipath.eval.models.models import LegacyEvaluatorCategory, LegacyEvaluatorType |
| 11 | + |
| 12 | + |
| 13 | +def _legacy_trajectory_evaluator() -> LegacyTrajectoryEvaluator: |
| 14 | + return LegacyTrajectoryEvaluator( |
| 15 | + id=str(uuid.uuid4()), |
| 16 | + name="Legacy trajectory", |
| 17 | + config_type=LegacyTrajectoryEvaluatorConfig, |
| 18 | + evaluation_criteria_type=LegacyEvaluationCriteria, |
| 19 | + justification_type=str, |
| 20 | + category=LegacyEvaluatorCategory.Trajectory, |
| 21 | + type=LegacyEvaluatorType.Trajectory, |
| 22 | + prompt="History:\n{{AgentRunHistory}}\nExpected:\n{{ExpectedAgentBehavior}}", |
| 23 | + createdAt="2026-05-14T00:00:00Z", |
| 24 | + updatedAt="2026-05-14T00:00:00Z", |
| 25 | + ) |
| 26 | + |
| 27 | + |
| 28 | +def test_legacy_trajectory_prompt_uses_compact_tool_history() -> None: |
| 29 | + long_prompt = "SYSTEM_PROMPT_" + ("x" * 10_000) |
| 30 | + spans = [ |
| 31 | + ReadableSpan( |
| 32 | + name="agent_llm_call", |
| 33 | + start_time=0, |
| 34 | + end_time=1, |
| 35 | + attributes={ |
| 36 | + "openinference.span.kind": "LLM", |
| 37 | + "input.value": f'{{"messages": [{{"role": "system", "content": "{long_prompt}"}}]}}', |
| 38 | + "output.value": '{"generations": []}', |
| 39 | + }, |
| 40 | + ), |
| 41 | + ReadableSpan( |
| 42 | + name="search_profiles", |
| 43 | + start_time=1, |
| 44 | + end_time=2, |
| 45 | + attributes={ |
| 46 | + "openinference.span.kind": "TOOL", |
| 47 | + "tool.name": "search_profiles", |
| 48 | + "input.value": '{"query": "mentor"}', |
| 49 | + "output.value": '{"content": "found mentor profile"}', |
| 50 | + "metadata": f'{{"agent_prompt": "{long_prompt}"}}', |
| 51 | + }, |
| 52 | + ), |
| 53 | + ] |
| 54 | + |
| 55 | + prompt = _legacy_trajectory_evaluator()._create_evaluation_prompt( |
| 56 | + expected_agent_behavior="The agent should search matching profiles.", |
| 57 | + agent_run_history=spans, |
| 58 | + ) |
| 59 | + |
| 60 | + assert "SYSTEM_PROMPT_" not in prompt |
| 61 | + assert "Tool: search_profiles" in prompt |
| 62 | + assert '{"query": "mentor"}' in prompt |
| 63 | + assert "found mentor profile" in prompt |
| 64 | + assert "agent_llm_call" not in prompt |
0 commit comments