-
Notifications
You must be signed in to change notification settings - Fork 16
Expand file tree
/
Copy pathtest_pytest_default_agent_rollout_processor.py
More file actions
29 lines (26 loc) · 1.31 KB
/
test_pytest_default_agent_rollout_processor.py
File metadata and controls
29 lines (26 loc) · 1.31 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
from datetime import datetime
from typing import List
from eval_protocol.models import EvaluationRow, Message, EvaluateResult
from eval_protocol.pytest import AgentRolloutProcessor, evaluation_test
# The user prompt is assembled once, when this module is imported, so the
# timestamp embedded in it is the import-time value of datetime.now()
# (naive local time), not the time the rollout actually runs.
_USER_PROMPT = "Can you give a summary of the past week in the 'general, model-requests, bug-reports, questions, and feature-requests' channels. For EVERY message or thread has not been resolved, please list them at the end of your response in a table. Be sure to include the exact message, severity, and current status so far. Current Date & Time: {current_date_time}".format(
    current_date_time=datetime.now().strftime("%B %d, %Y at %I:%M %p")
)


@evaluation_test(
    # Nesting is kept exactly as the decorator is given it: a list holding one
    # list, which holds one single-message conversation.
    input_messages=[[[Message(role="user", content=_USER_PROMPT)]]],
    rollout_processor=AgentRolloutProcessor(),
    completion_params=[
        {"model": "fireworks_ai/accounts/fireworks/models/kimi-k2-instruct-0905"},
    ],
    mode="all",
)
def test_pytest_default_agent_rollout_processor(rows: List[EvaluationRow]) -> List[EvaluationRow]:
    """Attach a placeholder evaluation result to every row and return the rows.

    No real scoring happens here: each row received from the
    ``evaluation_test`` decorator gets an ``EvaluateResult`` with a score of
    0.0 and a fixed "dummy" reason.

    Args:
        rows: The evaluation rows handed to the test by the decorator.

    Returns:
        The same list object, with ``evaluation_result`` set on each row.
    """
    for evaluation_row in rows:
        evaluation_row.evaluation_result = EvaluateResult(
            score=0.0,
            reason="Dummy evaluation result",
        )
    return rows