We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 849ed7e · commit 0031c0f · Copy full SHA for 0031c0f
1 file changed
models.py
@@ -62,6 +62,14 @@ class SignalSnapshot(BaseModel):
62
class OpsGauntletObservation(Observation):
63
"""Observation returned after reset and each step."""
64
65
+ # Override base-class reward with strict (0, 1) float constraint so the
66
+ # JSON schema explicitly tells the validator that values are bounded.
67
+ reward: float = Field(
68
+ default=0.5,
69
+ gt=0.0,
70
+ lt=1.0,
71
+ description="Reward signal from the last action, strictly between 0 and 1.",
72
+ )
73
task_id: str = Field(..., description="Current task identifier.")
74
title: str = Field(..., description="Short task title.")
75
difficulty: str = Field(..., description="Task difficulty bucket.")
0 commit comments