Skip to content

Commit 8104c85

Browse files
author
Dylan Huang
committed
validate logs response
1 parent c01c854 commit 8104c85

File tree

2 files changed

+77
-15
lines changed

2 files changed

+77
-15
lines changed

eval_protocol/utils/logs_models.py

Lines changed: 45 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,45 @@
1+
"""
2+
Pydantic models for the logs server API.
3+
4+
This module contains data models that match the TypeScript schemas in eval-protocol.ts
5+
to ensure consistent data structure between Python backend and TypeScript frontend.
6+
"""
7+
8+
from typing import Any, List, Optional
9+
from pydantic import BaseModel, ConfigDict, Field
10+
11+
12+
class LogEntry(BaseModel):
    """
    A single log record retrieved from Elasticsearch.

    Mirrors ``LogEntrySchema`` in ``eval-protocol.ts`` so the Python backend
    and the TypeScript frontend agree on the wire format. The Elasticsearch
    document uses ``@timestamp``; ``populate_by_name`` lets Python code
    construct instances via the ``timestamp`` attribute name as well.
    """

    # Required fields present on every log document.
    timestamp: str = Field(
        default=...,
        alias="@timestamp",
        description="ISO 8601 timestamp of the log entry",
    )
    level: str = Field(default=..., description="Log level (DEBUG, INFO, WARNING, ERROR)")
    message: str = Field(default=..., description="The log message")
    logger_name: str = Field(default=..., description="Name of the logger that created this entry")
    rollout_id: str = Field(default=..., description="ID of the rollout this log belongs to")

    # Optional status metadata; absent on most entries.
    status_code: Optional[int] = Field(default=None, description="Optional status code")
    status_message: Optional[str] = Field(default=None, description="Optional status message")
    status_details: Optional[List[Any]] = Field(default=None, description="Optional status details")

    # Accept both the field name ("timestamp") and the alias ("@timestamp").
    model_config = ConfigDict(populate_by_name=True)
30+
31+
32+
class LogsResponse(BaseModel):
    """
    Response payload for the ``get_logs`` endpoint.

    Mirrors ``LogsResponseSchema`` in ``eval-protocol.ts`` so the Python
    backend and the TypeScript frontend agree on the wire format.
    """

    logs: List[LogEntry] = Field(..., description="Array of log entries")
    total: int = Field(..., description="Total number of logs available")
    rollout_id: str = Field(..., description="The rollout ID these logs belong to")
    filtered_by_level: Optional[str] = Field(None, description="Log level filter applied")

    # NOTE: an empty `model_config = ConfigDict()` was removed — ConfigDict()
    # with no arguments is identical to pydantic's defaults (dead code).

eval_protocol/utils/logs_server.py

Lines changed: 32 additions & 15 deletions
Original file line numberDiff line numberDiff line change
@@ -20,6 +20,7 @@
2020
from eval_protocol.utils.vite_server import ViteServer
2121
from eval_protocol.logging.elasticsearch_client import ElasticsearchClient
2222
from eval_protocol.types.remote_rollout_processor import ElasticsearchConfig
23+
from eval_protocol.utils.logs_models import LogEntry, LogsResponse
2324

2425
if TYPE_CHECKING:
2526
from eval_protocol.models import EvaluationRow
@@ -339,12 +340,12 @@ async def status():
339340
"elasticsearch_enabled": self.elasticsearch_client is not None,
340341
}
341342

342-
@self.app.get("/api/logs/{rollout_id}")
343+
@self.app.get("/api/logs/{rollout_id}", response_model=LogsResponse, response_model_exclude_none=True)
343344
async def get_logs(
344345
rollout_id: str,
345346
level: Optional[str] = Query(None, description="Filter by log level (DEBUG, INFO, WARNING, ERROR)"),
346347
limit: int = Query(100, description="Maximum number of log entries to return"),
347-
):
348+
) -> LogsResponse:
348349
"""Get logs for a specific rollout ID from Elasticsearch."""
349350
if not self.elasticsearch_client:
350351
raise HTTPException(status_code=503, detail="Elasticsearch is not configured for this logs server")
@@ -354,20 +355,35 @@ async def get_logs(
354355
search_results = self.elasticsearch_client.search_by_match("rollout_id", rollout_id, size=limit)
355356

356357
if not search_results or "hits" not in search_results:
357-
return {"logs": [], "total": 0}
358-
359-
logs = []
358+
# Return empty response using Pydantic model
359+
return LogsResponse(
360+
logs=[],
361+
total=0,
362+
rollout_id=rollout_id,
363+
filtered_by_level=level,
364+
)
365+
366+
log_entries = []
360367
for hit in search_results["hits"]["hits"]:
361-
log_entry = hit["_source"]
368+
log_data = hit["_source"]
362369

363370
# Filter by level if specified
364-
if level and log_entry.get("level") != level:
371+
if level and log_data.get("level") != level:
365372
continue
366373

367-
logs.append(log_entry)
374+
# Create LogEntry using Pydantic model for validation
375+
try:
376+
log_entry = LogEntry(
377+
**log_data # Use ** to unpack the dict, Pydantic will handle field mapping
378+
)
379+
log_entries.append(log_entry)
380+
except Exception as e:
381+
# Log the error but continue processing other entries
382+
logger.warning(f"Failed to parse log entry: {e}, data: {log_data}")
383+
continue
368384

369385
# Sort by timestamp (most recent first)
370-
logs.sort(key=lambda x: x.get("@timestamp", ""), reverse=True)
386+
log_entries.sort(key=lambda x: x.timestamp, reverse=True)
371387

372388
# Get total count
373389
total_hits = search_results["hits"]["total"]
@@ -378,12 +394,13 @@ async def get_logs(
378394
# Elasticsearch 6 format
379395
total_count = total_hits
380396

381-
return {
382-
"logs": logs,
383-
"total": total_count,
384-
"rollout_id": rollout_id,
385-
"filtered_by_level": level,
386-
}
397+
# Return response using Pydantic model
398+
return LogsResponse(
399+
logs=log_entries,
400+
total=total_count,
401+
rollout_id=rollout_id,
402+
filtered_by_level=level,
403+
)
387404

388405
except Exception as e:
389406
logger.error(f"Error retrieving logs for rollout {rollout_id}: {e}")

0 commit comments

Comments
 (0)