# Eval Protocol Rollout #5
# Workflow file for this run

# Manually dispatched workflow that performs a single rollout.
name: Eval Protocol Rollout

on:
  workflow_dispatch:
    inputs:
      # Forwarded to the rollout worker as --model.
      model:
        type: string
        required: true
        description: 'Model to use for the rollout'
      # Forwarded as --rollout-id; also used in the job name and the
      # uploaded artifact's name and path.
      rollout_id:
        type: string
        required: true
        description: 'Rollout ID for tracking'
      # Forwarded as --messages-b64.
      messages_b64:
        type: string
        required: true
        description: 'Base64 encoded JSON messages array'
      # Forwarded as --tools-b64 only when a value is supplied.
      tools_b64:
        type: string
        required: false
        description: 'Base64 encoded JSON tools array (optional)'

jobs:
  # Runs one rollout for the dispatched inputs, then uploads its trace file.
  rollout:
    name: rollout-${{ inputs.rollout_id }}
    runs-on: ubuntu-latest
    steps:
      - name: Checkout code
        uses: actions/checkout@v4

      - name: Set up Python
        uses: actions/setup-python@v5
        with:
          python-version: '3.11'

      - name: Install dependencies
        run: |
          python -m pip install --upgrade pip
          pip install -e .

      - name: Run rollout script
        env:
          FIREWORKS_API_KEY: ${{ secrets.FIREWORKS_API_KEY }}
          # Dispatch inputs are caller-controlled text. They are handed to the
          # script as environment variables instead of being expanded inside
          # the script body, so quotes, `$(...)` or backticks in a value are
          # treated as data by the shell and cannot inject commands into a
          # step that has access to the API key.
          ROLLOUT_MODEL: ${{ inputs.model }}
          ROLLOUT_ID: ${{ inputs.rollout_id }}
          ROLLOUT_MESSAGES_B64: ${{ inputs.messages_b64 }}
          ROLLOUT_TOOLS_B64: ${{ inputs.tools_b64 }}
        run: |
          args=(
            --model "$ROLLOUT_MODEL"
            --rollout-id "$ROLLOUT_ID"
            --messages-b64 "$ROLLOUT_MESSAGES_B64"
          )
          # tools_b64 is optional: only pass the flag when a value was given.
          if [ -n "$ROLLOUT_TOOLS_B64" ]; then
            args+=(--tools-b64 "$ROLLOUT_TOOLS_B64")
          fi
          python tests/github_actions/rollout_worker.py "${args[@]}"

      - name: Upload rollout trace
        uses: actions/upload-artifact@v4
        if: always()  # Upload even if the rollout failed
        with:
          name: rollout-trace-${{ inputs.rollout_id }}
          # NOTE(review): presumably written by rollout_worker.py into the
          # workspace root - confirm against the script.
          path: rollout_trace_${{ inputs.rollout_id }}.json
          retention-days: 7