From 0b2771f537442d051cb84033b188434177af9cb0 Mon Sep 17 00:00:00 2001
From: Pranay Prakash <pranay.gp@gmail.com>
Date: Wed, 17 Dec 2025 19:24:44 -0800
Subject: [PATCH 01/27] perf: implement event-sourced architecture

---
 .changeset/event-sourced-entities.md          |  14 +
 packages/cli/src/lib/inspect/output.ts        |   2 +-
 packages/cli/src/lib/inspect/run.ts           |   2 +-
 packages/core/src/events-consumer.test.ts     |  92 ++-
 packages/core/src/events-consumer.ts          |   5 +
 packages/core/src/global.ts                   |   1 +
 packages/core/src/runtime.ts                  |  83 ++-
 packages/core/src/runtime/start.ts            |  32 +-
 packages/core/src/runtime/step-handler.ts     | 100 ++-
 .../core/src/runtime/suspension-handler.ts    | 365 ++++------
 packages/core/src/step.ts                     |  55 +-
 packages/core/src/workflow.test.ts            |  44 +-
 packages/core/src/workflow.ts                 |  21 +
 .../src/api/workflow-server-actions.ts        |   6 +-
 .../src/sidebar/attribute-panel.tsx           |  65 ++
 .../trace-span-construction.ts                |   4 +-
 .../lib/flow-graph/graph-execution-mapper.ts  |  14 +-
 packages/world-local/src/storage.test.ts      | 463 ++++++------
 packages/world-local/src/storage.ts           | 598 ++++++++++------
 packages/world-postgres/src/drizzle/schema.ts |  17 +-
 packages/world-postgres/src/storage.ts        | 656 ++++++++++--------
 packages/world-postgres/test/storage.test.ts  | 413 ++++++-----
 packages/world-vercel/src/events.ts           |  34 +-
 packages/world-vercel/src/steps.ts            |  77 +-
 packages/world-vercel/src/storage.ts          |  34 +-
 packages/world/src/events.ts                  | 184 ++++-
 packages/world/src/interfaces.ts              |  75 +-
 packages/world/src/steps.ts                   |  15 +-
 28 files changed, 2078 insertions(+), 1393 deletions(-)
 create mode 100644 .changeset/event-sourced-entities.md

diff --git a/.changeset/event-sourced-entities.md b/.changeset/event-sourced-entities.md
new file mode 100644
index 000000000..27cdb84c0
--- /dev/null
+++ b/.changeset/event-sourced-entities.md
@@ -0,0 +1,14 @@
+---
+"@workflow/core": patch
+"@workflow/world": patch
+"@workflow/world-local": patch
+"@workflow/world-postgres": patch
+"@workflow/world-vercel": patch
+---
+
+perf: implement event-sourced architecture for runs, steps, and hooks
+
+- Add run lifecycle events (run_created, run_started, run_completed, run_failed, run_cancelled, run_paused, run_resumed)
+- Update world implementations to create/update entities from events via events.create()
+- Entities (runs, steps, hooks) are now materializations of the event log
+- This makes the system faster, easier to reason about, and resilient to data inconsistencies
diff --git a/packages/cli/src/lib/inspect/output.ts b/packages/cli/src/lib/inspect/output.ts
index 75700d15f..f1869c006 100644
--- a/packages/cli/src/lib/inspect/output.ts
+++ b/packages/cli/src/lib/inspect/output.ts
@@ -50,7 +50,7 @@ const STEP_LISTED_PROPS: (keyof Step)[] = [
   'stepId',
   'stepName',
   'status',
-  'startedAt',
+  'firstStartedAt',
   'completedAt',
   ...STEP_IO_PROPS,
 ];
diff --git a/packages/cli/src/lib/inspect/run.ts b/packages/cli/src/lib/inspect/run.ts
index 8a4f0f2f2..6827e3aa8 100644
--- a/packages/cli/src/lib/inspect/run.ts
+++ b/packages/cli/src/lib/inspect/run.ts
@@ -68,6 +68,6 @@ export const startRun = async (
 };
 
 export const cancelRun = async (world: World, runId: string) => {
-  await world.runs.cancel(runId);
+  await world.events.create(runId, { eventType: 'run_cancelled' });
   logger.log(chalk.green(`Cancel signal sent to run ${runId}`));
 };
diff --git a/packages/core/src/events-consumer.test.ts b/packages/core/src/events-consumer.test.ts
index dfb73e2ae..90fd141ab 100644
--- a/packages/core/src/events-consumer.test.ts
+++ b/packages/core/src/events-consumer.test.ts
@@ -73,6 +73,7 @@ describe('EventsConsumer', () => {
       await waitForNextTick();
 
       expect(callback).toHaveBeenCalledWith(event);
+      // Without auto-advance, callback is only called once
       expect(callback).toHaveBeenCalledTimes(1);
     });
   });
@@ -87,6 +88,7 @@ describe('EventsConsumer', () => {
       await waitForNextTick();
 
       expect(callback).toHaveBeenCalledWith(event);
+      // Without auto-advance, callback is only called once
       expect(callback).toHaveBeenCalledTimes(1);
     });
 
@@ -109,23 +111,27 @@ describe('EventsConsumer', () => {
       consumer.subscribe(callback);
       await waitForNextTick();
 
+      // callback finishes at event1, index advances to 1
+      // Without auto-advance, event2 is NOT processed
       expect(consumer.eventIndex).toBe(1);
       expect(consumer.callbacks).toHaveLength(0);
     });
 
-    it('should not increment event index when callback returns false', async () => {
+    it('should NOT auto-advance when all callbacks return NotConsumed', async () => {
       const event = createMockEvent();
       const consumer = new EventsConsumer([event]);
       const callback = vi.fn().mockReturnValue(EventConsumerResult.NotConsumed);
 
       consumer.subscribe(callback);
       await waitForNextTick();
+      await waitForNextTick(); // Extra tick to confirm no auto-advance
 
+      // Without auto-advance, eventIndex stays at 0
       expect(consumer.eventIndex).toBe(0);
       expect(consumer.callbacks).toContain(callback);
     });
 
-    it('should process multiple callbacks until one returns true', async () => {
+    it('should process multiple callbacks until one returns Consumed or Finished', async () => {
       const event = createMockEvent();
       const consumer = new EventsConsumer([event]);
       const callback1 = vi
@@ -140,15 +146,17 @@ describe('EventsConsumer', () => {
       consumer.subscribe(callback2);
       consumer.subscribe(callback3);
       await waitForNextTick();
+      await waitForNextTick(); // For next event processing
 
       expect(callback1).toHaveBeenCalledWith(event);
       expect(callback2).toHaveBeenCalledWith(event);
+      // callback3 sees the next event (null since we only have one event)
       expect(callback3).toHaveBeenCalledWith(null);
       expect(consumer.eventIndex).toBe(1);
       expect(consumer.callbacks).toEqual([callback1, callback3]);
     });
 
-    it('should process all callbacks when none return true', async () => {
+    it('should NOT advance when all callbacks return NotConsumed', async () => {
       const event = createMockEvent();
       const consumer = new EventsConsumer([event]);
       const callback1 = vi
@@ -169,6 +177,7 @@ describe('EventsConsumer', () => {
       expect(callback1).toHaveBeenCalledWith(event);
       expect(callback2).toHaveBeenCalledWith(event);
       expect(callback3).toHaveBeenCalledWith(event);
+      // Without auto-advance, eventIndex stays at 0
       expect(consumer.eventIndex).toBe(0);
       expect(consumer.callbacks).toEqual([callback1, callback2, callback3]);
     });
@@ -211,7 +220,7 @@ describe('EventsConsumer', () => {
       expect(callback2).toHaveBeenCalledWith(null);
     });
 
-    it('should handle complex event processing scenario', async () => {
+    it('should handle complex event processing with multiple consumers', async () => {
       const events = [
         createMockEvent({ id: 'event-1', event_type: 'type-a' }),
         createMockEvent({ id: 'event-2', event_type: 'type-b' }),
@@ -241,13 +250,14 @@ describe('EventsConsumer', () => {
       consumer.subscribe(typeBCallback);
       await waitForNextTick();
       await waitForNextTick(); // Wait for recursive processing
-      await waitForNextTick(); // Wait for final processing
 
-      // typeACallback processes event-1 and gets removed, so it won't process event-3
+      // typeACallback processes event-1 and gets removed
       expect(typeACallback).toHaveBeenCalledTimes(1); // Called for event-1 only
+      // typeBCallback processes event-2 and gets removed
       expect(typeBCallback).toHaveBeenCalledTimes(1); // Called for event-2
-      expect(consumer.eventIndex).toBe(2); // Only 2 events processed (event-3 remains)
-      expect(consumer.callbacks).toHaveLength(0); // Both callbacks removed after consuming their events
+      // eventIndex is at 2 (after event-1 and event-2 were consumed)
+      expect(consumer.eventIndex).toBe(2);
+      expect(consumer.callbacks).toHaveLength(0);
     });
   });
 
@@ -297,8 +307,9 @@ describe('EventsConsumer', () => {
       consumer.subscribe(callback3);
       await waitForNextTick();
 
-      // callback2 should be removed when it returns true
+      // callback2 should be removed when it returns Finished
       expect(consumer.callbacks).toEqual([callback1, callback3]);
+      // callback3 is called with the next event (null after event-1)
       expect(callback3).toHaveBeenCalledWith(null);
     });
 
@@ -314,25 +325,6 @@ describe('EventsConsumer', () => {
       expect(consumer.eventIndex).toBe(1);
     });
 
-    it('should handle multiple subscriptions happening in sequence', async () => {
-      const event1 = createMockEvent({ id: 'event-1' });
-      const event2 = createMockEvent({ id: 'event-2' });
-      const consumer = new EventsConsumer([event1, event2]);
-
-      const callback1 = vi.fn().mockReturnValue(EventConsumerResult.Finished);
-      const callback2 = vi.fn().mockReturnValue(EventConsumerResult.Finished);
-
-      consumer.subscribe(callback1);
-      await waitForNextTick();
-
-      consumer.subscribe(callback2);
-      await waitForNextTick();
-
-      expect(callback1).toHaveBeenCalledWith(event1);
-      expect(callback2).toHaveBeenCalledWith(event2);
-      expect(consumer.eventIndex).toBe(2);
-    });
-
     it('should handle empty events array gracefully', async () => {
       const consumer = new EventsConsumer([]);
       const callback = vi.fn().mockReturnValue(EventConsumerResult.NotConsumed);
@@ -343,5 +335,49 @@ describe('EventsConsumer', () => {
       expect(callback).toHaveBeenCalledWith(null);
       expect(consumer.eventIndex).toBe(0);
     });
+
+    it('should process events in order with proper consumers', async () => {
+      // This test simulates the workflow scenario:
+      // - run_created consumer consumes it
+      // - step consumer gets step_created, step_completed
+      const events = [
+        createMockEvent({ id: 'run-created', event_type: 'run_created' }),
+        createMockEvent({ id: 'step-created', event_type: 'step_created' }),
+        createMockEvent({ id: 'step-completed', event_type: 'step_completed' }),
+      ];
+      const consumer = new EventsConsumer(events);
+
+      // Run lifecycle consumer - consumes run_created
+      const runConsumer = vi.fn().mockImplementation((event: Event | null) => {
+        if (event?.event_type === 'run_created') {
+          return EventConsumerResult.Consumed;
+        }
+        return EventConsumerResult.NotConsumed;
+      });
+
+      // Step consumer - consumes step_created, finishes on step_completed
+      const stepConsumer = vi.fn().mockImplementation((event: Event | null) => {
+        if (event?.event_type === 'step_created') {
+          return EventConsumerResult.Consumed;
+        }
+        if (event?.event_type === 'step_completed') {
+          return EventConsumerResult.Finished;
+        }
+        return EventConsumerResult.NotConsumed;
+      });
+
+      consumer.subscribe(runConsumer);
+      consumer.subscribe(stepConsumer);
+      await waitForNextTick();
+      await waitForNextTick();
+      await waitForNextTick();
+
+      // runConsumer consumes run_created
+      expect(runConsumer).toHaveBeenCalledWith(events[0]);
+      // stepConsumer consumes step_created, then finishes on step_completed
+      expect(stepConsumer).toHaveBeenCalledWith(events[1]);
+      expect(stepConsumer).toHaveBeenCalledWith(events[2]);
+      expect(consumer.eventIndex).toBe(3);
+    });
   });
 });
diff --git a/packages/core/src/events-consumer.ts b/packages/core/src/events-consumer.ts
index f38d7fbd6..221d111fa 100644
--- a/packages/core/src/events-consumer.ts
+++ b/packages/core/src/events-consumer.ts
@@ -78,5 +78,10 @@ export class EventsConsumer {
         return;
       }
     }
+
+    // If we reach here, all callbacks returned NotConsumed.
+    // We do NOT auto-advance - every event must have a consumer.
+    // With proper consumers for run_created/run_started/step_created,
+    // this should not cause events to get stuck.
   };
 }
diff --git a/packages/core/src/global.ts b/packages/core/src/global.ts
index 17a680dc4..7f1853512 100644
--- a/packages/core/src/global.ts
+++ b/packages/core/src/global.ts
@@ -6,6 +6,7 @@ export interface StepInvocationQueueItem {
   stepName: string;
   args: Serializable[];
   closureVars?: Record<string, Serializable>;
+  hasCreatedEvent?: boolean;
 }
 
 export interface HookInvocationQueueItem {
diff --git a/packages/core/src/runtime.ts b/packages/core/src/runtime.ts
index cf38e3bcf..ae02b408d 100644
--- a/packages/core/src/runtime.ts
+++ b/packages/core/src/runtime.ts
@@ -104,7 +104,9 @@ export class Run<TResult> {
    * Cancels the workflow run.
    */
   async cancel(): Promise<void> {
-    await this.world.runs.cancel(this.runId);
+    await this.world.events.create(this.runId, {
+      eventType: 'run_cancelled',
+    });
   }
 
   /**
@@ -272,10 +274,14 @@ export function workflowEntrypoint(
               let workflowRun = await world.runs.get(runId);
 
               if (workflowRun.status === 'pending') {
-                workflowRun = await world.runs.update(runId, {
-                  // This sets the `startedAt` timestamp at the database level
-                  status: 'running',
+                // Transition run to 'running' via event (event-sourced architecture)
+                const result = await world.events.create(runId, {
+                  eventType: 'run_started',
                 });
+                // Use the run entity from the event response (no extra get call needed)
+                if (result.run) {
+                  workflowRun = result.run;
+                }
               }
 
               // At this point, the workflow is "running" and `startedAt` should
@@ -310,27 +316,35 @@ export function workflowEntrypoint(
               // Load all events into memory before running
               const events = await getAllWorkflowRunEvents(workflowRun.runId);
 
-              // Check for any elapsed waits and create wait_completed events
+              // Check for any elapsed waits and batch create wait_completed events
               const now = Date.now();
-              for (const event of events) {
-                if (event.eventType === 'wait_created') {
-                  const resumeAt = event.eventData.resumeAt as Date;
-                  const hasCompleted = events.some(
-                    (e) =>
-                      e.eventType === 'wait_completed' &&
-                      e.correlationId === event.correlationId
-                  );
 
-                  // If wait has elapsed and hasn't been completed yet
-                  if (!hasCompleted && now >= resumeAt.getTime()) {
-                    const completedEvent = await world.events.create(runId, {
-                      eventType: 'wait_completed',
-                      correlationId: event.correlationId,
-                    });
-                    // Add the event to the events array so the workflow can see it
-                    events.push(completedEvent);
-                  }
-                }
+              // Pre-compute completed correlation IDs for O(n) lookup instead of O(n²)
+              const completedWaitIds = new Set(
+                events
+                  .filter((e) => e.eventType === 'wait_completed')
+                  .map((e) => e.correlationId)
+              );
+
+              // Collect all waits that need completion
+              const waitsToComplete = events
+                .filter(
+                  (e): e is typeof e & { correlationId: string } =>
+                    e.eventType === 'wait_created' &&
+                    e.correlationId !== undefined &&
+                    !completedWaitIds.has(e.correlationId) &&
+                    now >= (e.eventData.resumeAt as Date).getTime()
+                )
+                .map((e) => ({
+                  eventType: 'wait_completed' as const,
+                  correlationId: e.correlationId,
+                }));
+
+              // Create all wait_completed events
+              for (const waitEvent of waitsToComplete) {
+                const result = await world.events.create(runId, waitEvent);
+                // Add the event to the events array so the workflow can see it
+                events.push(result.event);
               }
 
               const result = await runWorkflow(
@@ -339,10 +353,12 @@ export function workflowEntrypoint(
                 events
               );
 
-              // Update the workflow run with the result
-              await world.runs.update(runId, {
-                status: 'completed',
-                output: result as Serializable,
+              // Complete the workflow run via event (event-sourced architecture)
+              await world.events.create(runId, {
+                eventType: 'run_completed',
+                eventData: {
+                  output: result as Serializable,
+                },
               });
 
               span?.setAttributes({
@@ -393,11 +409,14 @@ export function workflowEntrypoint(
                 console.error(
                   `${errorName} while running "${runId}" workflow:\n\n${errorStack}`
                 );
-                await world.runs.update(runId, {
-                  status: 'failed',
-                  error: {
-                    message: errorMessage,
-                    stack: errorStack,
+                // Fail the workflow run via event (event-sourced architecture)
+                await world.events.create(runId, {
+                  eventType: 'run_failed',
+                  eventData: {
+                    error: {
+                      message: errorMessage,
+                      stack: errorStack,
+                    },
                     // TODO: include error codes when we define them
                   },
                 });
diff --git a/packages/core/src/runtime/start.ts b/packages/core/src/runtime/start.ts
index 687bf012b..2c43395f5 100644
--- a/packages/core/src/runtime/start.ts
+++ b/packages/core/src/runtime/start.ts
@@ -92,22 +92,30 @@ export async function start<TArgs extends unknown[], TResult>(
       const { promise: runIdPromise, resolve: resolveRunId } =
         withResolvers<string>();
 
+      // Serialize current trace context to propagate across queue boundary
+      const traceCarrier = await serializeTraceCarrier();
+
+      // Create run via run_created event (event-sourced architecture)
+      // Pass null for runId - the server generates it and returns it in the response
       const workflowArguments = dehydrateWorkflowArguments(
         args,
         ops,
         runIdPromise
       );
-      // Serialize current trace context to propagate across queue boundary
-      const traceCarrier = await serializeTraceCarrier();
 
-      const runResponse = await world.runs.create({
-        deploymentId: deploymentId,
-        workflowName: workflowName,
-        input: workflowArguments,
-        executionContext: { traceCarrier },
+      const result = await world.events.create(null, {
+        eventType: 'run_created',
+        eventData: {
+          deploymentId: deploymentId,
+          workflowName: workflowName,
+          input: workflowArguments,
+          executionContext: { traceCarrier },
+        },
       });
 
-      resolveRunId(runResponse.runId);
+      // Get the server-generated runId from the event response
+      const runId = result.event.runId;
+      resolveRunId(runId);
 
       waitUntil(
         Promise.all(ops).catch((err) => {
@@ -119,15 +127,15 @@ export async function start<TArgs extends unknown[], TResult>(
       );
 
       span?.setAttributes({
-        ...Attribute.WorkflowRunId(runResponse.runId),
-        ...Attribute.WorkflowRunStatus(runResponse.status),
+        ...Attribute.WorkflowRunId(runId),
+        ...Attribute.WorkflowRunStatus('pending'),
         ...Attribute.DeploymentId(deploymentId),
       });
 
       await world.queue(
         `__wkf_workflow_${workflowName}`,
         {
-          runId: runResponse.runId,
+          runId,
           traceCarrier,
         } satisfies WorkflowInvokePayload,
         {
@@ -135,7 +143,7 @@ export async function start<TArgs extends unknown[], TResult>(
         }
       );
 
-      return new Run<TResult>(runResponse.runId);
+      return new Run<TResult>(runId);
     });
   });
 }
diff --git a/packages/core/src/runtime/step-handler.ts b/packages/core/src/runtime/step-handler.ts
index 5390ccada..a860f6d2c 100644
--- a/packages/core/src/runtime/step-handler.ts
+++ b/packages/core/src/runtime/step-handler.ts
@@ -114,23 +114,17 @@ const stepHandler = getWorldHandlers().createQueueHandler(
           }
 
           let result: unknown;
-          const attempt = step.attempt + 1;
 
           // Check max retries FIRST before any state changes.
+          // step.attempt tracks how many times step_started has been called.
+          // If step.attempt >= maxRetries, we've already tried maxRetries times.
           // This handles edge cases where the step handler is invoked after max retries have been exceeded
-          // (e.g., when the step repeatedly times out or fails before reaching the catch handler at line 822).
+          // (e.g., when the step repeatedly times out or fails before reaching the catch handler).
           // Without this check, the step would retry forever.
-          if (attempt > maxRetries) {
-            const errorMessage = `Step "${stepName}" exceeded max retries (${attempt} attempts)`;
+          if (step.attempt >= maxRetries) {
+            const errorMessage = `Step "${stepName}" exceeded max retries (${step.attempt} attempts)`;
             console.error(`[Workflows] "${workflowRunId}" - ${errorMessage}`);
-            // Update step status first (idempotent), then create event
-            await world.steps.update(workflowRunId, stepId, {
-              status: 'failed',
-              error: {
-                message: errorMessage,
-                stack: undefined,
-              },
-            });
+            // Fail the step via event (event-sourced architecture)
             await world.events.create(workflowRunId, {
               eventType: 'step_failed',
               correlationId: stepId,
@@ -192,19 +186,24 @@ const stepHandler = getWorldHandlers().createQueueHandler(
               return;
             }
 
-            await world.events.create(workflowRunId, {
-              eventType: 'step_started', // TODO: Replace with 'step_retrying'
+            // Start the step via event (event-sourced architecture)
+            // step_started increments the attempt counter in the World implementation
+            const startResult = await world.events.create(workflowRunId, {
+              eventType: 'step_started',
               correlationId: stepId,
             });
 
-            step = await world.steps.update(workflowRunId, stepId, {
-              attempt,
-              status: 'running',
-            });
+            // Use the step entity from the event response (no extra get call needed)
+            if (startResult.step) {
+              step = startResult.step;
+            }
 
-            if (!step.startedAt) {
+            // step.attempt is now the current attempt number (after increment)
+            const attempt = step.attempt;
+
+            if (!step.firstStartedAt) {
               throw new WorkflowRuntimeError(
-                `Step "${stepId}" has no "startedAt" timestamp`
+                `Step "${stepId}" has no "firstStartedAt" timestamp`
               );
             }
             // Hydrate the step input arguments and closure variables
@@ -225,7 +224,7 @@ const stepHandler = getWorldHandlers().createQueueHandler(
               {
                 stepMetadata: {
                   stepId,
-                  stepStartedAt: new Date(+step.startedAt),
+                  stepStartedAt: new Date(+step.firstStartedAt),
                   attempt,
                 },
                 workflowMetadata: {
@@ -257,16 +256,8 @@ const stepHandler = getWorldHandlers().createQueueHandler(
               })
             );
 
-            // Mark the step as completed first. This order is important. If a concurrent
-            // execution marked the step as complete, this request should throw, and
-            // this prevent the step_completed event in the event log
-            // TODO: this should really be atomic and handled by the world
-            await world.steps.update(workflowRunId, stepId, {
-              status: 'completed',
-              output: result as Serializable,
-            });
-
-            // Then, append the event log with the step result
+            // Complete the step via event (event-sourced architecture)
+            // The event creation atomically updates the step entity
             await world.events.create(workflowRunId, {
               eventType: 'step_completed',
               correlationId: stepId,
@@ -301,7 +292,7 @@ const stepHandler = getWorldHandlers().createQueueHandler(
               console.error(
                 `[Workflows] "${workflowRunId}" - Encountered \`FatalError\` while executing step "${stepName}":\n  > ${stackLines.join('\n    > ')}\n\nBubbling up error to parent workflow`
               );
-              // Fatal error - store the error in the event log and re-invoke the workflow
+              // Fail the step via event (event-sourced architecture)
               await world.events.create(workflowRunId, {
                 eventType: 'step_failed',
                 correlationId: stepId,
@@ -311,14 +302,6 @@ const stepHandler = getWorldHandlers().createQueueHandler(
                   fatal: true,
                 },
               });
-              await world.steps.update(workflowRunId, stepId, {
-                status: 'failed',
-                error: {
-                  message: err.message || String(err),
-                  stack: errorStack,
-                  // TODO: include error codes when we define them
-                },
-              });
 
               span?.setAttributes({
                 ...Attribute.StepStatus('failed'),
@@ -326,20 +309,23 @@ const stepHandler = getWorldHandlers().createQueueHandler(
               });
             } else {
               const maxRetries = stepFn.maxRetries ?? DEFAULT_STEP_MAX_RETRIES;
+              // step.attempt was incremented by step_started, use it here
+              const currentAttempt = step.attempt;
 
               span?.setAttributes({
-                ...Attribute.StepAttempt(attempt),
+                ...Attribute.StepAttempt(currentAttempt),
                 ...Attribute.StepMaxRetries(maxRetries),
               });
 
-              if (attempt > maxRetries) {
+              if (currentAttempt > maxRetries) {
                 // Max retries reached
                 const errorStack = getErrorStack(err);
                 const stackLines = errorStack.split('\n').slice(0, 4);
                 console.error(
-                  `[Workflows] "${workflowRunId}" - Encountered \`Error\` while executing step "${stepName}" (attempt ${attempt}):\n  > ${stackLines.join('\n    > ')}\n\n  Max retries reached\n  Bubbling error to parent workflow`
+                  `[Workflows] "${workflowRunId}" - Encountered \`Error\` while executing step "${stepName}" (attempt ${currentAttempt}):\n  > ${stackLines.join('\n    > ')}\n\n  Max retries reached\n  Bubbling error to parent workflow`
                 );
                 const errorMessage = `Step "${stepName}" failed after max retries: ${String(err)}`;
+                // Fail the step via event (event-sourced architecture)
                 await world.events.create(workflowRunId, {
                   eventType: 'step_failed',
                   correlationId: stepId,
@@ -349,13 +335,6 @@ const stepHandler = getWorldHandlers().createQueueHandler(
                     fatal: true,
                   },
                 });
-                await world.steps.update(workflowRunId, stepId, {
-                  status: 'failed',
-                  error: {
-                    message: errorMessage,
-                    stack: errorStack,
-                  },
-                });
 
                 span?.setAttributes({
                   ...Attribute.StepStatus('failed'),
@@ -365,30 +344,29 @@ const stepHandler = getWorldHandlers().createQueueHandler(
                 // Not at max retries yet - log as a retryable error
                 if (RetryableError.is(err)) {
                   console.warn(
-                    `[Workflows] "${workflowRunId}" - Encountered \`RetryableError\` while executing step "${stepName}" (attempt ${attempt}):\n  > ${String(err.message)}\n\n  This step has failed but will be retried`
+                    `[Workflows] "${workflowRunId}" - Encountered \`RetryableError\` while executing step "${stepName}" (attempt ${currentAttempt}):\n  > ${String(err.message)}\n\n  This step has failed but will be retried`
                   );
                 } else {
                   const stackLines = getErrorStack(err).split('\n').slice(0, 4);
                   console.error(
-                    `[Workflows] "${workflowRunId}" - Encountered \`Error\` while executing step "${stepName}" (attempt ${attempt}):\n  > ${stackLines.join('\n    > ')}\n\n  This step has failed but will be retried`
+                    `[Workflows] "${workflowRunId}" - Encountered \`Error\` while executing step "${stepName}" (attempt ${currentAttempt}):\n  > ${stackLines.join('\n    > ')}\n\n  This step has failed but will be retried`
                   );
                 }
+                // Set step to pending for retry via event (event-sourced architecture)
+                // step_retrying records the error in lastKnownError and sets status to pending
+                const errorStack = getErrorStack(err);
                 await world.events.create(workflowRunId, {
-                  eventType: 'step_failed',
+                  eventType: 'step_retrying',
                   correlationId: stepId,
                   eventData: {
                     error: String(err),
-                    stack: getErrorStack(err),
+                    stack: errorStack,
+                    ...(RetryableError.is(err) && {
+                      retryAfter: err.retryAfter,
+                    }),
                   },
                 });
 
-                await world.steps.update(workflowRunId, stepId, {
-                  status: 'pending', // TODO: Should be "retrying" once we have that status
-                  ...(RetryableError.is(err) && {
-                    retryAfter: err.retryAfter,
-                  }),
-                });
-
                 const timeoutSeconds = Math.max(
                   1,
                   RetryableError.is(err)
diff --git a/packages/core/src/runtime/suspension-handler.ts b/packages/core/src/runtime/suspension-handler.ts
index 11dcc81e7..493909c07 100644
--- a/packages/core/src/runtime/suspension-handler.ts
+++ b/packages/core/src/runtime/suspension-handler.ts
@@ -1,7 +1,7 @@
 import type { Span } from '@opentelemetry/api';
 import { waitUntil } from '@vercel/functions';
 import { WorkflowAPIError } from '@workflow/errors';
-import type { World } from '@workflow/world';
+import type { CreateEventRequest, World } from '@workflow/world';
 import type {
   HookInvocationQueueItem,
   StepInvocationQueueItem,
@@ -27,178 +27,14 @@ export interface SuspensionHandlerResult {
   timeoutSeconds?: number;
 }
 
-interface ProcessHookParams {
-  queueItem: HookInvocationQueueItem;
-  world: World;
-  runId: string;
-  global: typeof globalThis;
-}
-
-/**
- * Processes a single hook by creating it in the database and event log.
- */
-async function processHook({
-  queueItem,
-  world,
-  runId,
-  global,
-}: ProcessHookParams): Promise<void> {
-  try {
-    // Create hook in database
-    const hookMetadata =
-      typeof queueItem.metadata === 'undefined'
-        ? undefined
-        : dehydrateStepArguments(queueItem.metadata, global);
-    await world.hooks.create(runId, {
-      hookId: queueItem.correlationId,
-      token: queueItem.token,
-      metadata: hookMetadata,
-    });
-
-    // Create hook_created event in event log
-    await world.events.create(runId, {
-      eventType: 'hook_created',
-      correlationId: queueItem.correlationId,
-    });
-  } catch (err) {
-    if (WorkflowAPIError.is(err)) {
-      if (err.status === 409) {
-        // Hook already exists (duplicate hook_id constraint), so we can skip it
-        console.warn(
-          `Hook with correlation ID "${queueItem.correlationId}" already exists, skipping: ${err.message}`
-        );
-        return;
-      } else if (err.status === 410) {
-        // Workflow has already completed, so no-op
-        console.warn(
-          `Workflow run "${runId}" has already completed, skipping hook "${queueItem.correlationId}": ${err.message}`
-        );
-        return;
-      }
-    }
-    throw err;
-  }
-}
-
-interface ProcessStepParams {
-  queueItem: StepInvocationQueueItem;
-  world: World;
-  runId: string;
-  workflowName: string;
-  workflowStartedAt: number;
-  global: typeof globalThis;
-}
-
-/**
- * Processes a single step by creating it in the database and queueing execution.
- */
-async function processStep({
-  queueItem,
-  world,
-  runId,
-  workflowName,
-  workflowStartedAt,
-  global,
-}: ProcessStepParams): Promise<void> {
-  const ops: Promise<void>[] = [];
-  const dehydratedInput = dehydrateStepArguments(
-    {
-      args: queueItem.args,
-      closureVars: queueItem.closureVars,
-    },
-    global
-  );
-
-  try {
-    const step = await world.steps.create(runId, {
-      stepId: queueItem.correlationId,
-      stepName: queueItem.stepName,
-      input: dehydratedInput as Serializable,
-    });
-
-    waitUntil(
-      Promise.all(ops).catch((opErr) => {
-        // Ignore expected client disconnect errors (e.g., browser refresh during streaming)
-        const isAbortError =
-          opErr?.name === 'AbortError' || opErr?.name === 'ResponseAborted';
-        if (!isAbortError) throw opErr;
-      })
-    );
-
-    await queueMessage(
-      world,
-      `__wkf_step_${queueItem.stepName}`,
-      {
-        workflowName,
-        workflowRunId: runId,
-        workflowStartedAt,
-        stepId: step.stepId,
-        traceCarrier: await serializeTraceCarrier(),
-        requestedAt: new Date(),
-      },
-      {
-        idempotencyKey: queueItem.correlationId,
-      }
-    );
-  } catch (err) {
-    if (WorkflowAPIError.is(err) && err.status === 409) {
-      // Step already exists, so we can skip it
-      console.warn(
-        `Step "${queueItem.stepName}" with correlation ID "${queueItem.correlationId}" already exists, skipping: ${err.message}`
-      );
-      return;
-    }
-    throw err;
-  }
-}
-
-interface ProcessWaitParams {
-  queueItem: WaitInvocationQueueItem;
-  world: World;
-  runId: string;
-}
-
-/**
- * Processes a single wait by creating the event and calculating timeout.
- * @returns The timeout in seconds, or null if the wait already exists.
- */
-async function processWait({
-  queueItem,
-  world,
-  runId,
-}: ProcessWaitParams): Promise<number | null> {
-  try {
-    // Only create wait_created event if it hasn't been created yet
-    if (!queueItem.hasCreatedEvent) {
-      await world.events.create(runId, {
-        eventType: 'wait_created',
-        correlationId: queueItem.correlationId,
-        eventData: {
-          resumeAt: queueItem.resumeAt,
-        },
-      });
-    }
-
-    // Calculate how long to wait before resuming
-    const now = Date.now();
-    const resumeAtMs = queueItem.resumeAt.getTime();
-    const delayMs = Math.max(1000, resumeAtMs - now);
-    return Math.ceil(delayMs / 1000);
-  } catch (err) {
-    if (WorkflowAPIError.is(err) && err.status === 409) {
-      // Wait already exists, so we can skip it
-      console.warn(
-        `Wait with correlation ID "${queueItem.correlationId}" already exists, skipping: ${err.message}`
-      );
-      return null;
-    }
-    throw err;
-  }
-}
-
 /**
  * Handles a workflow suspension by processing all pending operations (hooks, steps, waits).
- * Hooks are processed first to prevent race conditions, then steps and waits in parallel.
+ * Uses an event-sourced architecture where entities (steps, hooks) are created atomically
+ * with their corresponding events via events.create().
+ *
+ * Processing order:
+ * 1. Hooks are processed first to prevent race conditions with webhook receivers
+ * 2. Steps and waits are processed in parallel after hooks complete
  */
 export async function handleSuspension({
   suspension,
@@ -208,7 +44,7 @@ export async function handleSuspension({
   workflowStartedAt,
   span,
 }: SuspensionHandlerParams): Promise<SuspensionHandlerResult> {
-  // Separate queue items by type for parallel processing
+  // Separate queue items by type
   const stepItems = suspension.steps.filter(
     (item): item is StepInvocationQueueItem => item.type === 'step'
   );
@@ -219,49 +55,157 @@ export async function handleSuspension({
     (item): item is WaitInvocationQueueItem => item.type === 'wait'
   );
 
-  // Process all hooks first to prevent race conditions
-  await Promise.all(
-    hookItems.map((queueItem) =>
-      processHook({
-        queueItem,
-        world,
-        runId,
-        global: suspension.globalThis,
+  // Build hook_created events (World will atomically create hook entities)
+  const hookEvents: CreateEventRequest[] = hookItems.map((queueItem) => {
+    const hookMetadata =
+      typeof queueItem.metadata === 'undefined'
+        ? undefined
+        : dehydrateStepArguments(queueItem.metadata, suspension.globalThis);
+    return {
+      eventType: 'hook_created' as const,
+      correlationId: queueItem.correlationId,
+      eventData: {
+        token: queueItem.token,
+        metadata: hookMetadata,
+      },
+    };
+  });
+
+  // Process hooks first to prevent race conditions with webhook receivers
+  // All hook creations run in parallel
+  if (hookEvents.length > 0) {
+    await Promise.all(
+      hookEvents.map(async (hookEvent) => {
+        try {
+          await world.events.create(runId, hookEvent);
+        } catch (err) {
+          if (WorkflowAPIError.is(err)) {
+            if (err.status === 409) {
+              console.warn(`Hook already exists, continuing: ${err.message}`);
+            } else if (err.status === 410) {
+              console.warn(
+                `Workflow run "${runId}" has already completed, skipping hook: ${err.message}`
+              );
+            } else {
+              throw err;
+            }
+          } else {
+            throw err;
+          }
+        }
       })
-    )
+    );
+  }
+
+  // Build a map of stepId -> step event for steps that need creation
+  const stepsNeedingCreation = new Set(
+    stepItems
+      .filter((queueItem) => !queueItem.hasCreatedEvent)
+      .map((queueItem) => queueItem.correlationId)
   );
 
-  // Then process steps and waits in parallel
-  const [, waitTimeouts] = await Promise.all([
-    Promise.all(
-      stepItems.map((queueItem) =>
-        processStep({
-          queueItem,
-          world,
-          runId,
-          workflowName,
-          workflowStartedAt,
-          global: suspension.globalThis,
-        })
-      )
-    ),
-    Promise.all(
-      waitItems.map((queueItem) =>
-        processWait({
-          queueItem,
+  // Process steps and waits in parallel
+  // Each step: create event (if needed) -> queue message
+  // Each wait: create event (if needed)
+  const ops: Promise<void>[] = [];
+
+  // Steps: create event then queue message, all in parallel
+  for (const queueItem of stepItems) {
+    ops.push(
+      (async () => {
+        // Create step event if not already created
+        if (stepsNeedingCreation.has(queueItem.correlationId)) {
+          const dehydratedInput = dehydrateStepArguments(
+            {
+              args: queueItem.args,
+              closureVars: queueItem.closureVars,
+            },
+            suspension.globalThis
+          );
+          const stepEvent: CreateEventRequest = {
+            eventType: 'step_created' as const,
+            correlationId: queueItem.correlationId,
+            eventData: {
+              stepName: queueItem.stepName,
+              input: dehydratedInput as Serializable,
+            },
+          };
+          try {
+            await world.events.create(runId, stepEvent);
+          } catch (err) {
+            if (WorkflowAPIError.is(err) && err.status === 409) {
+              console.warn(`Step already exists, continuing: ${err.message}`);
+            } else {
+              throw err;
+            }
+          }
+        }
+
+        // Queue step execution message
+        await queueMessage(
           world,
-          runId,
-        })
-      )
-    ),
-  ]);
+          `__wkf_step_${queueItem.stepName}`,
+          {
+            workflowName,
+            workflowRunId: runId,
+            workflowStartedAt,
+            stepId: queueItem.correlationId,
+            traceCarrier: await serializeTraceCarrier(),
+            requestedAt: new Date(),
+          },
+          {
+            idempotencyKey: queueItem.correlationId,
+          }
+        );
+      })()
+    );
+  }
+
+  // Waits: create events in parallel (no queueing needed for waits)
+  for (const queueItem of waitItems) {
+    if (!queueItem.hasCreatedEvent) {
+      ops.push(
+        (async () => {
+          const waitEvent: CreateEventRequest = {
+            eventType: 'wait_created' as const,
+            correlationId: queueItem.correlationId,
+            eventData: {
+              resumeAt: queueItem.resumeAt,
+            },
+          };
+          try {
+            await world.events.create(runId, waitEvent);
+          } catch (err) {
+            if (WorkflowAPIError.is(err) && err.status === 409) {
+              console.warn(`Wait already exists, continuing: ${err.message}`);
+            } else {
+              throw err;
+            }
+          }
+        })()
+      );
+    }
+  }
 
-  // Find minimum timeout from waits
-  const minTimeoutSeconds = waitTimeouts.reduce<number | null>(
-    (min, timeout) => {
-      if (timeout === null) return min;
-      if (min === null) return timeout;
-      return Math.min(min, timeout);
+  // Wait for all step and wait operations to complete
+  waitUntil(
+    Promise.all(ops).catch((opErr) => {
+      const isAbortError =
+        opErr?.name === 'AbortError' || opErr?.name === 'ResponseAborted';
+      if (!isAbortError) throw opErr;
+    })
+  );
+  await Promise.all(ops);
+
+  // Calculate minimum timeout from waits
+  const now = Date.now();
+  const minTimeoutSeconds = waitItems.reduce<number | null>(
+    (min, queueItem) => {
+      const resumeAtMs = queueItem.resumeAt.getTime();
+      const delayMs = Math.max(1000, resumeAtMs - now);
+      const timeoutSeconds = Math.ceil(delayMs / 1000);
+      if (min === null) return timeoutSeconds;
+      return Math.min(min, timeoutSeconds);
     },
     null
   );
@@ -273,7 +217,6 @@ export async function handleSuspension({
     ...Attribute.WorkflowWaitsCreated(waitItems.length),
   });
 
-  // If we encountered any waits, return the minimum timeout
   if (minTimeoutSeconds !== null) {
     return { timeoutSeconds: minTimeoutSeconds };
   }
diff --git a/packages/core/src/step.ts b/packages/core/src/step.ts
index f356f81f2..3f0e4563a 100644
--- a/packages/core/src/step.ts
+++ b/packages/core/src/step.ts
@@ -70,22 +70,24 @@ export function createUseStep(ctx: WorkflowOrchestratorContext) {
           return EventConsumerResult.NotConsumed;
         }
 
+        if (event.eventType === 'step_created') {
+          // Step has been created (registered for execution) - mark as having event
+          // but keep in queue so suspension handler knows to queue execution without
+          // creating a duplicate step_created event
+          const queueItem = ctx.invocationsQueue.get(correlationId);
+          if (queueItem && queueItem.type === 'step') {
+            queueItem.hasCreatedEvent = true;
+          }
+          // Continue waiting for step_started/step_completed/step_failed events
+          return EventConsumerResult.Consumed;
+        }
+
         if (event.eventType === 'step_started') {
           // Step has started - so remove from the invocations queue (only on the first "step_started" event)
           if (!hasSeenStepStarted) {
             // O(1) lookup and delete using Map
-            if (ctx.invocationsQueue.has(correlationId)) {
-              ctx.invocationsQueue.delete(correlationId);
-            } else {
-              setTimeout(() => {
-                reject(
-                  new WorkflowRuntimeError(
-                    `Corrupted event log: step ${correlationId} (${stepName}) started but not found in invocation queue`
-                  )
-                );
-              }, 0);
-              return EventConsumerResult.Finished;
-            }
+            // Note: The step may have already been removed by step_created event processing
+            ctx.invocationsQueue.delete(correlationId);
             hasSeenStepStarted = true;
           }
           // If this is a subsequent "step_started" event (after a retry), we just consume it
@@ -105,7 +107,14 @@ export function createUseStep(ctx: WorkflowOrchestratorContext) {
             // but we will consume the event
             return EventConsumerResult.Consumed;
           }
-        } else if (event.eventType === 'step_completed') {
+        }
+
+        if (event.eventType === 'step_retrying') {
+          // Step is being retried - just consume the event and wait for next step_started
+          return EventConsumerResult.Consumed;
+        }
+
+        if (event.eventType === 'step_completed') {
           // Step has already completed, so resolve the Promise with the cached result
           const hydratedResult = hydrateStepReturnValue(
             event.eventData.result,
@@ -115,17 +124,17 @@ export function createUseStep(ctx: WorkflowOrchestratorContext) {
             resolve(hydratedResult);
           }, 0);
           return EventConsumerResult.Finished;
-        } else {
-          // An unexpected event type has been received, but it does belong to this step (matching `correlationId`)
-          setTimeout(() => {
-            reject(
-              new WorkflowRuntimeError(
-                `Unexpected event type: "${event.eventType}"`
-              )
-            );
-          }, 0);
-          return EventConsumerResult.Finished;
         }
+
+        // An unexpected event type has been received, but it does belong to this step (matching `correlationId`)
+        setTimeout(() => {
+          reject(
+            new WorkflowRuntimeError(
+              `Unexpected event type: "${event.eventType}"`
+            )
+          );
+        }, 0);
+        return EventConsumerResult.Finished;
       });
 
       return promise;
diff --git a/packages/core/src/workflow.test.ts b/packages/core/src/workflow.test.ts
index 6e7b53787..c150c5e88 100644
--- a/packages/core/src/workflow.test.ts
+++ b/packages/core/src/workflow.test.ts
@@ -144,6 +144,7 @@ describe('runWorkflow', () => {
     expect(hydrateWorkflowReturnValue(result as any, ops)).toEqual(3);
   });
 
+  // Test that timestamps update correctly as events are consumed
   it('should update the timestamp in the vm context as events are replayed', async () => {
     const ops: Promise<any>[] = [];
     const workflowRunId = 'wrun_123';
@@ -158,7 +159,27 @@ describe('runWorkflow', () => {
       deploymentId: 'test-deployment',
     };
 
+    // Events now include run_created, run_started, and step_created for proper consumption
     const events: Event[] = [
+      {
+        eventId: 'event-run-created',
+        runId: workflowRunId,
+        eventType: 'run_created',
+        createdAt: new Date('2024-01-01T00:00:00.000Z'),
+      },
+      {
+        eventId: 'event-run-started',
+        runId: workflowRunId,
+        eventType: 'run_started',
+        createdAt: new Date('2024-01-01T00:00:00.500Z'),
+      },
+      {
+        eventId: 'event-step1-created',
+        runId: workflowRunId,
+        eventType: 'step_created',
+        correlationId: 'step_01HK153X00Y11PCQTCHQRK34HF',
+        createdAt: new Date('2024-01-01T00:00:00.600Z'),
+      },
       {
         eventId: 'event-0',
         runId: workflowRunId,
@@ -176,6 +197,13 @@ describe('runWorkflow', () => {
         },
         createdAt: new Date('2024-01-01T00:00:02.000Z'),
       },
+      {
+        eventId: 'event-step2-created',
+        runId: workflowRunId,
+        eventType: 'step_created',
+        correlationId: 'step_01HK153X00Y11PCQTCHQRK34HG',
+        createdAt: new Date('2024-01-01T00:00:02.500Z'),
+      },
       {
         eventId: 'event-2',
         runId: workflowRunId,
@@ -193,6 +221,13 @@ describe('runWorkflow', () => {
         },
         createdAt: new Date('2024-01-01T00:00:04.000Z'),
       },
+      {
+        eventId: 'event-step3-created',
+        runId: workflowRunId,
+        eventType: 'step_created',
+        correlationId: 'step_01HK153X00Y11PCQTCHQRK34HH',
+        createdAt: new Date('2024-01-01T00:00:04.500Z'),
+      },
       {
         eventId: 'event-4',
         runId: workflowRunId,
@@ -228,10 +263,15 @@ describe('runWorkflow', () => {
       workflowRun,
       events
     );
+    // Timestamps:
+    // - Initial: 0s (from startedAt)
+    // - After step 1 completes (at 2s), timestamp advances to step2_created (2.5s)
+    // - After step 2 completes (at 4s), timestamp advances to step3_created (4.5s)
+    // - After step 3 completes: 6s
     expect(hydrateWorkflowReturnValue(result as any, ops)).toEqual([
       new Date('2024-01-01T00:00:00.000Z'),
-      1704067203000,
-      1704067205000,
+      1704067202500, // 2.5s (step2_created timestamp)
+      1704067204500, // 4.5s (step3_created timestamp)
       new Date('2024-01-01T00:00:06.000Z'),
     ]);
   });
diff --git a/packages/core/src/workflow.ts b/packages/core/src/workflow.ts
index 6ecfba7fd..bd466d302 100644
--- a/packages/core/src/workflow.ts
+++ b/packages/core/src/workflow.ts
@@ -90,6 +90,27 @@ export async function runWorkflow(
       return EventConsumerResult.NotConsumed;
     });
 
+    // Consume run lifecycle events - these are structural events that don't
+    // need special handling in the workflow, but must be consumed to advance
+    // past them in the event log
+    workflowContext.eventsConsumer.subscribe((event) => {
+      if (!event) {
+        return EventConsumerResult.NotConsumed;
+      }
+
+      // Consume run_created - every run has exactly one
+      if (event.eventType === 'run_created') {
+        return EventConsumerResult.Consumed;
+      }
+
+      // Consume run_started - every run has exactly one
+      if (event.eventType === 'run_started') {
+        return EventConsumerResult.Consumed;
+      }
+
+      return EventConsumerResult.NotConsumed;
+    });
+
     const useStep = createUseStep(workflowContext);
     const createHook = createCreateHook(workflowContext);
     const sleep = createSleep(workflowContext);
diff --git a/packages/web-shared/src/api/workflow-server-actions.ts b/packages/web-shared/src/api/workflow-server-actions.ts
index ae6814cd1..ae07e86df 100644
--- a/packages/web-shared/src/api/workflow-server-actions.ts
+++ b/packages/web-shared/src/api/workflow-server-actions.ts
@@ -477,10 +477,12 @@ export async function cancelRun(
 ): Promise<ServerActionResult<void>> {
   try {
     const world = getWorldFromEnv(worldEnv);
-    await world.runs.cancel(runId);
+    await world.events.create(runId, { eventType: 'run_cancelled' });
     return createResponse(undefined);
   } catch (error) {
-    return createServerActionError<void>(error, 'world.runs.cancel', { runId });
+    return createServerActionError<void>(error, 'world.events.create', {
+      runId,
+    });
   }
 }
 
diff --git a/packages/web-shared/src/sidebar/attribute-panel.tsx b/packages/web-shared/src/sidebar/attribute-panel.tsx
index b6adc75bd..0a668c1b0 100644
--- a/packages/web-shared/src/sidebar/attribute-panel.tsx
+++ b/packages/web-shared/src/sidebar/attribute-panel.tsx
@@ -304,11 +304,13 @@ const attributeOrder: AttributeKey[] = [
   'executionContext',
   'createdAt',
   'startedAt',
+  'firstStartedAt',
   'updatedAt',
   'completedAt',
   'expiredAt',
   'retryAfter',
   'error',
+  'lastKnownError',
   'metadata',
   'eventData',
   'input',
@@ -382,6 +384,7 @@ const attributeToDisplayFn: Record<
   // TODO: relative time with tooltips for ISO times
   createdAt: localMillisecondTime,
   startedAt: localMillisecondTime,
+  firstStartedAt: localMillisecondTime,
   updatedAt: localMillisecondTime,
   completedAt: localMillisecondTime,
   expiredAt: localMillisecondTime,
@@ -516,6 +519,67 @@ const attributeToDisplayFn: Record<
       </DetailCard>
     );
   },
+  lastKnownError: (value: unknown) => {
+    // Handle structured error format (same as error, but for step's lastKnownError)
+    if (value && typeof value === 'object' && 'message' in value) {
+      const error = value as {
+        message: string;
+        stack?: string;
+        code?: string;
+      };
+
+      return (
+        <DetailCard summary="Last Known Error">
+          <div className="flex flex-col gap-2">
+            {error.code && (
+              <div>
+                <span
+                  className="text-[11px] font-medium"
+                  style={{ color: 'var(--ds-gray-700)' }}
+                >
+                  Error Code:{' '}
+                </span>
+                <code
+                  className="text-[11px]"
+                  style={{ color: 'var(--ds-gray-1000)' }}
+                >
+                  {error.code}
+                </code>
+              </div>
+            )}
+            <pre
+              className="text-[11px] overflow-x-auto rounded-md border p-3"
+              style={{
+                borderColor: 'var(--ds-gray-300)',
+                backgroundColor: 'var(--ds-gray-100)',
+                color: 'var(--ds-gray-1000)',
+                whiteSpace: 'pre-wrap',
+              }}
+            >
+              <code>{error.stack || error.message}</code>
+            </pre>
+          </div>
+        </DetailCard>
+      );
+    }
+
+    // Fallback for plain string errors
+    return (
+      <DetailCard summary="Last Known Error">
+        <pre
+          className="text-[11px] overflow-x-auto rounded-md border p-3"
+          style={{
+            borderColor: 'var(--ds-gray-300)',
+            backgroundColor: 'var(--ds-gray-100)',
+            color: 'var(--ds-gray-1000)',
+            whiteSpace: 'pre-wrap',
+          }}
+        >
+          <code>{String(value)}</code>
+        </pre>
+      </DetailCard>
+    );
+  },
   eventData: (value: unknown) => {
     return <DetailCard summary="Event Data">{JsonBlock(value)}</DetailCard>;
   },
@@ -525,6 +589,7 @@ const resolvableAttributes = [
   'input',
   'output',
   'error',
+  'lastKnownError',
   'metadata',
   'eventData',
 ];
diff --git a/packages/web-shared/src/workflow-traces/trace-span-construction.ts b/packages/web-shared/src/workflow-traces/trace-span-construction.ts
index 53e4e92d1..74bd4719d 100644
--- a/packages/web-shared/src/workflow-traces/trace-span-construction.ts
+++ b/packages/web-shared/src/workflow-traces/trace-span-construction.ts
@@ -145,7 +145,9 @@ export function stepToSpan(
   // Use createdAt as span start time, with activeStartTime for when execution began
   // This allows visualization of the "queued" period before execution
   const spanStartTime = new Date(step.createdAt);
-  let activeStartTime = step.startedAt ? new Date(step.startedAt) : undefined;
+  let activeStartTime = step.firstStartedAt
+    ? new Date(step.firstStartedAt)
+    : undefined;
   const firstStartEvent = stepEvents.find(
     (event) => event.eventType === 'step_started'
   );
diff --git a/packages/web/src/lib/flow-graph/graph-execution-mapper.ts b/packages/web/src/lib/flow-graph/graph-execution-mapper.ts
index 6f0d33e54..4c8255ac2 100644
--- a/packages/web/src/lib/flow-graph/graph-execution-mapper.ts
+++ b/packages/web/src/lib/flow-graph/graph-execution-mapper.ts
@@ -54,9 +54,9 @@ function createStepExecution(
   }
 
   const duration =
-    attemptStep.completedAt && attemptStep.startedAt
+    attemptStep.completedAt && attemptStep.firstStartedAt
       ? new Date(attemptStep.completedAt).getTime() -
-        new Date(attemptStep.startedAt).getTime()
+        new Date(attemptStep.firstStartedAt).getTime()
       : undefined;
 
   return {
@@ -64,8 +64,8 @@ function createStepExecution(
     stepId: attemptStep.stepId,
     attemptNumber: attemptStep.attempt,
     status,
-    startedAt: attemptStep.startedAt
-      ? new Date(attemptStep.startedAt).toISOString()
+    startedAt: attemptStep.firstStartedAt
+      ? new Date(attemptStep.firstStartedAt).toISOString()
       : undefined,
     completedAt: attemptStep.completedAt
       ? new Date(attemptStep.completedAt).toISOString()
@@ -73,10 +73,10 @@ function createStepExecution(
     duration,
     input: attemptStep.input,
     output: attemptStep.output,
-    error: attemptStep.error
+    error: attemptStep.lastKnownError
       ? {
-          message: attemptStep.error.message,
-          stack: attemptStep.error.stack || '',
+          message: attemptStep.lastKnownError.message,
+          stack: attemptStep.lastKnownError.stack || '',
         }
       : undefined,
   };
diff --git a/packages/world-local/src/storage.test.ts b/packages/world-local/src/storage.test.ts
index c74bb9842..fc392d615 100644
--- a/packages/world-local/src/storage.test.ts
+++ b/packages/world-local/src/storage.test.ts
@@ -1,7 +1,7 @@
 import { promises as fs } from 'node:fs';
 import os from 'node:os';
 import path from 'node:path';
-import type { Storage } from '@workflow/world';
+import type { Storage, WorkflowRun, Step, Hook } from '@workflow/world';
 import { monotonicFactory } from 'ulid';
 import {
   EventSchema,
@@ -12,6 +12,111 @@ import {
 import { afterEach, beforeEach, describe, expect, it, vi } from 'vitest';
 import { createStorage } from './storage.js';
 
+// Helper functions to create entities through events.create
+async function createRun(
+  storage: Storage,
+  data: {
+    deploymentId: string;
+    workflowName: string;
+    input: unknown[];
+    executionContext?: Record<string, unknown>;
+  }
+): Promise<WorkflowRun> {
+  const result = await storage.events.create(null, {
+    eventType: 'run_created',
+    eventData: data,
+  });
+  if (!result.run) {
+    throw new Error('Expected run to be created');
+  }
+  return result.run;
+}
+
+async function updateRun(
+  storage: Storage,
+  runId: string,
+  eventType: 'run_started' | 'run_completed' | 'run_failed',
+  eventData?: Record<string, unknown>
+): Promise<WorkflowRun> {
+  const result = await storage.events.create(runId, {
+    eventType,
+    eventData,
+  });
+  if (!result.run) {
+    throw new Error('Expected run to be updated');
+  }
+  return result.run;
+}
+
+async function createStep(
+  storage: Storage,
+  runId: string,
+  data: {
+    stepId: string;
+    stepName: string;
+    input: unknown[];
+  }
+): Promise<Step> {
+  const result = await storage.events.create(runId, {
+    eventType: 'step_created',
+    correlationId: data.stepId,
+    eventData: { stepName: data.stepName, input: data.input },
+  });
+  if (!result.step) {
+    throw new Error('Expected step to be created');
+  }
+  return result.step;
+}
+
+async function updateStep(
+  storage: Storage,
+  runId: string,
+  stepId: string,
+  eventType: 'step_started' | 'step_completed' | 'step_failed',
+  eventData?: Record<string, unknown>
+): Promise<Step> {
+  const result = await storage.events.create(runId, {
+    eventType,
+    correlationId: stepId,
+    eventData,
+  });
+  if (!result.step) {
+    throw new Error('Expected step to be updated');
+  }
+  return result.step;
+}
+
+async function createHook(
+  storage: Storage,
+  runId: string,
+  data: {
+    hookId: string;
+    token: string;
+    metadata?: unknown;
+  }
+): Promise<Hook> {
+  const result = await storage.events.create(runId, {
+    eventType: 'hook_created',
+    correlationId: data.hookId,
+    eventData: { token: data.token, metadata: data.metadata },
+  });
+  if (!result.hook) {
+    throw new Error('Expected hook to be created');
+  }
+  return result.hook;
+}
+
+async function disposeHook(
+  storage: Storage,
+  runId: string,
+  hookId: string
+): Promise<void> {
+  await storage.events.create(runId, {
+    eventType: 'hook_disposed',
+    correlationId: hookId,
+  });
+}
+
 describe('Storage', () => {
   let testDir: string;
   let storage: Storage;
@@ -41,7 +146,7 @@ describe('Storage', () => {
           input: ['arg1', 'arg2'],
         };
 
-        const run = await storage.runs.create(runData);
+        const run = await createRun(storage, runData);
 
         expect(run.runId).toMatch(/^wrun_/);
         expect(run.deploymentId).toBe('deployment-123');
@@ -72,7 +177,7 @@ describe('Storage', () => {
           input: [],
         };
 
-        const run = await storage.runs.create(runData);
+        const run = await createRun(storage, runData);
 
         expect(run.executionContext).toBeUndefined();
         expect(run.input).toEqual([]);
@@ -102,7 +207,7 @@ describe('Storage', () => {
 
     describe('get', () => {
       it('should retrieve an existing run', async () => {
-        const created = await storage.runs.create({
+        const created = await createRun(storage, {
           deploymentId: 'deployment-123',
           workflowName: 'test-workflow',
           input: [],
@@ -120,9 +225,9 @@ describe('Storage', () => {
       });
     });
 
-    describe('update', () => {
-      it('should update run status to running', async () => {
-        const created = await storage.runs.create({
+    describe('update via events', () => {
+      it('should update run status to running via run_started event', async () => {
+        const created = await createRun(storage, {
           deploymentId: 'deployment-123',
           workflowName: 'test-workflow',
           input: [],
@@ -131,9 +236,7 @@ describe('Storage', () => {
         // Small delay to ensure different timestamps
         await new Promise((resolve) => setTimeout(resolve, 1));
 
-        const updated = await storage.runs.update(created.runId, {
-          status: 'running',
-        });
+        const updated = await updateRun(storage, created.runId, 'run_started');
 
         expect(updated.status).toBe('running');
         expect(updated.startedAt).toBeInstanceOf(Date);
@@ -142,56 +245,47 @@ describe('Storage', () => {
         );
       });
 
-      it('should update run status to completed', async () => {
-        const created = await storage.runs.create({
+      it('should update run status to completed via run_completed event', async () => {
+        const created = await createRun(storage, {
           deploymentId: 'deployment-123',
           workflowName: 'test-workflow',
           input: [],
         });
 
-        const updated = await storage.runs.update(created.runId, {
-          status: 'completed',
-          output: { result: 'success' },
-        });
+        const updated = await updateRun(
+          storage,
+          created.runId,
+          'run_completed',
+          {
+            output: { result: 'success' },
+          }
+        );
 
         expect(updated.status).toBe('completed');
         expect(updated.output).toEqual({ result: 'success' });
         expect(updated.completedAt).toBeInstanceOf(Date);
       });
 
-      it('should update run status to failed', async () => {
-        const created = await storage.runs.create({
+      it('should update run status to failed via run_failed event', async () => {
+        const created = await createRun(storage, {
           deploymentId: 'deployment-123',
           workflowName: 'test-workflow',
           input: [],
         });
 
-        const updated = await storage.runs.update(created.runId, {
-          status: 'failed',
-          error: {
-            message: 'Something went wrong',
-            code: 'ERR_001',
-          },
+        const updated = await updateRun(storage, created.runId, 'run_failed', {
+          error: 'Something went wrong',
         });
 
         expect(updated.status).toBe('failed');
-        expect(updated.error).toEqual({
-          message: 'Something went wrong',
-          code: 'ERR_001',
-        });
+        expect(updated.error?.message).toBe('Something went wrong');
         expect(updated.completedAt).toBeInstanceOf(Date);
       });
-
-      it('should throw error for non-existent run', async () => {
-        await expect(
-          storage.runs.update('wrun_nonexistent', { status: 'running' })
-        ).rejects.toThrow('Workflow run "wrun_nonexistent" not found');
-      });
     });
 
     describe('list', () => {
       it('should list all runs', async () => {
-        const run1 = await storage.runs.create({
+        const run1 = await createRun(storage, {
           deploymentId: 'deployment-1',
           workflowName: 'workflow-1',
           input: [],
@@ -200,7 +294,7 @@ describe('Storage', () => {
         // Small delay to ensure different timestamps in ULIDs
         await new Promise((resolve) => setTimeout(resolve, 2));
 
-        const run2 = await storage.runs.create({
+        const run2 = await createRun(storage, {
           deploymentId: 'deployment-2',
           workflowName: 'workflow-2',
           input: [],
@@ -218,12 +312,12 @@ describe('Storage', () => {
       });
 
       it('should filter runs by workflowName', async () => {
-        await storage.runs.create({
+        await createRun(storage, {
           deploymentId: 'deployment-1',
           workflowName: 'workflow-1',
           input: [],
         });
-        const run2 = await storage.runs.create({
+        const run2 = await createRun(storage, {
           deploymentId: 'deployment-2',
           workflowName: 'workflow-2',
           input: [],
@@ -238,7 +332,7 @@ describe('Storage', () => {
       it('should support pagination', async () => {
         // Create multiple runs
         for (let i = 0; i < 5; i++) {
-          await storage.runs.create({
+          await createRun(storage, {
             deploymentId: `deployment-${i}`,
             workflowName: `workflow-${i}`,
             input: [],
@@ -260,58 +354,13 @@ describe('Storage', () => {
         expect(page2.data[0].runId).not.toBe(page1.data[0].runId);
       });
     });
-
-    describe('cancel', () => {
-      it('should cancel a run', async () => {
-        const created = await storage.runs.create({
-          deploymentId: 'deployment-123',
-          workflowName: 'test-workflow',
-          input: [],
-        });
-
-        const cancelled = await storage.runs.cancel(created.runId);
-
-        expect(cancelled.status).toBe('cancelled');
-        expect(cancelled.completedAt).toBeInstanceOf(Date);
-      });
-    });
-
-    describe('pause', () => {
-      it('should pause a run', async () => {
-        const created = await storage.runs.create({
-          deploymentId: 'deployment-123',
-          workflowName: 'test-workflow',
-          input: [],
-        });
-
-        const paused = await storage.runs.pause(created.runId);
-
-        expect(paused.status).toBe('paused');
-      });
-    });
-
-    describe('resume', () => {
-      it('should resume a paused run', async () => {
-        const created = await storage.runs.create({
-          deploymentId: 'deployment-123',
-          workflowName: 'test-workflow',
-          input: [],
-        });
-
-        await storage.runs.pause(created.runId);
-        const resumed = await storage.runs.resume(created.runId);
-
-        expect(resumed.status).toBe('running');
-        expect(resumed.startedAt).toBeInstanceOf(Date);
-      });
-    });
   });
 
   describe('steps', () => {
     let testRunId: string;
 
     beforeEach(async () => {
-      const run = await storage.runs.create({
+      const run = await createRun(storage, {
         deploymentId: 'deployment-123',
         workflowName: 'test-workflow',
         input: [],
@@ -327,7 +376,7 @@ describe('Storage', () => {
           input: ['input1', 'input2'],
         };
 
-        const step = await storage.steps.create(testRunId, stepData);
+        const step = await createStep(storage, testRunId, stepData);
 
         expect(step.runId).toBe(testRunId);
         expect(step.stepId).toBe('step_123');
@@ -335,9 +384,9 @@ describe('Storage', () => {
         expect(step.status).toBe('pending');
         expect(step.input).toEqual(['input1', 'input2']);
         expect(step.output).toBeUndefined();
-        expect(step.error).toBeUndefined();
+        expect(step.lastKnownError).toBeUndefined();
         expect(step.attempt).toBe(0);
-        expect(step.startedAt).toBeUndefined();
+        expect(step.firstStartedAt).toBeUndefined();
         expect(step.completedAt).toBeUndefined();
         expect(step.createdAt).toBeInstanceOf(Date);
         expect(step.updatedAt).toBeInstanceOf(Date);
@@ -380,7 +429,7 @@ describe('Storage', () => {
 
     describe('get', () => {
       it('should retrieve a step with runId and stepId', async () => {
-        const created = await storage.steps.create(testRunId, {
+        const created = await createStep(storage, testRunId, {
           stepId: 'step_123',
           stepName: 'test-step',
           input: ['input1'],
@@ -392,7 +441,7 @@ describe('Storage', () => {
       });
 
       it('should retrieve a step with only stepId', async () => {
-        const created = await storage.steps.create(testRunId, {
+        const created = await createStep(storage, testRunId, {
           stepId: 'unique_step_123',
           stepName: 'test-step',
           input: ['input1'],
@@ -410,83 +459,76 @@ describe('Storage', () => {
       });
     });
 
-    describe('update', () => {
-      it('should update step status to running', async () => {
-        await storage.steps.create(testRunId, {
+    describe('update via events', () => {
+      it('should update step status to running via step_started event', async () => {
+        await createStep(storage, testRunId, {
           stepId: 'step_123',
           stepName: 'test-step',
           input: ['input1'],
         });
 
-        const updated = await storage.steps.update(testRunId, 'step_123', {
-          status: 'running',
-        });
+        const updated = await updateStep(
+          storage,
+          testRunId,
+          'step_123',
+          'step_started',
+          {} // step_started no longer needs attempt in eventData - World increments it
+        );
 
         expect(updated.status).toBe('running');
-        expect(updated.startedAt).toBeInstanceOf(Date);
+        expect(updated.firstStartedAt).toBeInstanceOf(Date);
+        expect(updated.attempt).toBe(1); // Incremented by step_started
       });
 
-      it('should update step status to completed', async () => {
-        await storage.steps.create(testRunId, {
+      it('should update step status to completed via step_completed event', async () => {
+        await createStep(storage, testRunId, {
           stepId: 'step_123',
           stepName: 'test-step',
           input: ['input1'],
         });
 
-        const updated = await storage.steps.update(testRunId, 'step_123', {
-          status: 'completed',
-          output: { result: 'done' },
-        });
+        const updated = await updateStep(
+          storage,
+          testRunId,
+          'step_123',
+          'step_completed',
+          { result: { result: 'done' } }
+        );
 
         expect(updated.status).toBe('completed');
         expect(updated.output).toEqual({ result: 'done' });
         expect(updated.completedAt).toBeInstanceOf(Date);
       });
 
-      it('should update step status to failed', async () => {
-        await storage.steps.create(testRunId, {
+      it('should update step status to failed via step_failed event', async () => {
+        await createStep(storage, testRunId, {
           stepId: 'step_123',
           stepName: 'test-step',
           input: ['input1'],
         });
 
-        const updated = await storage.steps.update(testRunId, 'step_123', {
-          status: 'failed',
-          error: {
-            message: 'Step failed',
-            code: 'STEP_ERR',
-          },
-        });
+        const updated = await updateStep(
+          storage,
+          testRunId,
+          'step_123',
+          'step_failed',
+          { error: 'Step failed', fatal: true }
+        );
 
         expect(updated.status).toBe('failed');
-        expect(updated.error?.message).toBe('Step failed');
-        expect(updated.error?.code).toBe('STEP_ERR');
+        expect(updated.lastKnownError?.message).toBe('Step failed');
         expect(updated.completedAt).toBeInstanceOf(Date);
       });
-
-      it('should update attempt count', async () => {
-        await storage.steps.create(testRunId, {
-          stepId: 'step_123',
-          stepName: 'test-step',
-          input: ['input1'],
-        });
-
-        const updated = await storage.steps.update(testRunId, 'step_123', {
-          attempt: 2,
-        });
-
-        expect(updated.attempt).toBe(2);
-      });
     });
 
     describe('list', () => {
       it('should list all steps for a run', async () => {
-        const step1 = await storage.steps.create(testRunId, {
+        const step1 = await createStep(storage, testRunId, {
           stepId: 'step_1',
           stepName: 'first-step',
           input: [],
         });
-        const step2 = await storage.steps.create(testRunId, {
+        const step2 = await createStep(storage, testRunId, {
           stepId: 'step_2',
           stepName: 'second-step',
           input: [],
@@ -508,7 +550,7 @@ describe('Storage', () => {
       it('should support pagination', async () => {
         // Create multiple steps
         for (let i = 0; i < 5; i++) {
-          await storage.steps.create(testRunId, {
+          await createStep(storage, testRunId, {
             stepId: `step_${i}`,
             stepName: `step-${i}`,
             input: [],
@@ -535,7 +577,7 @@ describe('Storage', () => {
       it('should handle pagination when new items are created after getting a cursor', async () => {
         // Create initial set of items (4 items)
         for (let i = 0; i < 4; i++) {
-          await storage.steps.create(testRunId, {
+          await createStep(storage, testRunId, {
             stepId: `step_${i}`,
             stepName: `step-${i}`,
             input: [],
@@ -555,7 +597,7 @@ describe('Storage', () => {
 
         // Now create 4 more items (total: 8 items)
         for (let i = 4; i < 8; i++) {
-          await storage.steps.create(testRunId, {
+          await createStep(storage, testRunId, {
             stepId: `step_${i}`,
             stepName: `step-${i}`,
             input: [],
@@ -595,7 +637,7 @@ describe('Storage', () => {
       it('should handle pagination with cursor after items are added mid-pagination', async () => {
         // Create initial 4 items
         for (let i = 0; i < 4; i++) {
-          await storage.steps.create(testRunId, {
+          await createStep(storage, testRunId, {
             stepId: `step_${i}`,
             stepName: `step-${i}`,
             input: [],
@@ -627,7 +669,7 @@ describe('Storage', () => {
 
         // Now add 4 more items (total: 8)
         for (let i = 4; i < 8; i++) {
-          await storage.steps.create(testRunId, {
+          await createStep(storage, testRunId, {
             stepId: `step_${i}`,
             stepName: `step-${i}`,
             input: [],
@@ -668,7 +710,7 @@ describe('Storage', () => {
 
         // Start with X items (4 items)
         for (let i = 0; i < 4; i++) {
-          await storage.steps.create(testRunId, {
+          await createStep(storage, testRunId, {
             stepId: `step_${i}`,
             stepName: `step-${i}`,
             input: [],
@@ -690,7 +732,7 @@ describe('Storage', () => {
 
         // Create new items (total becomes 2X = 8 items)
         for (let i = 4; i < 8; i++) {
-          await storage.steps.create(testRunId, {
+          await createStep(storage, testRunId, {
             stepId: `step_${i}`,
             stepName: `step-${i}`,
             input: [],
@@ -742,7 +784,7 @@ describe('Storage', () => {
     let testRunId: string;
 
     beforeEach(async () => {
-      const run = await storage.runs.create({
+      const run = await createRun(storage, {
         deploymentId: 'deployment-123',
         workflowName: 'test-workflow',
         input: [],
@@ -757,7 +799,7 @@ describe('Storage', () => {
           correlationId: 'corr_123',
         };
 
-        const event = await storage.events.create(testRunId, eventData);
+        const { event } = await storage.events.create(testRunId, eventData);
 
         expect(event.runId).toBe(testRunId);
         expect(event.eventId).toMatch(/^evnt_/);
@@ -783,7 +825,7 @@ describe('Storage', () => {
           eventType: 'workflow_completed' as const,
         };
 
-        const event = await storage.events.create(testRunId, eventData);
+        const { event } = await storage.events.create(testRunId, eventData);
 
         expect(event.eventType).toBe('workflow_completed');
         expect(event.correlationId).toBeUndefined();
@@ -812,14 +854,15 @@ describe('Storage', () => {
 
     describe('list', () => {
       it('should list all events for a run', async () => {
-        const event1 = await storage.events.create(testRunId, {
+        // Note: testRunId was created via createRun which creates a run_created event
+        const { event: event1 } = await storage.events.create(testRunId, {
           eventType: 'workflow_started' as const,
         });
 
         // Small delay to ensure different timestamps in event IDs
         await new Promise((resolve) => setTimeout(resolve, 2));
 
-        const event2 = await storage.events.create(testRunId, {
+        const { event: event2 } = await storage.events.create(testRunId, {
           eventType: 'step_started' as const,
           correlationId: 'corr_step_1',
         });
@@ -829,24 +872,27 @@ describe('Storage', () => {
           pagination: { sortOrder: 'asc' }, // Explicitly request ascending order
         });
 
-        expect(result.data).toHaveLength(2);
+        // 3 events: run_created (from createRun), workflow_started, step_started
+        expect(result.data).toHaveLength(3);
         // Should be in chronological order (oldest first)
-        expect(result.data[0].eventId).toBe(event1.eventId);
-        expect(result.data[1].eventId).toBe(event2.eventId);
-        expect(result.data[1].createdAt.getTime()).toBeGreaterThanOrEqual(
-          result.data[0].createdAt.getTime()
+        expect(result.data[0].eventType).toBe('run_created');
+        expect(result.data[1].eventId).toBe(event1.eventId);
+        expect(result.data[2].eventId).toBe(event2.eventId);
+        expect(result.data[2].createdAt.getTime()).toBeGreaterThanOrEqual(
+          result.data[1].createdAt.getTime()
         );
       });
 
       it('should list events in descending order when explicitly requested (newest first)', async () => {
-        const event1 = await storage.events.create(testRunId, {
+        // Note: testRunId was created via createRun which creates a run_created event
+        const { event: event1 } = await storage.events.create(testRunId, {
           eventType: 'workflow_started' as const,
         });
 
         // Small delay to ensure different timestamps in event IDs
         await new Promise((resolve) => setTimeout(resolve, 2));
 
-        const event2 = await storage.events.create(testRunId, {
+        const { event: event2 } = await storage.events.create(testRunId, {
           eventType: 'step_started' as const,
           correlationId: 'corr_step_1',
         });
@@ -856,10 +902,12 @@ describe('Storage', () => {
           pagination: { sortOrder: 'desc' },
         });
 
-        expect(result.data).toHaveLength(2);
+        // 3 events: run_created (from createRun), workflow_started, step_started
+        expect(result.data).toHaveLength(3);
         // Should be in reverse chronological order (newest first)
         expect(result.data[0].eventId).toBe(event2.eventId);
         expect(result.data[1].eventId).toBe(event1.eventId);
+        expect(result.data[2].eventType).toBe('run_created');
         expect(result.data[0].createdAt.getTime()).toBeGreaterThanOrEqual(
           result.data[1].createdAt.getTime()
         );
@@ -898,14 +946,14 @@ describe('Storage', () => {
         const correlationId = 'step-abc123';
 
         // Create events with the target correlation ID
-        const event1 = await storage.events.create(testRunId, {
+        const { event: event1 } = await storage.events.create(testRunId, {
           eventType: 'step_started' as const,
           correlationId,
         });
 
         await new Promise((resolve) => setTimeout(resolve, 2));
 
-        const event2 = await storage.events.create(testRunId, {
+        const { event: event2 } = await storage.events.create(testRunId, {
           eventType: 'step_completed' as const,
           correlationId,
           eventData: { result: 'success' },
@@ -936,21 +984,22 @@ describe('Storage', () => {
         const correlationId = 'hook-xyz789';
 
         // Create another run
-        const run2 = await storage.runs.create({
+        const run2 = await createRun(storage, {
           deploymentId: 'deployment-456',
           workflowName: 'test-workflow-2',
           input: [],
         });
 
         // Create events in both runs with same correlation ID
-        const event1 = await storage.events.create(testRunId, {
+        const { event: event1 } = await storage.events.create(testRunId, {
           eventType: 'hook_created' as const,
           correlationId,
+          eventData: { token: `test-token-${correlationId}`, metadata: {} },
         });
 
         await new Promise((resolve) => setTimeout(resolve, 2));
 
-        const event2 = await storage.events.create(run2.runId, {
+        const { event: event2 } = await storage.events.create(run2.runId, {
           eventType: 'hook_received' as const,
           correlationId,
           eventData: { payload: { data: 'test' } },
@@ -958,7 +1007,7 @@ describe('Storage', () => {
 
         await new Promise((resolve) => setTimeout(resolve, 2));
 
-        const event3 = await storage.events.create(testRunId, {
+        const { event: event3 } = await storage.events.create(testRunId, {
           eventType: 'hook_disposed' as const,
           correlationId,
         });
@@ -1062,14 +1111,14 @@ describe('Storage', () => {
         const correlationId = 'step-ordering';
 
         // Create events with slight delays to ensure different timestamps
-        const event1 = await storage.events.create(testRunId, {
+        const { event: event1 } = await storage.events.create(testRunId, {
           eventType: 'step_started' as const,
           correlationId,
         });
 
         await new Promise((resolve) => setTimeout(resolve, 2));
 
-        const event2 = await storage.events.create(testRunId, {
+        const { event: event2 } = await storage.events.create(testRunId, {
           eventType: 'step_completed' as const,
           correlationId,
           eventData: { result: 'success' },
@@ -1091,14 +1140,14 @@ describe('Storage', () => {
       it('should support descending order', async () => {
         const correlationId = 'step-desc-order';
 
-        const event1 = await storage.events.create(testRunId, {
+        const { event: event1 } = await storage.events.create(testRunId, {
           eventType: 'step_started' as const,
           correlationId,
         });
 
         await new Promise((resolve) => setTimeout(resolve, 2));
 
-        const event2 = await storage.events.create(testRunId, {
+        const { event: event2 } = await storage.events.create(testRunId, {
           eventType: 'step_completed' as const,
           correlationId,
           eventData: { result: 'success' },
@@ -1121,14 +1170,15 @@ describe('Storage', () => {
         const hookId = 'hook_test123';
 
         // Create a typical hook lifecycle
-        const created = await storage.events.create(testRunId, {
+        const { event: created } = await storage.events.create(testRunId, {
           eventType: 'hook_created' as const,
           correlationId: hookId,
+          eventData: { token: `test-token-${hookId}`, metadata: {} },
         });
 
         await new Promise((resolve) => setTimeout(resolve, 2));
 
-        const received1 = await storage.events.create(testRunId, {
+        const { event: received1 } = await storage.events.create(testRunId, {
           eventType: 'hook_received' as const,
           correlationId: hookId,
           eventData: { payload: { request: 1 } },
@@ -1136,7 +1186,7 @@ describe('Storage', () => {
 
         await new Promise((resolve) => setTimeout(resolve, 2));
 
-        const received2 = await storage.events.create(testRunId, {
+        const { event: received2 } = await storage.events.create(testRunId, {
           eventType: 'hook_received' as const,
           correlationId: hookId,
           eventData: { payload: { request: 2 } },
@@ -1144,7 +1194,7 @@ describe('Storage', () => {
 
         await new Promise((resolve) => setTimeout(resolve, 2));
 
-        const disposed = await storage.events.create(testRunId, {
+        const { event: disposed } = await storage.events.create(testRunId, {
           eventType: 'hook_disposed' as const,
           correlationId: hookId,
         });
@@ -1171,7 +1221,7 @@ describe('Storage', () => {
     let testRunId: string;
 
     beforeEach(async () => {
-      const run = await storage.runs.create({
+      const run = await createRun(storage, {
         deploymentId: 'deployment-123',
         workflowName: 'test-workflow',
         input: [],
@@ -1186,14 +1236,11 @@ describe('Storage', () => {
           token: 'my-hook-token',
         };
 
-        const hook = await storage.hooks.create(testRunId, hookData);
+        const hook = await createHook(storage, testRunId, hookData);
 
         expect(hook.runId).toBe(testRunId);
         expect(hook.hookId).toBe('hook_123');
         expect(hook.token).toBe('my-hook-token');
-        expect(hook.ownerId).toBe('local-owner');
-        expect(hook.projectId).toBe('local-project');
-        expect(hook.environment).toBe('local');
         expect(hook.createdAt).toBeInstanceOf(Date);
 
         // Verify file was created
@@ -1212,7 +1259,7 @@ describe('Storage', () => {
           token: 'duplicate-test-token',
         };
 
-        await storage.hooks.create(testRunId, hookData);
+        await createHook(storage, testRunId, hookData);
 
         // Try to create another hook with the same token
         const duplicateHookData = {
@@ -1221,19 +1268,19 @@ describe('Storage', () => {
         };
 
         await expect(
-          storage.hooks.create(testRunId, duplicateHookData)
+          createHook(storage, testRunId, duplicateHookData)
         ).rejects.toThrow(
           'Hook with token duplicate-test-token already exists for this project'
         );
       });
 
       it('should allow multiple hooks with different tokens for the same run', async () => {
-        const hook1 = await storage.hooks.create(testRunId, {
+        const hook1 = await createHook(storage, testRunId, {
           hookId: 'hook_1',
           token: 'token-1',
         });
 
-        const hook2 = await storage.hooks.create(testRunId, {
+        const hook2 = await createHook(storage, testRunId, {
           hookId: 'hook_2',
           token: 'token-2',
         });
@@ -1246,7 +1293,7 @@ describe('Storage', () => {
         const token = 'reusable-token';
 
         // Create first hook
-        const hook1 = await storage.hooks.create(testRunId, {
+        const hook1 = await createHook(storage, testRunId, {
           hookId: 'hook_1',
           token,
         });
@@ -1255,7 +1302,7 @@ describe('Storage', () => {
 
         // Try to create another hook with the same token - should fail
         await expect(
-          storage.hooks.create(testRunId, {
+          createHook(storage, testRunId, {
             hookId: 'hook_2',
             token,
           })
@@ -1263,11 +1310,11 @@ describe('Storage', () => {
           `Hook with token ${token} already exists for this project`
         );
 
-        // Dispose the first hook
-        await storage.hooks.dispose('hook_1');
+        // Dispose the first hook via hook_disposed event
+        await disposeHook(storage, testRunId, 'hook_1');
 
         // Now we should be able to create a new hook with the same token
-        const hook2 = await storage.hooks.create(testRunId, {
+        const hook2 = await createHook(storage, testRunId, {
           hookId: 'hook_2',
           token,
         });
@@ -1278,7 +1325,7 @@ describe('Storage', () => {
 
       it('should enforce token uniqueness across different runs within the same project', async () => {
         // Create a second run
-        const run2 = await storage.runs.create({
+        const run2 = await createRun(storage, {
           deploymentId: 'deployment-456',
           workflowName: 'another-workflow',
           input: [],
@@ -1287,7 +1334,7 @@ describe('Storage', () => {
         const token = 'shared-token-across-runs';
 
         // Create hook in first run
-        const hook1 = await storage.hooks.create(testRunId, {
+        const hook1 = await createHook(storage, testRunId, {
           hookId: 'hook_1',
           token,
         });
@@ -1296,7 +1343,7 @@ describe('Storage', () => {
 
         // Try to create hook with same token in second run - should fail
         await expect(
-          storage.hooks.create(run2.runId, {
+          createHook(storage, run2.runId, {
             hookId: 'hook_2',
             token,
           })
@@ -1328,7 +1375,7 @@ describe('Storage', () => {
 
     describe('get', () => {
       it('should retrieve an existing hook by hookId', async () => {
-        const created = await storage.hooks.create(testRunId, {
+        const created = await createHook(storage, testRunId, {
           hookId: 'hook_123',
           token: 'test-token-123',
         });
@@ -1345,7 +1392,7 @@ describe('Storage', () => {
       });
 
       it('should respect resolveData option', async () => {
-        const created = await storage.hooks.create(testRunId, {
+        const created = await createHook(storage, testRunId, {
           hookId: 'hook_with_response',
           token: 'test-token',
         });
@@ -1367,7 +1414,7 @@ describe('Storage', () => {
 
     describe('getByToken', () => {
       it('should retrieve an existing hook by token', async () => {
-        const created = await storage.hooks.create(testRunId, {
+        const created = await createHook(storage, testRunId, {
           hookId: 'hook_123',
           token: 'test-token-123',
         });
@@ -1384,15 +1431,15 @@ describe('Storage', () => {
       });
 
       it('should find the correct hook when multiple hooks exist', async () => {
-        const hook1 = await storage.hooks.create(testRunId, {
+        const hook1 = await createHook(storage, testRunId, {
           hookId: 'hook_1',
           token: 'token-1',
         });
-        await storage.hooks.create(testRunId, {
+        await createHook(storage, testRunId, {
           hookId: 'hook_2',
           token: 'token-2',
         });
-        await storage.hooks.create(testRunId, {
+        await createHook(storage, testRunId, {
           hookId: 'hook_3',
           token: 'token-3',
         });
@@ -1406,7 +1453,7 @@ describe('Storage', () => {
 
     describe('list', () => {
       it('should list all hooks', async () => {
-        const hook1 = await storage.hooks.create(testRunId, {
+        const hook1 = await createHook(storage, testRunId, {
           hookId: 'hook_1',
           token: 'token-1',
         });
@@ -1414,7 +1461,7 @@ describe('Storage', () => {
         // Small delay to ensure different timestamps
         await new Promise((resolve) => setTimeout(resolve, 2));
 
-        const hook2 = await storage.hooks.create(testRunId, {
+        const hook2 = await createHook(storage, testRunId, {
           hookId: 'hook_2',
           token: 'token-2',
         });
@@ -1432,17 +1479,17 @@ describe('Storage', () => {
 
       it('should filter hooks by runId', async () => {
         // Create a second run
-        const run2 = await storage.runs.create({
+        const run2 = await createRun(storage, {
           deploymentId: 'deployment-456',
           workflowName: 'test-workflow-2',
           input: [],
         });
 
-        await storage.hooks.create(testRunId, {
+        await createHook(storage, testRunId, {
           hookId: 'hook_run1',
           token: 'token-run1',
         });
-        const hook2 = await storage.hooks.create(run2.runId, {
+        const hook2 = await createHook(storage, run2.runId, {
           hookId: 'hook_run2',
           token: 'token-run2',
         });
@@ -1457,7 +1504,7 @@ describe('Storage', () => {
       it('should support pagination', async () => {
         // Create multiple hooks
         for (let i = 0; i < 5; i++) {
-          await storage.hooks.create(testRunId, {
+          await createHook(storage, testRunId, {
             hookId: `hook_${i}`,
             token: `token-${i}`,
           });
@@ -1480,14 +1527,14 @@ describe('Storage', () => {
       });
 
       it('should support ascending sort order', async () => {
-        const hook1 = await storage.hooks.create(testRunId, {
+        const hook1 = await createHook(storage, testRunId, {
           hookId: 'hook_1',
           token: 'token-1',
         });
 
         await new Promise((resolve) => setTimeout(resolve, 2));
 
-        const hook2 = await storage.hooks.create(testRunId, {
+        const hook2 = await createHook(storage, testRunId, {
           hookId: 'hook_2',
           token: 'token-2',
         });
@@ -1503,7 +1550,7 @@ describe('Storage', () => {
       });
 
       it('should respect resolveData option', async () => {
-        await storage.hooks.create(testRunId, {
+        await createHook(storage, testRunId, {
           hookId: 'hook_with_response',
           token: 'token-with-response',
         });
@@ -1531,29 +1578,5 @@ describe('Storage', () => {
         expect(result.hasMore).toBe(false);
       });
     });
-
-    describe('dispose', () => {
-      it('should delete an existing hook', async () => {
-        const created = await storage.hooks.create(testRunId, {
-          hookId: 'hook_to_delete',
-          token: 'token-to-delete',
-        });
-
-        const disposed = await storage.hooks.dispose('hook_to_delete');
-
-        expect(disposed).toEqual(created);
-
-        // Verify file was deleted
-        await expect(
-          storage.hooks.getByToken('token-to-delete')
-        ).rejects.toThrow('Hook with token token-to-delete not found');
-      });
-
-      it('should throw error for non-existent hook', async () => {
-        await expect(storage.hooks.dispose('hook_nonexistent')).rejects.toThrow(
-          'Hook hook_nonexistent not found'
-        );
-      });
-    });
   });
 });
diff --git a/packages/world-local/src/storage.ts b/packages/world-local/src/storage.ts
index 46485e7d8..0ad585dfb 100644
--- a/packages/world-local/src/storage.ts
+++ b/packages/world-local/src/storage.ts
@@ -1,8 +1,8 @@
 import path from 'node:path';
 import { WorkflowRunNotFoundError } from '@workflow/errors';
 import {
-  type CreateHookRequest,
   type Event,
+  type EventResult,
   EventSchema,
   type GetHookParams,
   type Hook,
@@ -102,7 +102,7 @@ const getObjectCreatedAt =
  * Implements the Storage['hooks'] interface with hook CRUD operations.
  */
 function createHooksStorage(basedir: string): Storage['hooks'] {
-  // Helper function to find a hook by token (shared between create and getByToken)
+  // Helper function to find a hook by token (shared between getByToken)
   async function findHookByToken(token: string): Promise<Hook | null> {
     const hooksDir = path.join(basedir, 'hooks');
     const files = await listJSONFiles(hooksDir);
@@ -118,35 +118,6 @@ function createHooksStorage(basedir: string): Storage['hooks'] {
     return null;
   }
 
-  async function create(runId: string, data: CreateHookRequest): Promise<Hook> {
-    // Check if a hook with the same token already exists
-    // Token uniqueness is enforced globally per local environment
-    const existingHook = await findHookByToken(data.token);
-    if (existingHook) {
-      throw new Error(
-        `Hook with token ${data.token} already exists for this project`
-      );
-    }
-
-    const now = new Date();
-
-    const result = {
-      runId,
-      hookId: data.hookId,
-      token: data.token,
-      metadata: data.metadata,
-      ownerId: 'local-owner',
-      projectId: 'local-project',
-      environment: 'local',
-      createdAt: now,
-    } as Hook;
-
-    const hookPath = path.join(basedir, 'hooks', `${data.hookId}.json`);
-    HookSchema.parse(result);
-    await writeJSON(hookPath, result);
-    return result;
-  }
-
   async function get(hookId: string, params?: GetHookParams): Promise<Hook> {
     const hookPath = path.join(basedir, 'hooks', `${hookId}.json`);
     const hook = await readJSON(hookPath, HookSchema);
@@ -202,17 +173,7 @@ function createHooksStorage(basedir: string): Storage['hooks'] {
     };
   }
 
-  async function dispose(hookId: string): Promise<Hook> {
-    const hookPath = path.join(basedir, 'hooks', `${hookId}.json`);
-    const hook = await readJSON(hookPath, HookSchema);
-    if (!hook) {
-      throw new Error(`Hook ${hookId} not found`);
-    }
-    await deleteJSON(hookPath);
-    return hook;
-  }
-
-  return { create, get, getByToken, list, dispose };
+  return { get, getByToken, list };
 }
 
 /**
@@ -237,33 +198,6 @@ async function deleteAllHooksForRun(
 export function createStorage(basedir: string): Storage {
   return {
     runs: {
-      async create(data) {
-        const runId = `wrun_${monotonicUlid()}`;
-        const now = new Date();
-
-        const result: WorkflowRun = {
-          runId,
-          deploymentId: data.deploymentId,
-          status: 'pending',
-          workflowName: data.workflowName,
-          executionContext: data.executionContext as
-            | Record<string, any>
-            | undefined,
-          input: (data.input as any[]) || [],
-          output: undefined,
-          error: undefined,
-          startedAt: undefined,
-          completedAt: undefined,
-          createdAt: now,
-          updatedAt: now,
-        };
-
-        const runPath = path.join(basedir, 'runs', `${runId}.json`);
-        WorkflowRunSchema.parse(result);
-        await writeJSON(runPath, result);
-        return result;
-      },
-
       async get(id, params) {
         const runPath = path.join(basedir, 'runs', `${id}.json`);
         const run = await readJSON(runPath, WorkflowRunSchema);
@@ -274,54 +208,6 @@ export function createStorage(basedir: string): Storage {
         return filterRunData(run, resolveData);
       },
 
-      /**
-       * Updates a workflow run.
-       *
-       * Note: This operation is not atomic. Concurrent updates from multiple
-       * processes may result in lost updates (last writer wins). This is an
-       * inherent limitation of filesystem-based storage without locking.
-       * For the local world, this is acceptable as it's typically
-       * used in single-process scenarios.
-       */
-      async update(id, data) {
-        const runPath = path.join(basedir, 'runs', `${id}.json`);
-        const run = await readJSON(runPath, WorkflowRunSchema);
-        if (!run) {
-          throw new WorkflowRunNotFoundError(id);
-        }
-
-        const now = new Date();
-        const updatedRun = {
-          ...run,
-          ...data,
-          updatedAt: now,
-        } as WorkflowRun;
-
-        // Only set startedAt the first time the run transitions to 'running'
-        if (data.status === 'running' && !updatedRun.startedAt) {
-          updatedRun.startedAt = now;
-        }
-
-        const isBecomingTerminal =
-          data.status === 'completed' ||
-          data.status === 'failed' ||
-          data.status === 'cancelled';
-
-        if (isBecomingTerminal) {
-          updatedRun.completedAt = now;
-        }
-
-        WorkflowRunSchema.parse(updatedRun);
-        await writeJSON(runPath, updatedRun, { overwrite: true });
-
-        // If transitioning to a terminal status, clean up all hooks for this run
-        if (isBecomingTerminal) {
-          await deleteAllHooksForRun(basedir, id);
-        }
-
-        return updatedRun;
-      },
-
       async list(params) {
         const resolveData = params?.resolveData ?? DEFAULT_RESOLVE_DATA_OPTION;
         const result = await paginatedFileSystemQuery({
@@ -360,54 +246,9 @@ export function createStorage(basedir: string): Storage {
 
         return result;
       },
-
-      async cancel(id, params) {
-        // This will call update which triggers hook cleanup automatically
-        const run = await this.update(id, { status: 'cancelled' });
-        const resolveData = params?.resolveData ?? DEFAULT_RESOLVE_DATA_OPTION;
-        return filterRunData(run, resolveData);
-      },
-
-      async pause(id, params) {
-        const run = await this.update(id, { status: 'paused' });
-        const resolveData = params?.resolveData ?? DEFAULT_RESOLVE_DATA_OPTION;
-        return filterRunData(run, resolveData);
-      },
-
-      async resume(id, params) {
-        const run = await this.update(id, { status: 'running' });
-        const resolveData = params?.resolveData ?? DEFAULT_RESOLVE_DATA_OPTION;
-        return filterRunData(run, resolveData);
-      },
     },
 
     steps: {
-      async create(runId, data) {
-        const now = new Date();
-
-        const result: Step = {
-          runId,
-          stepId: data.stepId,
-          stepName: data.stepName,
-          status: 'pending',
-          input: data.input as any[],
-          output: undefined,
-          error: undefined,
-          attempt: 0,
-          startedAt: undefined,
-          completedAt: undefined,
-          createdAt: now,
-          updatedAt: now,
-        };
-
-        const compositeKey = `${runId}-${data.stepId}`;
-        const stepPath = path.join(basedir, 'steps', `${compositeKey}.json`);
-        StepSchema.parse(result);
-        await writeJSON(stepPath, result);
-
-        return result;
-      },
-
       async get(
         runId: string | undefined,
         stepId: string,
@@ -433,41 +274,6 @@ export function createStorage(basedir: string): Storage {
         return filterStepData(step, resolveData);
       },
 
-      /**
-       * Updates a step.
-       *
-       * Note: This operation is not atomic. Concurrent updates from multiple
-       * processes may result in lost updates (last writer wins). This is an
-       * inherent limitation of filesystem-based storage without locking.
-       */
-      async update(runId, stepId, data) {
-        const compositeKey = `${runId}-${stepId}`;
-        const stepPath = path.join(basedir, 'steps', `${compositeKey}.json`);
-        const step = await readJSON(stepPath, StepSchema);
-        if (!step) {
-          throw new Error(`Step ${stepId} in run ${runId} not found`);
-        }
-
-        const now = new Date();
-        const updatedStep: Step = {
-          ...step,
-          ...data,
-          updatedAt: now,
-        };
-
-        // Only set startedAt the first time the step transitions to 'running'
-        if (data.status === 'running' && !updatedStep.startedAt) {
-          updatedStep.startedAt = now;
-        }
-        if (data.status === 'completed' || data.status === 'failed') {
-          updatedStep.completedAt = now;
-        }
-
-        StepSchema.parse(updatedStep);
-        await writeJSON(stepPath, updatedStep, { overwrite: true });
-        return updatedStep;
-      },
-
       async list(params) {
         const resolveData = params.resolveData ?? DEFAULT_RESOLVE_DATA_OPTION;
         const result = await paginatedFileSystemQuery({
@@ -499,25 +305,409 @@ export function createStorage(basedir: string): Storage {
 
     // Events - filesystem-backed storage
     events: {
-      async create(runId, data, params) {
+      async create(runId, data, params): Promise<EventResult> {
         const eventId = `evnt_${monotonicUlid()}`;
         const now = new Date();
 
-        const result: Event = {
+        // For run_created events, generate runId server-side if null or empty
+        let effectiveRunId: string;
+        if (data.eventType === 'run_created' && (!runId || runId === '')) {
+          effectiveRunId = `wrun_${monotonicUlid()}`;
+        } else if (!runId) {
+          throw new Error('runId is required for non-run_created events');
+        } else {
+          effectiveRunId = runId;
+        }
+
+        const event: Event = {
           ...data,
-          runId,
+          runId: effectiveRunId,
           eventId,
           createdAt: now,
         };
 
+        // Track entity created/updated for EventResult
+        let run: WorkflowRun | undefined;
+        let step: Step | undefined;
+        let hook: Hook | undefined;
+
+        // Create/update entity based on event type (event-sourced architecture)
+        // Run lifecycle events
+        if (data.eventType === 'run_created' && 'eventData' in data) {
+          const runData = data.eventData as {
+            deploymentId: string;
+            workflowName: string;
+            input: any[];
+            executionContext?: Record<string, any>;
+          };
+          run = {
+            runId: effectiveRunId,
+            deploymentId: runData.deploymentId,
+            status: 'pending',
+            workflowName: runData.workflowName,
+            executionContext: runData.executionContext,
+            input: runData.input || [],
+            output: undefined,
+            error: undefined,
+            startedAt: undefined,
+            completedAt: undefined,
+            createdAt: now,
+            updatedAt: now,
+          };
+          const runPath = path.join(basedir, 'runs', `${effectiveRunId}.json`);
+          await writeJSON(runPath, run);
+        } else if (data.eventType === 'run_started') {
+          const runPath = path.join(basedir, 'runs', `${effectiveRunId}.json`);
+          const existingRun = await readJSON(runPath, WorkflowRunSchema);
+          if (existingRun) {
+            run = {
+              runId: existingRun.runId,
+              deploymentId: existingRun.deploymentId,
+              workflowName: existingRun.workflowName,
+              executionContext: existingRun.executionContext,
+              input: existingRun.input,
+              createdAt: existingRun.createdAt,
+              expiredAt: existingRun.expiredAt,
+              status: 'running',
+              output: undefined,
+              error: undefined,
+              completedAt: undefined,
+              startedAt: existingRun.startedAt ?? now,
+              updatedAt: now,
+            };
+            await writeJSON(runPath, run, { overwrite: true });
+          }
+        } else if (data.eventType === 'run_completed' && 'eventData' in data) {
+          const completedData = data.eventData as { output?: any };
+          const runPath = path.join(basedir, 'runs', `${effectiveRunId}.json`);
+          const existingRun = await readJSON(runPath, WorkflowRunSchema);
+          if (existingRun) {
+            run = {
+              runId: existingRun.runId,
+              deploymentId: existingRun.deploymentId,
+              workflowName: existingRun.workflowName,
+              executionContext: existingRun.executionContext,
+              input: existingRun.input,
+              createdAt: existingRun.createdAt,
+              expiredAt: existingRun.expiredAt,
+              startedAt: existingRun.startedAt,
+              status: 'completed',
+              output: completedData.output,
+              error: undefined,
+              completedAt: now,
+              updatedAt: now,
+            };
+            await writeJSON(runPath, run, { overwrite: true });
+            await deleteAllHooksForRun(basedir, effectiveRunId);
+          }
+        } else if (data.eventType === 'run_failed' && 'eventData' in data) {
+          const failedData = data.eventData as {
+            error: any;
+            errorCode?: string;
+          };
+          const runPath = path.join(basedir, 'runs', `${effectiveRunId}.json`);
+          const existingRun = await readJSON(runPath, WorkflowRunSchema);
+          if (existingRun) {
+            run = {
+              runId: existingRun.runId,
+              deploymentId: existingRun.deploymentId,
+              workflowName: existingRun.workflowName,
+              executionContext: existingRun.executionContext,
+              input: existingRun.input,
+              createdAt: existingRun.createdAt,
+              expiredAt: existingRun.expiredAt,
+              startedAt: existingRun.startedAt,
+              status: 'failed',
+              output: undefined,
+              error: {
+                message:
+                  typeof failedData.error === 'string'
+                    ? failedData.error
+                    : (failedData.error?.message ?? 'Unknown error'),
+                stack: failedData.error?.stack,
+                code: failedData.errorCode,
+              },
+              completedAt: now,
+              updatedAt: now,
+            };
+            await writeJSON(runPath, run, { overwrite: true });
+            await deleteAllHooksForRun(basedir, effectiveRunId);
+          }
+        } else if (data.eventType === 'run_cancelled') {
+          const runPath = path.join(basedir, 'runs', `${effectiveRunId}.json`);
+          const existingRun = await readJSON(runPath, WorkflowRunSchema);
+          if (existingRun) {
+            run = {
+              runId: existingRun.runId,
+              deploymentId: existingRun.deploymentId,
+              workflowName: existingRun.workflowName,
+              executionContext: existingRun.executionContext,
+              input: existingRun.input,
+              createdAt: existingRun.createdAt,
+              expiredAt: existingRun.expiredAt,
+              startedAt: existingRun.startedAt,
+              status: 'cancelled',
+              output: undefined,
+              error: undefined,
+              completedAt: now,
+              updatedAt: now,
+            };
+            await writeJSON(runPath, run, { overwrite: true });
+            await deleteAllHooksForRun(basedir, effectiveRunId);
+          }
+        } else if (data.eventType === 'run_paused') {
+          const runPath = path.join(basedir, 'runs', `${effectiveRunId}.json`);
+          const existingRun = await readJSON(runPath, WorkflowRunSchema);
+          if (existingRun) {
+            run = {
+              runId: existingRun.runId,
+              deploymentId: existingRun.deploymentId,
+              workflowName: existingRun.workflowName,
+              executionContext: existingRun.executionContext,
+              input: existingRun.input,
+              createdAt: existingRun.createdAt,
+              expiredAt: existingRun.expiredAt,
+              startedAt: existingRun.startedAt,
+              status: 'paused',
+              output: undefined,
+              error: undefined,
+              completedAt: undefined,
+              updatedAt: now,
+            };
+            await writeJSON(runPath, run, { overwrite: true });
+          }
+        } else if (data.eventType === 'run_resumed') {
+          const runPath = path.join(basedir, 'runs', `${effectiveRunId}.json`);
+          const existingRun = await readJSON(runPath, WorkflowRunSchema);
+          if (existingRun) {
+            run = {
+              runId: existingRun.runId,
+              deploymentId: existingRun.deploymentId,
+              workflowName: existingRun.workflowName,
+              executionContext: existingRun.executionContext,
+              input: existingRun.input,
+              createdAt: existingRun.createdAt,
+              expiredAt: existingRun.expiredAt,
+              startedAt: existingRun.startedAt,
+              status: 'running',
+              output: undefined,
+              error: undefined,
+              completedAt: undefined,
+              updatedAt: now,
+            };
+            await writeJSON(runPath, run, { overwrite: true });
+          }
+        } else if (
+          // Step lifecycle events
+          data.eventType === 'step_created' &&
+          'eventData' in data
+        ) {
+          // step_created: Creates step entity with status 'pending', attempt=0, createdAt set
+          const stepData = data.eventData as {
+            stepName: string;
+            input: any;
+          };
+          step = {
+            runId: effectiveRunId,
+            stepId: data.correlationId,
+            stepName: stepData.stepName,
+            status: 'pending',
+            input: stepData.input,
+            output: undefined,
+            lastKnownError: undefined,
+            attempt: 0,
+            firstStartedAt: undefined,
+            completedAt: undefined,
+            createdAt: now,
+            updatedAt: now,
+          };
+          const stepCompositeKey = `${effectiveRunId}-${data.correlationId}`;
+          const stepPath = path.join(
+            basedir,
+            'steps',
+            `${stepCompositeKey}.json`
+          );
+          await writeJSON(stepPath, step);
+        } else if (data.eventType === 'step_started') {
+          // step_started: Increments attempt, sets status to 'running'
+          // Sets firstStartedAt only on the first start (not updated on retries)
+          const stepCompositeKey = `${effectiveRunId}-${data.correlationId}`;
+          const stepPath = path.join(
+            basedir,
+            'steps',
+            `${stepCompositeKey}.json`
+          );
+          const existingStep = await readJSON(stepPath, StepSchema);
+          if (existingStep) {
+            step = {
+              ...existingStep,
+              status: 'running',
+              // Only set firstStartedAt on the first start
+              firstStartedAt: existingStep.firstStartedAt ?? now,
+              // Increment attempt counter on every start
+              attempt: existingStep.attempt + 1,
+              updatedAt: now,
+            };
+            await writeJSON(stepPath, step, { overwrite: true });
+          }
+        } else if (data.eventType === 'step_completed' && 'eventData' in data) {
+          // step_completed: Terminal state with output
+          const completedData = data.eventData as { result: any };
+          const stepCompositeKey = `${effectiveRunId}-${data.correlationId}`;
+          const stepPath = path.join(
+            basedir,
+            'steps',
+            `${stepCompositeKey}.json`
+          );
+          const existingStep = await readJSON(stepPath, StepSchema);
+          if (existingStep) {
+            step = {
+              ...existingStep,
+              status: 'completed',
+              output: completedData.result,
+              completedAt: now,
+              updatedAt: now,
+            };
+            await writeJSON(stepPath, step, { overwrite: true });
+          }
+        } else if (data.eventType === 'step_failed' && 'eventData' in data) {
+          // step_failed: Terminal state with error (only if fatal=true)
+          // Always records lastKnownError regardless of fatal flag
+          const failedData = data.eventData as {
+            error: any;
+            stack?: string;
+            fatal?: boolean;
+          };
+          const stepCompositeKey = `${effectiveRunId}-${data.correlationId}`;
+          const stepPath = path.join(
+            basedir,
+            'steps',
+            `${stepCompositeKey}.json`
+          );
+          const existingStep = await readJSON(stepPath, StepSchema);
+          if (existingStep) {
+            const lastKnownError = {
+              message:
+                typeof failedData.error === 'string'
+                  ? failedData.error
+                  : (failedData.error?.message ?? 'Unknown error'),
+              stack: failedData.stack,
+            };
+            // Only mark step as failed if fatal=true, otherwise just record the error
+            if (failedData.fatal) {
+              step = {
+                ...existingStep,
+                status: 'failed',
+                lastKnownError,
+                completedAt: now,
+                updatedAt: now,
+              };
+            } else {
+              // Non-fatal: just record the error, keep status unchanged
+              step = {
+                ...existingStep,
+                lastKnownError,
+                updatedAt: now,
+              };
+            }
+            await writeJSON(stepPath, step, { overwrite: true });
+          }
+        } else if (data.eventType === 'step_retrying' && 'eventData' in data) {
+          // step_retrying: Sets status back to 'pending', records error in lastKnownError
+          const retryData = data.eventData as {
+            error: any;
+            stack?: string;
+            retryAfter?: Date;
+          };
+          const stepCompositeKey = `${effectiveRunId}-${data.correlationId}`;
+          const stepPath = path.join(
+            basedir,
+            'steps',
+            `${stepCompositeKey}.json`
+          );
+          const existingStep = await readJSON(stepPath, StepSchema);
+          if (existingStep) {
+            step = {
+              ...existingStep,
+              status: 'pending',
+              lastKnownError: {
+                message:
+                  typeof retryData.error === 'string'
+                    ? retryData.error
+                    : (retryData.error?.message ?? 'Unknown error'),
+                stack: retryData.stack,
+              },
+              retryAfter: retryData.retryAfter,
+              updatedAt: now,
+            };
+            await writeJSON(stepPath, step, { overwrite: true });
+          }
+        } else if (
+          // Hook lifecycle events
+          data.eventType === 'hook_created' &&
+          'eventData' in data
+        ) {
+          const hookData = data.eventData as {
+            token: string;
+            metadata?: any;
+          };
+
+          // Check for duplicate token before creating hook
+          const hooksDir = path.join(basedir, 'hooks');
+          const hookFiles = await listJSONFiles(hooksDir);
+          for (const file of hookFiles) {
+            const existingHookPath = path.join(hooksDir, `${file}.json`);
+            const existingHook = await readJSON(existingHookPath, HookSchema);
+            if (existingHook && existingHook.token === hookData.token) {
+              throw new Error(
+                `Hook with token ${hookData.token} already exists for this project`
+              );
+            }
+          }
+
+          hook = {
+            runId: effectiveRunId,
+            hookId: data.correlationId,
+            token: hookData.token,
+            metadata: hookData.metadata,
+            ownerId: 'local-owner',
+            projectId: 'local-project',
+            environment: 'local',
+            createdAt: now,
+          };
+          const hookPath = path.join(
+            basedir,
+            'hooks',
+            `${data.correlationId}.json`
+          );
+          await writeJSON(hookPath, hook);
+        } else if (data.eventType === 'hook_disposed') {
+          // Delete the hook when disposed
+          const hookPath = path.join(
+            basedir,
+            'hooks',
+            `${data.correlationId}.json`
+          );
+          await deleteJSON(hookPath);
+        }
+        // Note: hook_received events are stored in the event log but don't
+        // modify the Hook entity (which doesn't have a payload field)
+
         // Store event using composite key {runId}-{eventId}
-        const compositeKey = `${runId}-${eventId}`;
+        const compositeKey = `${effectiveRunId}-${eventId}`;
         const eventPath = path.join(basedir, 'events', `${compositeKey}.json`);
-        EventSchema.parse(result);
-        await writeJSON(eventPath, result);
+        await writeJSON(eventPath, event);
 
         const resolveData = params?.resolveData ?? DEFAULT_RESOLVE_DATA_OPTION;
-        return filterEventData(result, resolveData);
+        const filteredEvent = filterEventData(event, resolveData);
+
+        // Return EventResult with event and any created/updated entity
+        return {
+          event: filteredEvent,
+          run,
+          step,
+          hook,
+        };
       },
 
       async list(params) {
diff --git a/packages/world-postgres/src/drizzle/schema.ts b/packages/world-postgres/src/drizzle/schema.ts
index 8a6bce004..dafcd5eb4 100644
--- a/packages/world-postgres/src/drizzle/schema.ts
+++ b/packages/world-postgres/src/drizzle/schema.ts
@@ -105,6 +105,12 @@ export const events = schema.table(
   (tb) => [index().on(tb.runId), index().on(tb.correlationId)]
 );
 
+/**
+ * Database schema for steps. Note: DB column names differ from Step interface:
+ * - error (DB) → lastKnownError (Step interface)
+ * - startedAt (DB) → firstStartedAt (Step interface)
+ * The mapping is done in storage.ts deserializeStepError()
+ */
 export const steps = schema.table(
   'workflow_steps',
   {
@@ -118,8 +124,10 @@ export const steps = schema.table(
     /** @deprecated we stream binary data */
     outputJson: jsonb('output').$type<SerializedContent>(),
     output: Cbor<SerializedContent>()('output_cbor'),
+    /** Maps to lastKnownError in Step interface */
     error: text('error'),
     attempt: integer('attempt').notNull(),
+    /** Maps to firstStartedAt in Step interface */
     startedAt: timestamp('started_at'),
     completedAt: timestamp('completed_at'),
     createdAt: timestamp('created_at').defaultNow().notNull(),
@@ -129,7 +137,14 @@ export const steps = schema.table(
       .notNull(),
     retryAfter: timestamp('retry_after'),
   } satisfies DrizzlishOfType<
-    Cborized<Omit<Step, 'input'> & { input?: unknown }, 'output' | 'input'>
+    Cborized<
+      Omit<Step, 'input' | 'lastKnownError' | 'firstStartedAt'> & {
+        input?: unknown;
+        error?: string;
+        startedAt?: Date;
+      },
+      'output' | 'input'
+    >
   >,
   (tb) => [index().on(tb.runId), index().on(tb.status)]
 );
diff --git a/packages/world-postgres/src/storage.ts b/packages/world-postgres/src/storage.ts
index a36e1514c..4f477bf91 100644
--- a/packages/world-postgres/src/storage.ts
+++ b/packages/world-postgres/src/storage.ts
@@ -1,6 +1,7 @@
 import { WorkflowAPIError } from '@workflow/errors';
 import type {
   Event,
+  EventResult,
   Hook,
   ListEventsParams,
   ListHooksParams,
@@ -8,8 +9,6 @@ import type {
   ResolveData,
   Step,
   Storage,
-  UpdateStepRequest,
-  UpdateWorkflowRunRequest,
   WorkflowRun,
 } from '@workflow/world';
 import {
@@ -24,25 +23,6 @@ import { type Drizzle, Schema } from './drizzle/index.js';
 import type { SerializedContent } from './drizzle/schema.js';
 import { compact } from './util.js';
 
-/**
- * Serialize a StructuredError object into a JSON string
- */
-function serializeRunError(data: UpdateWorkflowRunRequest): any {
-  if (!data.error) {
-    return data;
-  }
-
-  const { error, ...rest } = data;
-  return {
-    ...rest,
-    error: JSON.stringify({
-      message: error.message,
-      stack: error.stack,
-      code: error.code,
-    }),
-  };
-}
-
 /**
  * Deserialize error JSON string (or legacy flat fields) into a StructuredError object
  * Handles backwards compatibility:
@@ -88,64 +68,46 @@ function deserializeRunError(run: any): WorkflowRun {
 }
 
 /**
- * Serialize a StructuredError object into a JSON string for steps
+ * Deserialize step data, mapping DB columns to interface fields:
+ * - `error` (DB column) → `lastKnownError` (Step interface)
+ * - `startedAt` (DB column) → `firstStartedAt` (Step interface)
  */
-function serializeStepError(data: UpdateStepRequest): any {
-  if (!data.error) {
-    return data;
-  }
+function deserializeStepError(step: any): Step {
+  const { error, startedAt, ...rest } = step;
 
-  const { error, ...rest } = data;
-  return {
+  const result: any = {
     ...rest,
-    error: JSON.stringify({
-      message: error.message,
-      stack: error.stack,
-      code: error.code,
-    }),
+    // Map startedAt to firstStartedAt
+    firstStartedAt: startedAt,
   };
-}
-
-/**
- * Deserialize error JSON string (or legacy flat fields) into a StructuredError object for steps
- */
-function deserializeStepError(step: any): Step {
-  const { error, ...rest } = step;
 
   if (!error) {
-    return step as Step;
+    return result as Step;
   }
 
   // Try to parse as structured error JSON
-  if (error) {
-    try {
-      const parsed = JSON.parse(error);
-      if (typeof parsed === 'object' && parsed.message !== undefined) {
-        return {
-          ...rest,
-          error: {
-            message: parsed.message,
-            stack: parsed.stack,
-            code: parsed.code,
-          },
-        } as Step;
-      }
-    } catch {
-      // Not JSON, treat as plain string
+  try {
+    const parsed = JSON.parse(error);
+    if (typeof parsed === 'object' && parsed.message !== undefined) {
+      result.lastKnownError = {
+        message: parsed.message,
+        stack: parsed.stack,
+        code: parsed.code,
+      };
+      return result as Step;
     }
+  } catch {
+    // Not JSON, treat as plain string
   }
 
   // Backwards compatibility: handle legacy separate fields or plain string error
-  return {
-    ...rest,
-    error: {
-      message: error || '',
-    },
-  } as Step;
+  result.lastKnownError = {
+    message: error || '',
+  };
+  return result as Step;
 }
 
 export function createRunsStorage(drizzle: Drizzle): Storage['runs'] {
-  const ulid = monotonicFactory();
   const { runs } = Schema;
   const get = drizzle
     .select()
@@ -168,76 +130,6 @@ export function createRunsStorage(drizzle: Drizzle): Storage['runs'] {
       const resolveData = params?.resolveData ?? 'all';
       return filterRunData(parsed, resolveData);
     },
-    async cancel(id, params) {
-      // TODO: we might want to guard this for only specific statuses
-      const [value] = await drizzle
-        .update(Schema.runs)
-        .set({ status: 'cancelled', completedAt: sql`now()` })
-        .where(eq(runs.runId, id))
-        .returning();
-      if (!value) {
-        throw new WorkflowAPIError(`Run not found: ${id}`, { status: 404 });
-      }
-
-      // Clean up all hooks for this run when cancelling
-      await drizzle.delete(Schema.hooks).where(eq(Schema.hooks.runId, id));
-
-      const deserialized = deserializeRunError(compact(value));
-      const parsed = WorkflowRunSchema.parse(deserialized);
-      const resolveData = params?.resolveData ?? 'all';
-      return filterRunData(parsed, resolveData);
-    },
-    async pause(id, params) {
-      // TODO: we might want to guard this for only specific statuses
-      const [value] = await drizzle
-        .update(Schema.runs)
-        .set({ status: 'paused' })
-        .where(eq(runs.runId, id))
-        .returning();
-      if (!value) {
-        throw new WorkflowAPIError(`Run not found: ${id}`, { status: 404 });
-      }
-      const deserialized = deserializeRunError(compact(value));
-      const parsed = WorkflowRunSchema.parse(deserialized);
-      const resolveData = params?.resolveData ?? 'all';
-      return filterRunData(parsed, resolveData);
-    },
-    async resume(id, params) {
-      // Fetch current run to check if startedAt is already set
-      const [currentRun] = await drizzle
-        .select()
-        .from(runs)
-        .where(eq(runs.runId, id))
-        .limit(1);
-
-      if (!currentRun) {
-        throw new WorkflowAPIError(`Run not found: ${id}`, { status: 404 });
-      }
-
-      const updates: Partial<typeof runs._.inferInsert> = {
-        status: 'running',
-      };
-
-      // Only set startedAt the first time the run transitions to 'running'
-      if (!currentRun.startedAt) {
-        updates.startedAt = new Date();
-      }
-
-      const [value] = await drizzle
-        .update(Schema.runs)
-        .set(updates)
-        .where(and(eq(runs.runId, id), eq(runs.status, 'paused')))
-        .returning();
-      if (!value) {
-        throw new WorkflowAPIError(`Paused run not found: ${id}`, {
-          status: 404,
-        });
-      }
-      const deserialized = deserializeRunError(compact(value));
-      const parsed = WorkflowRunSchema.parse(deserialized);
-      const resolveData = params?.resolveData ?? 'all';
-      return filterRunData(parsed, resolveData);
-    },
     async list(params) {
       const limit = params?.pagination?.limit ?? 20;
       const fromCursor = params?.pagination?.cursor;
@@ -268,98 +160,349 @@ export function createRunsStorage(drizzle: Drizzle): Storage['runs'] {
         cursor: values.at(-1)?.runId ?? null,
       };
     },
-    async create(data) {
-      const runId = `wrun_${ulid()}`;
-      const [value] = await drizzle
-        .insert(runs)
-        .values({
-          runId,
-          input: data.input,
-          executionContext: data.executionContext as Record<
-            string,
-            unknown
-          > | null,
-          deploymentId: data.deploymentId,
-          status: 'pending',
-          workflowName: data.workflowName,
-        })
-        .onConflictDoNothing()
-        .returning();
-      if (!value) {
-        throw new WorkflowAPIError(`Run ${runId} already exists`, {
-          status: 409,
-        });
+  };
+}
+
+function map<T, R>(obj: T | null | undefined, fn: (v: T) => R): undefined | R {
+  return obj ? fn(obj) : undefined;
+}
+
+export function createEventsStorage(drizzle: Drizzle): Storage['events'] {
+  const ulid = monotonicFactory();
+  const { events } = Schema;
+
+  return {
+    async create(runId, data, params): Promise<EventResult> {
+      const eventId = `wevt_${ulid()}`;
+
+      // For run_created events, generate runId server-side if null or empty
+      let effectiveRunId: string;
+      if (data.eventType === 'run_created' && (!runId || runId === '')) {
+        effectiveRunId = `wrun_${ulid()}`;
+      } else if (!runId) {
+        throw new Error('runId is required for non-run_created events');
+      } else {
+        effectiveRunId = runId;
       }
-      return deserializeRunError(compact(value));
-    },
-    async update(id, data) {
-      // Fetch current run to check if startedAt is already set
-      const [currentRun] = await drizzle
-        .select()
-        .from(runs)
-        .where(eq(runs.runId, id))
-        .limit(1);
 
-      if (!currentRun) {
-        throw new WorkflowAPIError(`Run not found: ${id}`, { status: 404 });
+      // Track entity created/updated for EventResult
+      let run: WorkflowRun | undefined;
+      let step: Step | undefined;
+      let hook: Hook | undefined;
+      const now = new Date();
+
+      // Handle run_created event: create the run entity atomically
+      if (data.eventType === 'run_created') {
+        const eventData = (data as any).eventData as {
+          deploymentId: string;
+          workflowName: string;
+          input: any[];
+          executionContext?: Record<string, any>;
+        };
+        const [runValue] = await drizzle
+          .insert(Schema.runs)
+          .values({
+            runId: effectiveRunId,
+            deploymentId: eventData.deploymentId,
+            workflowName: eventData.workflowName,
+            input: eventData.input as SerializedContent,
+            executionContext: eventData.executionContext as
+              | SerializedContent
+              | undefined,
+            status: 'pending',
+          })
+          .onConflictDoNothing()
+          .returning();
+        if (runValue) {
+          run = deserializeRunError(compact(runValue));
+        }
       }
 
-      // Serialize the error field if present
-      const serialized = serializeRunError(data);
+      // Handle run_started event: update run status
+      if (data.eventType === 'run_started') {
+        const [runValue] = await drizzle
+          .update(Schema.runs)
+          .set({
+            status: 'running',
+            startedAt: now,
+            updatedAt: now,
+          })
+          .where(eq(Schema.runs.runId, effectiveRunId))
+          .returning();
+        if (runValue) {
+          run = deserializeRunError(compact(runValue));
+        }
+      }
 
-      const updates: Partial<typeof runs._.inferInsert> = {
-        ...serialized,
-        output: data.output as SerializedContent,
-      };
+      // Handle run_completed event: update run status and cleanup hooks
+      if (data.eventType === 'run_completed') {
+        const eventData = (data as any).eventData as { output?: any };
+        const [runValue] = await drizzle
+          .update(Schema.runs)
+          .set({
+            status: 'completed',
+            output: eventData.output as SerializedContent | undefined,
+            completedAt: now,
+            updatedAt: now,
+          })
+          .where(eq(Schema.runs.runId, effectiveRunId))
+          .returning();
+        if (runValue) {
+          run = deserializeRunError(compact(runValue));
+        }
+        // Delete all hooks for this run to allow token reuse
+        await drizzle
+          .delete(Schema.hooks)
+          .where(eq(Schema.hooks.runId, effectiveRunId));
+      }
 
-      // Only set startedAt the first time transitioning to 'running'
-      if (data.status === 'running' && !currentRun.startedAt) {
-        updates.startedAt = new Date();
+      // Handle run_failed event: update run status and cleanup hooks
+      if (data.eventType === 'run_failed') {
+        const eventData = (data as any).eventData as {
+          error: any;
+          errorCode?: string;
+        };
+        const errorMessage =
+          typeof eventData.error === 'string'
+            ? eventData.error
+            : (eventData.error?.message ?? 'Unknown error');
+        // Store structured error as JSON for deserializeRunError to parse
+        const errorJson = JSON.stringify({
+          message: errorMessage,
+          stack: eventData.error?.stack,
+          code: eventData.errorCode,
+        });
+        const [runValue] = await drizzle
+          .update(Schema.runs)
+          .set({
+            status: 'failed',
+            error: errorJson,
+            completedAt: now,
+            updatedAt: now,
+          })
+          .where(eq(Schema.runs.runId, effectiveRunId))
+          .returning();
+        if (runValue) {
+          run = deserializeRunError(compact(runValue));
+        }
+        // Delete all hooks for this run to allow token reuse
+        await drizzle
+          .delete(Schema.hooks)
+          .where(eq(Schema.hooks.runId, effectiveRunId));
       }
 
-      const isBecomingTerminal =
-        data.status === 'completed' ||
-        data.status === 'failed' ||
-        data.status === 'cancelled';
+      // Handle run_cancelled event: update run status and cleanup hooks
+      if (data.eventType === 'run_cancelled') {
+        const [runValue] = await drizzle
+          .update(Schema.runs)
+          .set({
+            status: 'cancelled',
+            completedAt: now,
+            updatedAt: now,
+          })
+          .where(eq(Schema.runs.runId, effectiveRunId))
+          .returning();
+        if (runValue) {
+          run = deserializeRunError(compact(runValue));
+        }
+        // Delete all hooks for this run to allow token reuse
+        await drizzle
+          .delete(Schema.hooks)
+          .where(eq(Schema.hooks.runId, effectiveRunId));
+      }
 
-      if (isBecomingTerminal) {
-        updates.completedAt = new Date();
+      // Handle step_created event: create step entity
+      if (data.eventType === 'step_created') {
+        const eventData = (data as any).eventData as {
+          stepName: string;
+          input: any;
+        };
+        const [stepValue] = await drizzle
+          .insert(Schema.steps)
+          .values({
+            runId: effectiveRunId,
+            stepId: data.correlationId!,
+            stepName: eventData.stepName,
+            input: eventData.input as SerializedContent,
+            status: 'pending',
+            attempt: 0,
+          })
+          .onConflictDoNothing()
+          .returning();
+        if (stepValue) {
+          step = deserializeStepError(compact(stepValue));
+        }
       }
 
-      const [value] = await drizzle
-        .update(runs)
-        .set(updates)
-        .where(eq(runs.runId, id))
-        .returning();
-      if (!value) {
-        throw new WorkflowAPIError(`Run not found: ${id}`, { status: 404 });
+      // Handle step_started event: increment attempt, set status to 'running'
+      // Sets startedAt (maps to firstStartedAt) only on first start
+      if (data.eventType === 'step_started') {
+        // First, get the current step to check attempt
+        const [existingStep] = await drizzle
+          .select()
+          .from(Schema.steps)
+          .where(
+            and(
+              eq(Schema.steps.runId, effectiveRunId),
+              eq(Schema.steps.stepId, data.correlationId!)
+            )
+          )
+          .limit(1);
+
+        const isFirstStart = !existingStep?.startedAt;
+
+        const [stepValue] = await drizzle
+          .update(Schema.steps)
+          .set({
+            status: 'running',
+            // Increment attempt counter using SQL
+            attempt: sql`${Schema.steps.attempt} + 1`,
+            // Only set startedAt on first start (not updated on retries)
+            ...(isFirstStart ? { startedAt: now } : {}),
+          })
+          .where(
+            and(
+              eq(Schema.steps.runId, effectiveRunId),
+              eq(Schema.steps.stepId, data.correlationId!)
+            )
+          )
+          .returning();
+        if (stepValue) {
+          step = deserializeStepError(compact(stepValue));
+        }
       }
 
-      // If transitioning to a terminal status, clean up all hooks for this run
-      if (isBecomingTerminal) {
-        await drizzle.delete(Schema.hooks).where(eq(Schema.hooks.runId, id));
+      // Handle step_completed event: update step status
+      if (data.eventType === 'step_completed') {
+        const eventData = (data as any).eventData as { result?: any };
+        const [stepValue] = await drizzle
+          .update(Schema.steps)
+          .set({
+            status: 'completed',
+            output: eventData.result as SerializedContent | undefined,
+            completedAt: now,
+          })
+          .where(
+            and(
+              eq(Schema.steps.runId, effectiveRunId),
+              eq(Schema.steps.stepId, data.correlationId!)
+            )
+          )
+          .returning();
+        if (stepValue) {
+          step = deserializeStepError(compact(stepValue));
+        }
       }
 
-      return deserializeRunError(compact(value));
-    },
-  };
-}
+      // Handle step_failed event: terminal state with error (only if fatal=true)
+      // Always records lastKnownError regardless of fatal flag
+      if (data.eventType === 'step_failed') {
+        const eventData = (data as any).eventData as {
+          error?: any;
+          stack?: string;
+          fatal?: boolean;
+        };
+        // Store structured error as JSON for deserializeStepError to parse
+        const errorMessage =
+          typeof eventData.error === 'string'
+            ? eventData.error
+            : (eventData.error?.message ?? 'Unknown error');
+        const errorJson = JSON.stringify({
+          message: errorMessage,
+          stack: eventData.stack,
+        });
 
-function map<T, R>(obj: T | null | undefined, fn: (v: T) => R): undefined | R {
-  return obj ? fn(obj) : undefined;
-}
+        const updateData: Partial<typeof Schema.steps._.inferInsert> = {
+          // Always record the error in lastKnownError (stored as 'error' column)
+          error: errorJson,
+        };
+
+        // Only mark step as failed if fatal=true
+        if (eventData.fatal) {
+          updateData.status = 'failed';
+          updateData.completedAt = now;
+        }
+
+        const [stepValue] = await drizzle
+          .update(Schema.steps)
+          .set(updateData)
+          .where(
+            and(
+              eq(Schema.steps.runId, effectiveRunId),
+              eq(Schema.steps.stepId, data.correlationId!)
+            )
+          )
+          .returning();
+        if (stepValue) {
+          step = deserializeStepError(compact(stepValue));
+        }
+      }
 
-export function createEventsStorage(drizzle: Drizzle): Storage['events'] {
-  const ulid = monotonicFactory();
-  const { events } = Schema;
+      // Handle step_retrying event: sets status back to 'pending', records error in lastKnownError
+      if (data.eventType === 'step_retrying') {
+        const eventData = (data as any).eventData as {
+          error?: any;
+          stack?: string;
+          retryAfter?: Date;
+        };
+        // Store error in lastKnownError (stored as 'error' column)
+        const errorMessage =
+          typeof eventData.error === 'string'
+            ? eventData.error
+            : (eventData.error?.message ?? 'Unknown error');
+        const errorJson = JSON.stringify({
+          message: errorMessage,
+          stack: eventData.stack,
+        });
+
+        const [stepValue] = await drizzle
+          .update(Schema.steps)
+          .set({
+            status: 'pending',
+            error: errorJson,
+            retryAfter: eventData.retryAfter,
+          })
+          .where(
+            and(
+              eq(Schema.steps.runId, effectiveRunId),
+              eq(Schema.steps.stepId, data.correlationId!)
+            )
+          )
+          .returning();
+        if (stepValue) {
+          step = deserializeStepError(compact(stepValue));
+        }
+      }
+
+      // Handle hook_created event: create hook entity
+      if (data.eventType === 'hook_created') {
+        const eventData = (data as any).eventData as {
+          token: string;
+          metadata?: any;
+        };
+        const [hookValue] = await drizzle
+          .insert(Schema.hooks)
+          .values({
+            runId: effectiveRunId,
+            hookId: data.correlationId!,
+            token: eventData.token,
+            metadata: eventData.metadata as SerializedContent,
+            ownerId: '', // TODO: get from context
+            projectId: '', // TODO: get from context
+            environment: '', // TODO: get from context
+          })
+          .onConflictDoNothing()
+          .returning();
+        if (hookValue) {
+          hookValue.metadata ||= hookValue.metadataJson;
+          hook = HookSchema.parse(compact(hookValue));
+        }
+      }
 
-  return {
-    async create(runId, data, params) {
-      const eventId = `wevt_${ulid()}`;
       const [value] = await drizzle
         .insert(events)
         .values({
-          runId,
+          runId: effectiveRunId,
           eventId,
           correlationId: data.correlationId,
           eventType: data.eventType,
@@ -371,10 +514,10 @@ export function createEventsStorage(drizzle: Drizzle): Storage['events'] {
           status: 409,
         });
       }
-      const result = { ...data, ...value, runId, eventId };
+      const result = { ...data, ...value, runId: effectiveRunId, eventId };
       const parsed = EventSchema.parse(result);
       const resolveData = params?.resolveData ?? 'all';
-      return filterEventData(parsed, resolveData);
+      return { event: filterEventData(parsed, resolveData), run, step, hook };
     },
     async list(params: ListEventsParams): Promise<PaginatedResponse<Event>> {
       const limit = params?.pagination?.limit ?? 100;
@@ -468,30 +611,6 @@ export function createHooksStorage(drizzle: Drizzle): Storage['hooks'] {
       const resolveData = params?.resolveData ?? 'all';
       return filterHookData(parsed, resolveData);
     },
-    async create(runId, data, params) {
-      const [value] = await drizzle
-        .insert(hooks)
-        .values({
-          runId,
-          hookId: data.hookId,
-          token: data.token,
-          metadata: data.metadata as SerializedContent,
-          ownerId: '', // TODO: get from context
-          projectId: '', // TODO: get from context
-          environment: '', // TODO: get from context
-        })
-        .onConflictDoNothing()
-        .returning();
-      if (!value) {
-        throw new WorkflowAPIError(`Hook ${data.hookId} already exists`, {
-          status: 409,
-        });
-      }
-      value.metadata ||= value.metadataJson;
-      const parsed = HookSchema.parse(compact(value));
-      const resolveData = params?.resolveData ?? 'all';
-      return filterHookData(parsed, resolveData);
-    },
     async getByToken(token, params) {
       const [value] = await getByToken.execute({ token });
       if (!value) {
@@ -532,20 +651,6 @@ export function createHooksStorage(drizzle: Drizzle): Storage['hooks'] {
         hasMore,
       };
     },
-    async dispose(hookId, params) {
-      const [value] = await drizzle
-        .delete(hooks)
-        .where(eq(hooks.hookId, hookId))
-        .returning();
-      if (!value) {
-        throw new WorkflowAPIError(`Hook not found: ${hookId}`, {
-          status: 404,
-        });
-      }
-      const parsed = HookSchema.parse(compact(value));
-      const resolveData = params?.resolveData ?? 'all';
-      return filterHookData(parsed, resolveData);
-    },
   };
 }
 
@@ -553,28 +658,6 @@ export function createStepsStorage(drizzle: Drizzle): Storage['steps'] {
   const { steps } = Schema;
 
   return {
-    async create(runId, data) {
-      const [value] = await drizzle
-        .insert(steps)
-        .values({
-          runId,
-          stepId: data.stepId,
-          stepName: data.stepName,
-          input: data.input as SerializedContent,
-          status: 'pending',
-          attempt: 0,
-        })
-        .onConflictDoNothing()
-        .returning();
-
-      if (!value) {
-        throw new WorkflowAPIError(`Step ${data.stepId} already exists`, {
-          status: 409,
-        });
-      }
-      return deserializeStepError(compact(value));
-    },
-
     async get(runId, stepId, params) {
       // If runId is not provided, query only by stepId
       const whereClause = runId
@@ -598,47 +681,6 @@ export function createStepsStorage(drizzle: Drizzle): Storage['steps'] {
       const resolveData = params?.resolveData ?? 'all';
       return filterStepData(parsed, resolveData);
     },
-    async update(runId, stepId, data) {
-      // Fetch current step to check if startedAt is already set
-      const [currentStep] = await drizzle
-        .select()
-        .from(steps)
-        .where(and(eq(steps.stepId, stepId), eq(steps.runId, runId)))
-        .limit(1);
-
-      if (!currentStep) {
-        throw new WorkflowAPIError(`Step not found: ${stepId}`, {
-          status: 404,
-        });
-      }
-
-      // Serialize the error field if present
-      const serialized = serializeStepError(data);
-
-      const updates: Partial<typeof steps._.inferInsert> = {
-        ...serialized,
-        output: data.output as SerializedContent,
-      };
-      const now = new Date();
-      // Only set startedAt the first time the step transitions to 'running'
-      if (data.status === 'running' && !currentStep.startedAt) {
-        updates.startedAt = now;
-      }
-      if (data.status === 'completed' || data.status === 'failed') {
-        updates.completedAt = now;
-      }
-      const [value] = await drizzle
-        .update(steps)
-        .set(updates)
-        .where(and(eq(steps.stepId, stepId), eq(steps.runId, runId)))
-        .returning();
-      if (!value) {
-        throw new WorkflowAPIError(`Step not found: ${stepId}`, {
-          status: 404,
-        });
-      }
-      return deserializeStepError(compact(value));
-    },
     async list(params) {
       const limit = params?.pagination?.limit ?? 20;
       const fromCursor = params?.pagination?.cursor;
diff --git a/packages/world-postgres/test/storage.test.ts b/packages/world-postgres/test/storage.test.ts
index b28ab5a83..aa219886c 100644
--- a/packages/world-postgres/test/storage.test.ts
+++ b/packages/world-postgres/test/storage.test.ts
@@ -1,5 +1,6 @@
 import { execSync } from 'node:child_process';
 import { PostgreSqlContainer } from '@testcontainers/postgresql';
+import type { Hook, Step, WorkflowRun } from '@workflow/world';
 import postgres from 'postgres';
 import {
   afterAll,
@@ -17,6 +18,103 @@ import {
   createStepsStorage,
 } from '../src/storage.js';
 
+// Helper types for events storage
+type EventsStorage = ReturnType<typeof createEventsStorage>;
+
+// Helper functions to create entities through events.create
+async function createRun(
+  events: EventsStorage,
+  data: {
+    deploymentId: string;
+    workflowName: string;
+    input: unknown[];
+    executionContext?: Record<string, unknown>;
+  }
+): Promise<WorkflowRun> {
+  const result = await events.create(null, {
+    eventType: 'run_created',
+    eventData: data,
+  });
+  if (!result.run) {
+    throw new Error('Expected run to be created');
+  }
+  return result.run;
+}
+
+async function updateRun(
+  events: EventsStorage,
+  runId: string,
+  eventType: 'run_started' | 'run_completed' | 'run_failed',
+  eventData?: Record<string, unknown>
+): Promise<WorkflowRun> {
+  const result = await events.create(runId, {
+    eventType,
+    eventData,
+  });
+  if (!result.run) {
+    throw new Error('Expected run to be updated');
+  }
+  return result.run;
+}
+
+async function createStep(
+  events: EventsStorage,
+  runId: string,
+  data: {
+    stepId: string;
+    stepName: string;
+    input: unknown[];
+  }
+): Promise<Step> {
+  const result = await events.create(runId, {
+    eventType: 'step_created',
+    correlationId: data.stepId,
+    eventData: { stepName: data.stepName, input: data.input },
+  });
+  if (!result.step) {
+    throw new Error('Expected step to be created');
+  }
+  return result.step;
+}
+
+async function updateStep(
+  events: EventsStorage,
+  runId: string,
+  stepId: string,
+  eventType: 'step_started' | 'step_completed' | 'step_failed',
+  eventData?: Record<string, unknown>
+): Promise<Step> {
+  const result = await events.create(runId, {
+    eventType,
+    correlationId: stepId,
+    eventData,
+  });
+  if (!result.step) {
+    throw new Error('Expected step to be updated');
+  }
+  return result.step;
+}
+
+async function createHook(
+  events: EventsStorage,
+  runId: string,
+  data: {
+    hookId: string;
+    token: string;
+    metadata?: unknown;
+  }
+): Promise<Hook> {
+  const result = await events.create(runId, {
+    eventType: 'hook_created',
+    correlationId: data.hookId,
+    eventData: { token: data.token, metadata: data.metadata },
+  });
+  if (!result.hook) {
+    throw new Error('Expected hook to be created');
+  }
+  return result.hook;
+}
+
 describe('Storage (Postgres integration)', () => {
   if (process.platform === 'win32') {
     test.skip('skipped on Windows since it relies on a docker container', () => {});
@@ -75,7 +173,7 @@ describe('Storage (Postgres integration)', () => {
           input: ['arg1', 'arg2'],
         };
 
-        const run = await runs.create(runData);
+        const run = await createRun(events, runData);
 
         expect(run.runId).toMatch(/^wrun_/);
         expect(run.deploymentId).toBe('deployment-123');
@@ -98,7 +196,7 @@ describe('Storage (Postgres integration)', () => {
           input: [],
         };
 
-        const run = await runs.create(runData);
+        const run = await createRun(events, runData);
 
         expect(run.executionContext).toBeUndefined();
         expect(run.input).toEqual([]);
@@ -107,7 +205,7 @@ describe('Storage (Postgres integration)', () => {
 
     describe('get', () => {
       it('should retrieve an existing run', async () => {
-        const created = await runs.create({
+        const created = await createRun(events, {
           deploymentId: 'deployment-123',
           workflowName: 'test-workflow',
           input: ['arg'],
@@ -126,72 +224,59 @@ describe('Storage (Postgres integration)', () => {
       });
     });
 
-    describe('update', () => {
-      it('should update run status to running', async () => {
-        const created = await runs.create({
+    describe('update via events', () => {
+      it('should update run status to running via run_started event', async () => {
+        const created = await createRun(events, {
           deploymentId: 'deployment-123',
           workflowName: 'test-workflow',
           input: [],
         });
 
-        const updated = await runs.update(created.runId, {
-          status: 'running',
-        });
+        const updated = await updateRun(events, created.runId, 'run_started');
         expect(updated.status).toBe('running');
         expect(updated.startedAt).toBeInstanceOf(Date);
       });
 
-      it('should update run status to completed', async () => {
-        const created = await runs.create({
+      it('should update run status to completed via run_completed event', async () => {
+        const created = await createRun(events, {
           deploymentId: 'deployment-123',
           workflowName: 'test-workflow',
           input: [],
         });
 
-        const updated = await runs.update(created.runId, {
-          status: 'completed',
-          output: [{ result: 42 }],
-        });
+        const updated = await updateRun(
+          events,
+          created.runId,
+          'run_completed',
+          {
+            output: [{ result: 42 }],
+          }
+        );
         expect(updated.status).toBe('completed');
         expect(updated.completedAt).toBeInstanceOf(Date);
         expect(updated.output).toEqual([{ result: 42 }]);
       });
 
-      it('should update run status to failed', async () => {
-        const created = await runs.create({
+      it('should update run status to failed via run_failed event', async () => {
+        const created = await createRun(events, {
           deploymentId: 'deployment-123',
           workflowName: 'test-workflow',
           input: [],
         });
 
-        const updated = await runs.update(created.runId, {
-          status: 'failed',
-          error: {
-            message: 'Something went wrong',
-            code: 'ERR_001',
-          },
+        const updated = await updateRun(events, created.runId, 'run_failed', {
+          error: 'Something went wrong',
         });
 
         expect(updated.status).toBe('failed');
-        expect(updated.error).toEqual({
-          message: 'Something went wrong',
-          code: 'ERR_001',
-        });
+        expect(updated.error?.message).toBe('Something went wrong');
         expect(updated.completedAt).toBeInstanceOf(Date);
       });
-
-      it('should throw error for non-existent run', async () => {
-        await expect(
-          runs.update('missing', { status: 'running' })
-        ).rejects.toMatchObject({
-          status: 404,
-        });
-      });
     });
 
     describe('list', () => {
       it('should list all runs', async () => {
-        const run1 = await runs.create({
+        const run1 = await createRun(events, {
           deploymentId: 'deployment-1',
           workflowName: 'workflow-1',
           input: [],
@@ -200,7 +285,7 @@ describe('Storage (Postgres integration)', () => {
         // Small delay to ensure different timestamps in createdAt
         await new Promise((resolve) => setTimeout(resolve, 2));
 
-        const run2 = await runs.create({
+        const run2 = await createRun(events, {
           deploymentId: 'deployment-2',
           workflowName: 'workflow-2',
           input: [],
@@ -218,12 +303,12 @@ describe('Storage (Postgres integration)', () => {
       });
 
       it('should filter runs by workflowName', async () => {
-        await runs.create({
+        await createRun(events, {
           deploymentId: 'deployment-1',
           workflowName: 'workflow-1',
           input: [],
         });
-        const run2 = await runs.create({
+        const run2 = await createRun(events, {
           deploymentId: 'deployment-2',
           workflowName: 'workflow-2',
           input: [],
@@ -238,7 +323,7 @@ describe('Storage (Postgres integration)', () => {
       it('should support pagination', async () => {
         // Create multiple runs
         for (let i = 0; i < 5; i++) {
-          await runs.create({
+          await createRun(events, {
             deploymentId: `deployment-${i}`,
             workflowName: `workflow-${i}`,
             input: [],
@@ -260,58 +345,13 @@ describe('Storage (Postgres integration)', () => {
         expect(page2.data[0].runId).not.toBe(page1.data[0].runId);
       });
     });
-
-    describe('cancel', () => {
-      it('should cancel a run', async () => {
-        const created = await runs.create({
-          deploymentId: 'deployment-123',
-          workflowName: 'test-workflow',
-          input: [],
-        });
-
-        const cancelled = await runs.cancel(created.runId);
-
-        expect(cancelled.status).toBe('cancelled');
-        expect(cancelled.completedAt).toBeInstanceOf(Date);
-      });
-    });
-
-    describe('pause', () => {
-      it('should pause a run', async () => {
-        const created = await runs.create({
-          deploymentId: 'deployment-123',
-          workflowName: 'test-workflow',
-          input: [],
-        });
-
-        const paused = await runs.pause(created.runId);
-
-        expect(paused.status).toBe('paused');
-      });
-    });
-
-    describe('resume', () => {
-      it('should resume a paused run', async () => {
-        const created = await runs.create({
-          deploymentId: 'deployment-123',
-          workflowName: 'test-workflow',
-          input: [],
-        });
-
-        await runs.pause(created.runId);
-        const resumed = await runs.resume(created.runId);
-
-        expect(resumed.status).toBe('running');
-        expect(resumed.startedAt).toBeInstanceOf(Date);
-      });
-    });
   });
 
   describe('steps', () => {
     let testRunId: string;
 
     beforeEach(async () => {
-      const run = await runs.create({
+      const run = await createRun(events, {
         deploymentId: 'deployment-123',
         workflowName: 'test-workflow',
         input: [],
@@ -327,7 +367,7 @@ describe('Storage (Postgres integration)', () => {
           input: ['input1', 'input2'],
         };
 
-        const step = await steps.create(testRunId, stepData);
+        const step = await createStep(events, testRunId, stepData);
 
         expect(step).toEqual({
           runId: testRunId,
@@ -336,9 +376,9 @@ describe('Storage (Postgres integration)', () => {
           status: 'pending',
           input: ['input1', 'input2'],
           output: undefined,
-          error: undefined,
+          lastKnownError: undefined,
           attempt: 0, // steps are created with attempt 0
-          startedAt: undefined,
+          firstStartedAt: undefined,
           completedAt: undefined,
           createdAt: expect.any(Date),
           updatedAt: expect.any(Date),
@@ -348,7 +388,7 @@ describe('Storage (Postgres integration)', () => {
 
     describe('get', () => {
       it('should retrieve a step with runId and stepId', async () => {
-        const created = await steps.create(testRunId, {
+        const created = await createStep(events, testRunId, {
           stepId: 'step-123',
           stepName: 'test-step',
           input: ['input1'],
@@ -360,7 +400,7 @@ describe('Storage (Postgres integration)', () => {
       });
 
       it('should retrieve a step with only stepId', async () => {
-        const created = await steps.create(testRunId, {
+        const created = await createStep(events, testRunId, {
           stepId: 'unique-step-123',
           stepName: 'test-step',
           input: ['input1'],
@@ -378,83 +418,76 @@ describe('Storage (Postgres integration)', () => {
       });
     });
 
-    describe('update', () => {
-      it('should update step status to running', async () => {
-        await steps.create(testRunId, {
+    describe('update via events', () => {
+      it('should update step status to running via step_started event', async () => {
+        await createStep(events, testRunId, {
           stepId: 'step-123',
           stepName: 'test-step',
           input: ['input1'],
         });
 
-        const updated = await steps.update(testRunId, 'step-123', {
-          status: 'running',
-        });
+        const updated = await updateStep(
+          events,
+          testRunId,
+          'step-123',
+          'step_started',
+          {} // step_started no longer needs attempt in eventData - World increments it
+        );
 
         expect(updated.status).toBe('running');
-        expect(updated.startedAt).toBeInstanceOf(Date);
+        expect(updated.firstStartedAt).toBeInstanceOf(Date);
+        expect(updated.attempt).toBe(1); // Incremented by step_started
       });
 
-      it('should update step status to completed', async () => {
-        await steps.create(testRunId, {
+      it('should update step status to completed via step_completed event', async () => {
+        await createStep(events, testRunId, {
           stepId: 'step-123',
           stepName: 'test-step',
           input: ['input1'],
         });
 
-        const updated = await steps.update(testRunId, 'step-123', {
-          status: 'completed',
-          output: ['ok'],
-        });
+        const updated = await updateStep(
+          events,
+          testRunId,
+          'step-123',
+          'step_completed',
+          { result: ['ok'] }
+        );
 
         expect(updated.status).toBe('completed');
         expect(updated.completedAt).toBeInstanceOf(Date);
         expect(updated.output).toEqual(['ok']);
       });
 
-      it('should update step status to failed', async () => {
-        await steps.create(testRunId, {
+      it('should update step status to failed via step_failed event', async () => {
+        await createStep(events, testRunId, {
           stepId: 'step-123',
           stepName: 'test-step',
           input: ['input1'],
         });
 
-        const updated = await steps.update(testRunId, 'step-123', {
-          status: 'failed',
-          error: {
-            message: 'Step failed',
-            code: 'STEP_ERR',
-          },
-        });
+        const updated = await updateStep(
+          events,
+          testRunId,
+          'step-123',
+          'step_failed',
+          { error: 'Step failed', fatal: true }
+        );
 
         expect(updated.status).toBe('failed');
-        expect(updated.error?.message).toBe('Step failed');
-        expect(updated.error?.code).toBe('STEP_ERR');
+        expect(updated.lastKnownError?.message).toBe('Step failed');
         expect(updated.completedAt).toBeInstanceOf(Date);
       });
-
-      it('should update attempt count', async () => {
-        await steps.create(testRunId, {
-          stepId: 'step-123',
-          stepName: 'test-step',
-          input: ['input1'],
-        });
-
-        const updated = await steps.update(testRunId, 'step-123', {
-          attempt: 2,
-        });
-
-        expect(updated.attempt).toBe(2);
-      });
     });
 
     describe('list', () => {
       it('should list all steps for a run', async () => {
-        const step1 = await steps.create(testRunId, {
+        const step1 = await createStep(events, testRunId, {
           stepId: 'step-1',
           stepName: 'first-step',
           input: [],
         });
-        const step2 = await steps.create(testRunId, {
+        const step2 = await createStep(events, testRunId, {
           stepId: 'step-2',
           stepName: 'second-step',
           input: [],
@@ -476,7 +509,7 @@ describe('Storage (Postgres integration)', () => {
       it('should support pagination', async () => {
         // Create multiple steps
         for (let i = 0; i < 5; i++) {
-          await steps.create(testRunId, {
+          await createStep(events, testRunId, {
             stepId: `step-${i}`,
             stepName: `step-name-${i}`,
             input: [],
@@ -506,7 +539,7 @@ describe('Storage (Postgres integration)', () => {
     let testRunId: string;
 
     beforeEach(async () => {
-      const run = await runs.create({
+      const run = await createRun(events, {
         deploymentId: 'deployment-123',
         workflowName: 'test-workflow',
         input: [],
@@ -521,27 +554,27 @@ describe('Storage (Postgres integration)', () => {
           correlationId: 'corr_123',
         };
 
-        const event = await events.create(testRunId, eventData);
+        const result = await events.create(testRunId, eventData);
 
-        expect(event.runId).toBe(testRunId);
-        expect(event.eventId).toMatch(/^wevt_/);
-        expect(event.eventType).toBe('step_started');
-        expect(event.correlationId).toBe('corr_123');
-        expect(event.createdAt).toBeInstanceOf(Date);
+        expect(result.event.runId).toBe(testRunId);
+        expect(result.event.eventId).toMatch(/^wevt_/);
+        expect(result.event.eventType).toBe('step_started');
+        expect(result.event.correlationId).toBe('corr_123');
+        expect(result.event.createdAt).toBeInstanceOf(Date);
       });
 
       it('should create a new event with null byte in payload', async () => {
-        const event = await events.create(testRunId, {
+        const result = await events.create(testRunId, {
           eventType: 'step_failed',
           correlationId: 'corr_123',
           eventData: { error: 'Error with null byte \u0000 in message' },
         });
 
-        expect(event.runId).toBe(testRunId);
-        expect(event.eventId).toMatch(/^wevt_/);
-        expect(event.eventType).toBe('step_failed');
-        expect(event.correlationId).toBe('corr_123');
-        expect(event.createdAt).toBeInstanceOf(Date);
+        expect(result.event.runId).toBe(testRunId);
+        expect(result.event.eventId).toMatch(/^wevt_/);
+        expect(result.event.eventType).toBe('step_failed');
+        expect(result.event.correlationId).toBe('corr_123');
+        expect(result.event.createdAt).toBeInstanceOf(Date);
       });
 
       it('should handle workflow completed events', async () => {
@@ -549,23 +582,23 @@ describe('Storage (Postgres integration)', () => {
           eventType: 'workflow_completed' as const,
         };
 
-        const event = await events.create(testRunId, eventData);
+        const result = await events.create(testRunId, eventData);
 
-        expect(event.eventType).toBe('workflow_completed');
-        expect(event.correlationId).toBeUndefined();
+        expect(result.event.eventType).toBe('workflow_completed');
+        expect(result.event.correlationId).toBeUndefined();
       });
     });
 
     describe('list', () => {
       it('should list all events for a run', async () => {
-        const event1 = await events.create(testRunId, {
+        const result1 = await events.create(testRunId, {
           eventType: 'workflow_started' as const,
         });
 
         // Small delay to ensure different timestamps in event IDs
         await new Promise((resolve) => setTimeout(resolve, 2));
 
-        const event2 = await events.create(testRunId, {
+        const result2 = await events.create(testRunId, {
           eventType: 'step_started' as const,
           correlationId: 'corr-step-1',
         });
@@ -575,24 +608,26 @@ describe('Storage (Postgres integration)', () => {
           pagination: { sortOrder: 'asc' }, // Explicitly request ascending order
         });
 
-        expect(result.data).toHaveLength(2);
+        // 3 events: run_created (from createRun), workflow_started, step_started
+        expect(result.data).toHaveLength(3);
         // Should be in chronological order (oldest first)
-        expect(result.data[0].eventId).toBe(event1.eventId);
-        expect(result.data[1].eventId).toBe(event2.eventId);
-        expect(result.data[1].createdAt.getTime()).toBeGreaterThanOrEqual(
-          result.data[0].createdAt.getTime()
+        expect(result.data[0].eventType).toBe('run_created');
+        expect(result.data[1].eventId).toBe(result1.event.eventId);
+        expect(result.data[2].eventId).toBe(result2.event.eventId);
+        expect(result.data[2].createdAt.getTime()).toBeGreaterThanOrEqual(
+          result.data[1].createdAt.getTime()
         );
       });
 
       it('should list events in descending order when explicitly requested (newest first)', async () => {
-        const event1 = await events.create(testRunId, {
+        const result1 = await events.create(testRunId, {
           eventType: 'workflow_started' as const,
         });
 
         // Small delay to ensure different timestamps in event IDs
         await new Promise((resolve) => setTimeout(resolve, 2));
 
-        const event2 = await events.create(testRunId, {
+        const result2 = await events.create(testRunId, {
           eventType: 'step_started' as const,
           correlationId: 'corr-step-1',
         });
@@ -602,10 +637,12 @@ describe('Storage (Postgres integration)', () => {
           pagination: { sortOrder: 'desc' },
         });
 
-        expect(result.data).toHaveLength(2);
+        // 3 events: run_created (from createRun), workflow_started, step_started
+        expect(result.data).toHaveLength(3);
         // Should be in reverse chronological order (newest first)
-        expect(result.data[0].eventId).toBe(event2.eventId);
-        expect(result.data[1].eventId).toBe(event1.eventId);
+        expect(result.data[0].eventId).toBe(result2.event.eventId);
+        expect(result.data[1].eventId).toBe(result1.event.eventId);
+        expect(result.data[2].eventType).toBe('run_created');
         expect(result.data[0].createdAt.getTime()).toBeGreaterThanOrEqual(
           result.data[1].createdAt.getTime()
         );
@@ -644,14 +681,14 @@ describe('Storage (Postgres integration)', () => {
         const correlationId = 'step-abc123';
 
         // Create events with the target correlation ID
-        const event1 = await events.create(testRunId, {
+        const result1 = await events.create(testRunId, {
           eventType: 'step_started',
           correlationId,
         });
 
         await new Promise((resolve) => setTimeout(resolve, 2));
 
-        const event2 = await events.create(testRunId, {
+        const result2 = await events.create(testRunId, {
           eventType: 'step_completed',
           correlationId,
           eventData: { result: 'success' },
@@ -672,9 +709,9 @@ describe('Storage (Postgres integration)', () => {
         });
 
         expect(result.data).toHaveLength(2);
-        expect(result.data[0].eventId).toBe(event1.eventId);
+        expect(result.data[0].eventId).toBe(result1.event.eventId);
         expect(result.data[0].correlationId).toBe(correlationId);
-        expect(result.data[1].eventId).toBe(event2.eventId);
+        expect(result.data[1].eventId).toBe(result2.event.eventId);
         expect(result.data[1].correlationId).toBe(correlationId);
       });
 
@@ -682,21 +719,22 @@ describe('Storage (Postgres integration)', () => {
         const correlationId = 'hook-xyz789';
 
         // Create another run
-        const run2 = await runs.create({
+        const run2 = await createRun(events, {
           deploymentId: 'deployment-456',
           workflowName: 'test-workflow-2',
           input: [],
         });
 
         // Create events in both runs with same correlation ID
-        const event1 = await events.create(testRunId, {
+        const result1 = await events.create(testRunId, {
           eventType: 'hook_created',
           correlationId,
+          eventData: { token: 'test-token-1' },
         });
 
         await new Promise((resolve) => setTimeout(resolve, 2));
 
-        const event2 = await events.create(run2.runId, {
+        const result2 = await events.create(run2.runId, {
           eventType: 'hook_received',
           correlationId,
           eventData: { payload: { data: 'test' } },
@@ -704,7 +742,7 @@ describe('Storage (Postgres integration)', () => {
 
         await new Promise((resolve) => setTimeout(resolve, 2));
 
-        const event3 = await events.create(testRunId, {
+        const result3 = await events.create(testRunId, {
           eventType: 'hook_disposed',
           correlationId,
         });
@@ -715,11 +753,11 @@ describe('Storage (Postgres integration)', () => {
         });
 
         expect(result.data).toHaveLength(3);
-        expect(result.data[0].eventId).toBe(event1.eventId);
+        expect(result.data[0].eventId).toBe(result1.event.eventId);
         expect(result.data[0].runId).toBe(testRunId);
-        expect(result.data[1].eventId).toBe(event2.eventId);
+        expect(result.data[1].eventId).toBe(result2.event.eventId);
         expect(result.data[1].runId).toBe(run2.runId);
-        expect(result.data[2].eventId).toBe(event3.eventId);
+        expect(result.data[2].eventId).toBe(result3.event.eventId);
         expect(result.data[2].runId).toBe(testRunId);
       });
 
@@ -805,14 +843,14 @@ describe('Storage (Postgres integration)', () => {
         const correlationId = 'step-ordering';
 
         // Create events with slight delays to ensure different timestamps
-        const event1 = await events.create(testRunId, {
+        const result1 = await events.create(testRunId, {
           eventType: 'step_started',
           correlationId,
         });
 
         await new Promise((resolve) => setTimeout(resolve, 2));
 
-        const event2 = await events.create(testRunId, {
+        const result2 = await events.create(testRunId, {
           eventType: 'step_completed',
           correlationId,
           eventData: { result: 'success' },
@@ -824,8 +862,8 @@ describe('Storage (Postgres integration)', () => {
         });
 
         expect(result.data).toHaveLength(2);
-        expect(result.data[0].eventId).toBe(event1.eventId);
-        expect(result.data[1].eventId).toBe(event2.eventId);
+        expect(result.data[0].eventId).toBe(result1.event.eventId);
+        expect(result.data[1].eventId).toBe(result2.event.eventId);
         expect(result.data[0].createdAt.getTime()).toBeLessThanOrEqual(
           result.data[1].createdAt.getTime()
         );
@@ -834,14 +872,14 @@ describe('Storage (Postgres integration)', () => {
       it('should support descending order', async () => {
         const correlationId = 'step-desc-order';
 
-        const event1 = await events.create(testRunId, {
+        const result1 = await events.create(testRunId, {
           eventType: 'step_started',
           correlationId,
         });
 
         await new Promise((resolve) => setTimeout(resolve, 2));
 
-        const event2 = await events.create(testRunId, {
+        const result2 = await events.create(testRunId, {
           eventType: 'step_completed',
           correlationId,
           eventData: { result: 'success' },
@@ -853,8 +891,8 @@ describe('Storage (Postgres integration)', () => {
         });
 
         expect(result.data).toHaveLength(2);
-        expect(result.data[0].eventId).toBe(event2.eventId);
-        expect(result.data[1].eventId).toBe(event1.eventId);
+        expect(result.data[0].eventId).toBe(result2.event.eventId);
+        expect(result.data[1].eventId).toBe(result1.event.eventId);
         expect(result.data[0].createdAt.getTime()).toBeGreaterThanOrEqual(
           result.data[1].createdAt.getTime()
         );
@@ -864,14 +902,15 @@ describe('Storage (Postgres integration)', () => {
         const hookId = 'hook_test123';
 
         // Create a typical hook lifecycle
-        const created = await events.create(testRunId, {
+        const createdResult = await events.create(testRunId, {
           eventType: 'hook_created' as const,
           correlationId: hookId,
+          eventData: { token: 'lifecycle-test-token' },
         });
 
         await new Promise((resolve) => setTimeout(resolve, 2));
 
-        const received1 = await events.create(testRunId, {
+        const received1Result = await events.create(testRunId, {
           eventType: 'hook_received' as const,
           correlationId: hookId,
           eventData: { payload: { request: 1 } },
@@ -879,7 +918,7 @@ describe('Storage (Postgres integration)', () => {
 
         await new Promise((resolve) => setTimeout(resolve, 2));
 
-        const received2 = await events.create(testRunId, {
+        const received2Result = await events.create(testRunId, {
           eventType: 'hook_received' as const,
           correlationId: hookId,
           eventData: { payload: { request: 2 } },
@@ -887,7 +926,7 @@ describe('Storage (Postgres integration)', () => {
 
         await new Promise((resolve) => setTimeout(resolve, 2));
 
-        const disposed = await events.create(testRunId, {
+        const disposedResult = await events.create(testRunId, {
           eventType: 'hook_disposed' as const,
           correlationId: hookId,
         });
@@ -898,13 +937,13 @@ describe('Storage (Postgres integration)', () => {
         });
 
         expect(result.data).toHaveLength(4);
-        expect(result.data[0].eventId).toBe(created.eventId);
+        expect(result.data[0].eventId).toBe(createdResult.event.eventId);
         expect(result.data[0].eventType).toBe('hook_created');
-        expect(result.data[1].eventId).toBe(received1.eventId);
+        expect(result.data[1].eventId).toBe(received1Result.event.eventId);
         expect(result.data[1].eventType).toBe('hook_received');
-        expect(result.data[2].eventId).toBe(received2.eventId);
+        expect(result.data[2].eventId).toBe(received2Result.event.eventId);
         expect(result.data[2].eventType).toBe('hook_received');
-        expect(result.data[3].eventId).toBe(disposed.eventId);
+        expect(result.data[3].eventId).toBe(disposedResult.event.eventId);
         expect(result.data[3].eventType).toBe('hook_disposed');
       });
     });
diff --git a/packages/world-vercel/src/events.ts b/packages/world-vercel/src/events.ts
index 8b94d03bf..adc49953e 100644
--- a/packages/world-vercel/src/events.ts
+++ b/packages/world-vercel/src/events.ts
@@ -1,13 +1,17 @@
 import {
+  type AnyEventRequest,
   type CreateEventParams,
-  type CreateEventRequest,
   type Event,
+  type EventResult,
   EventSchema,
   EventTypeSchema,
+  HookSchema,
   type ListEventsByCorrelationIdParams,
   type ListEventsParams,
   type PaginatedResponse,
   PaginatedResponseSchema,
+  StepSchema,
+  WorkflowRunSchema,
 } from '@workflow/world';
 import z from 'zod';
 import type { APIConfig } from './utils.js';
@@ -26,6 +30,14 @@ function filterEventData(event: any, resolveData: 'none' | 'all'): Event {
   return event;
 }
 
+// Schema for EventResult returned by events.create
+const EventResultSchema = z.object({
+  event: EventSchema,
+  run: WorkflowRunSchema.optional(),
+  step: StepSchema.optional(),
+  hook: HookSchema.optional(),
+});
+
 // Would usually "EventSchema.omit({ eventData: true })" but that doesn't work
 // on zod unions. Re-creating the schema manually.
 const EventWithRefsSchema = z.object({
@@ -89,22 +101,28 @@ export async function getWorkflowRunEvents(
 }
 
 export async function createWorkflowRunEvent(
-  id: string,
-  data: CreateEventRequest,
+  id: string | null,
+  data: AnyEventRequest,
   params?: CreateEventParams,
   config?: APIConfig
-): Promise<Event> {
+): Promise<EventResult> {
   const resolveData = params?.resolveData ?? DEFAULT_RESOLVE_DATA_OPTION;
 
-  const event = await makeRequest({
-    endpoint: `/v1/runs/${id}/events`,
+  // For run_created events, runId is null - use "null" string in the URL path
+  const runIdPath = id === null ? 'null' : id;
+
+  const result = await makeRequest({
+    endpoint: `/v2/runs/${runIdPath}/events`,
     options: {
       method: 'POST',
       body: JSON.stringify(data, dateToStringReplacer),
     },
     config,
-    schema: EventSchema,
+    schema: EventResultSchema,
   });
 
-  return filterEventData(event, resolveData);
+  return {
+    ...result,
+    event: filterEventData(result.event, resolveData),
+  };
 }
diff --git a/packages/world-vercel/src/steps.ts b/packages/world-vercel/src/steps.ts
index 83233446d..d7df075c1 100644
--- a/packages/world-vercel/src/steps.ts
+++ b/packages/world-vercel/src/steps.ts
@@ -13,24 +13,28 @@ import type { APIConfig } from './utils.js';
 import {
   DEFAULT_RESOLVE_DATA_OPTION,
   dateToStringReplacer,
-  deserializeError,
   makeRequest,
-  serializeError,
 } from './utils.js';
 
 /**
  * Wire format schema for steps coming from the backend.
- * The backend returns error as a JSON string, not an object, so we need
- * a schema that accepts the wire format before deserialization.
+ * The backend returns:
+ * - error/errorRef as a JSON string (maps to lastKnownError in Step interface)
+ * - startedAt (maps to firstStartedAt in Step interface)
  *
- * This is used for validation in makeRequest(), then deserializeStepError()
- * transforms the string into the expected StructuredError object.
+ * This is used for validation in makeRequest(), then deserializeStep()
+ * transforms the wire format into the expected Step interface.
  */
 const StepWireSchema = StepSchema.omit({
-  error: true,
+  lastKnownError: true,
+  firstStartedAt: true,
 }).extend({
   // Backend returns error as a JSON string, not an object
+  // This will be deserialized and mapped to lastKnownError
   error: z.string().optional(),
+  errorRef: z.any().optional(),
+  // Backend returns startedAt, which maps to firstStartedAt
+  startedAt: z.coerce.date().optional(),
 });
 
 // Wire schema for lazy mode with refs instead of data
@@ -45,18 +49,60 @@ const StepWireWithRefsSchema = StepWireSchema.omit({
   output: z.any().optional(),
 });
 
+/**
+ * Transform step from wire format to Step interface format.
+ * Maps:
+ * - error/errorRef → lastKnownError (deserializing JSON string to StructuredError)
+ * - startedAt → firstStartedAt
+ */
+function deserializeStep(wireStep: any): Step {
+  const { error, errorRef, startedAt, ...rest } = wireStep;
+
+  // Map startedAt to firstStartedAt
+  const result: any = {
+    ...rest,
+    firstStartedAt: startedAt,
+  };
+
+  // Deserialize error from JSON string to StructuredError
+  // The backend stores error as errorRef (JSON string) or error (legacy)
+  const errorSource = errorRef ?? error;
+  if (errorSource) {
+    if (typeof errorSource === 'string') {
+      try {
+        const parsed = JSON.parse(errorSource);
+        if (typeof parsed === 'object' && parsed.message !== undefined) {
+          result.lastKnownError = {
+            message: parsed.message,
+            stack: parsed.stack,
+            code: parsed.code,
+          };
+        }
+      } catch {
+        // Not JSON, treat as plain string
+        result.lastKnownError = { message: errorSource };
+      }
+    } else if (typeof errorSource === 'object' && errorSource.message) {
+      // Already an object (e.g., from resolved ref)
+      result.lastKnownError = errorSource;
+    }
+  }
+
+  return result as Step;
+}
+
 // Helper to filter step data based on resolveData setting
 function filterStepData(step: any, resolveData: 'none' | 'all'): Step {
   if (resolveData === 'none') {
     const { inputRef: _inputRef, outputRef: _outputRef, ...rest } = step;
-    const deserialized = deserializeError<Step>(rest);
+    const deserialized = deserializeStep(rest);
     return {
       ...deserialized,
       input: [],
       output: undefined,
     };
   }
-  return deserializeError<Step>(step);
+  return deserializeStep(step);
 }
 
 // Functions
@@ -113,7 +159,7 @@ export async function createStep(
     config,
     schema: StepWireSchema,
   });
-  return deserializeError<Step>(step);
+  return deserializeStep(step);
 }
 
 export async function updateStep(
@@ -122,17 +168,22 @@ export async function updateStep(
   data: UpdateStepRequest,
   config?: APIConfig
 ): Promise<Step> {
-  const serialized = serializeError(data);
+  // Map interface field names to wire format field names
+  const { lastKnownError, ...rest } = data;
+  const wireData: any = { ...rest };
+  if (lastKnownError) {
+    wireData.error = JSON.stringify(lastKnownError);
+  }
   const step = await makeRequest({
     endpoint: `/v1/runs/${runId}/steps/${stepId}`,
     options: {
       method: 'PUT',
-      body: JSON.stringify(serialized, dateToStringReplacer),
+      body: JSON.stringify(wireData, dateToStringReplacer),
     },
     config,
     schema: StepWireSchema,
   });
-  return deserializeError<Step>(step);
+  return deserializeStep(step);
 }
 
 export async function getStep(
diff --git a/packages/world-vercel/src/storage.ts b/packages/world-vercel/src/storage.ts
index 51c5a8eaf..da874bbf7 100644
--- a/packages/world-vercel/src/storage.ts
+++ b/packages/world-vercel/src/storage.ts
@@ -1,45 +1,19 @@
 import type { Storage } from '@workflow/world';
 import { createWorkflowRunEvent, getWorkflowRunEvents } from './events.js';
-import {
-  createHook,
-  disposeHook,
-  getHook,
-  getHookByToken,
-  listHooks,
-} from './hooks.js';
-import {
-  cancelWorkflowRun,
-  createWorkflowRun,
-  getWorkflowRun,
-  listWorkflowRuns,
-  pauseWorkflowRun,
-  resumeWorkflowRun,
-  updateWorkflowRun,
-} from './runs.js';
-import {
-  createStep,
-  getStep,
-  listWorkflowRunSteps,
-  updateStep,
-} from './steps.js';
+import { getHook, getHookByToken, listHooks } from './hooks.js';
+import { getWorkflowRun, listWorkflowRuns } from './runs.js';
+import { getStep, listWorkflowRunSteps } from './steps.js';
 import type { APIConfig } from './utils.js';
 
 export function createStorage(config?: APIConfig): Storage {
   return {
     // Storage interface with namespaced methods
     runs: {
-      create: (data) => createWorkflowRun(data, config),
       get: (id, params) => getWorkflowRun(id, params, config),
-      update: (id, data) => updateWorkflowRun(id, data, config),
       list: (params) => listWorkflowRuns(params, config),
-      cancel: (id, params) => cancelWorkflowRun(id, params, config),
-      pause: (id, params) => pauseWorkflowRun(id, params, config),
-      resume: (id, params) => resumeWorkflowRun(id, params, config),
     },
     steps: {
-      create: (runId, data) => createStep(runId, data, config),
       get: (runId, stepId, params) => getStep(runId, stepId, params, config),
-      update: (runId, stepId, data) => updateStep(runId, stepId, data, config),
       list: (params) => listWorkflowRunSteps(params, config),
     },
     events: {
@@ -49,11 +23,9 @@ export function createStorage(config?: APIConfig): Storage {
       listByCorrelationId: (params) => getWorkflowRunEvents(params, config),
     },
     hooks: {
-      create: (runId, data) => createHook(runId, data, config),
       get: (hookId, params) => getHook(hookId, params, config),
       getByToken: (token) => getHookByToken(token, config),
       list: (params) => listHooks(params, config),
-      dispose: (hookId) => disposeHook(hookId, config),
     },
   };
 }
diff --git a/packages/world/src/events.ts b/packages/world/src/events.ts
index 56a9082e3..cb7856e9e 100644
--- a/packages/world/src/events.ts
+++ b/packages/world/src/events.ts
@@ -3,15 +3,28 @@ import type { PaginationOptions, ResolveData } from './shared.js';
 
 // Event type enum
 export const EventTypeSchema = z.enum([
+  // Run lifecycle events
+  'run_created',
+  'run_started',
+  'run_completed',
+  'run_failed',
+  'run_cancelled',
+  'run_paused',
+  'run_resumed',
+  // Step lifecycle events
+  'step_created',
   'step_completed',
   'step_failed',
   'step_retrying',
   'step_started',
+  // Hook lifecycle events
   'hook_created',
   'hook_received',
   'hook_disposed',
+  // Wait lifecycle events
   'wait_created',
   'wait_completed',
+  // Legacy workflow events (deprecated, use run_* instead)
   'workflow_completed',
   'workflow_failed',
   'workflow_started',
@@ -45,24 +58,55 @@ const StepFailedEventSchema = BaseEventSchema.extend({
   }),
 });
 
-// TODO: this is not actually used anywhere yet, we could remove it
-// on client and server if needed
+/**
+ * Event created when a step fails and will be retried.
+ * Sets the step status back to 'pending' and records the error.
+ * The error is stored in step.lastKnownError for debugging.
+ */
 const StepRetryingEventSchema = BaseEventSchema.extend({
   eventType: z.literal('step_retrying'),
   correlationId: z.string(),
   eventData: z.object({
-    attempt: z.number().min(1),
+    error: z.any(),
+    stack: z.string().optional(),
+    retryAfter: z.coerce.date().optional(),
   }),
 });
 
 const StepStartedEventSchema = BaseEventSchema.extend({
   eventType: z.literal('step_started'),
   correlationId: z.string(),
+  eventData: z
+    .object({
+      attempt: z.number().optional(),
+    })
+    .optional(),
+});
+
+/**
+ * Event created when a step is first invoked. The World implementation
+ * atomically creates both the event and the step entity.
+ */
+const StepCreatedEventSchema = BaseEventSchema.extend({
+  eventType: z.literal('step_created'),
+  correlationId: z.string(),
+  eventData: z.object({
+    stepName: z.string(),
+    input: z.any(), // SerializedData
+  }),
 });
 
+/**
+ * Event created when a hook is first invoked. The World implementation
+ * atomically creates both the event and the hook entity.
+ */
 const HookCreatedEventSchema = BaseEventSchema.extend({
   eventType: z.literal('hook_created'),
   correlationId: z.string(),
+  eventData: z.object({
+    token: z.string(),
+    metadata: z.any().optional(), // SerializedData
+  }),
 });
 
 const HookReceivedEventSchema = BaseEventSchema.extend({
@@ -91,12 +135,89 @@ const WaitCompletedEventSchema = BaseEventSchema.extend({
   correlationId: z.string(),
 });
 
-// TODO: not used yet
+// =============================================================================
+// Run lifecycle events
+// =============================================================================
+
+/**
+ * Event created when a workflow run is first created. The World implementation
+ * atomically creates both the event and the run entity with status 'pending'.
+ */
+const RunCreatedEventSchema = BaseEventSchema.extend({
+  eventType: z.literal('run_created'),
+  eventData: z.object({
+    deploymentId: z.string(),
+    workflowName: z.string(),
+    input: z.array(z.any()), // SerializedData[]
+    executionContext: z.record(z.string(), z.any()).optional(),
+  }),
+});
+
+/**
+ * Event created when a workflow run starts executing.
+ * Updates the run entity to status 'running'.
+ */
+const RunStartedEventSchema = BaseEventSchema.extend({
+  eventType: z.literal('run_started'),
+});
+
+/**
+ * Event created when a workflow run completes successfully.
+ * Updates the run entity to status 'completed' with output.
+ */
+const RunCompletedEventSchema = BaseEventSchema.extend({
+  eventType: z.literal('run_completed'),
+  eventData: z.object({
+    output: z.any().optional(), // SerializedData
+  }),
+});
+
+/**
+ * Event created when a workflow run fails.
+ * Updates the run entity to status 'failed' with error.
+ */
+const RunFailedEventSchema = BaseEventSchema.extend({
+  eventType: z.literal('run_failed'),
+  eventData: z.object({
+    error: z.any(),
+    errorCode: z.string().optional(),
+  }),
+});
+
+/**
+ * Event created when a workflow run is cancelled.
+ * Updates the run entity to status 'cancelled'.
+ */
+const RunCancelledEventSchema = BaseEventSchema.extend({
+  eventType: z.literal('run_cancelled'),
+});
+
+/**
+ * Event created when a workflow run is paused.
+ * Updates the run entity to status 'paused'.
+ */
+const RunPausedEventSchema = BaseEventSchema.extend({
+  eventType: z.literal('run_paused'),
+});
+
+/**
+ * Event created when a workflow run is resumed from paused state.
+ * Updates the run entity to status 'running'.
+ */
+const RunResumedEventSchema = BaseEventSchema.extend({
+  eventType: z.literal('run_resumed'),
+});
+
+// =============================================================================
+// Legacy workflow events (deprecated, use run_* events instead)
+// =============================================================================
+
+/** @deprecated Use run_completed instead */
 const WorkflowCompletedEventSchema = BaseEventSchema.extend({
   eventType: z.literal('workflow_completed'),
 });
 
-// TODO: not used yet
+/** @deprecated Use run_failed instead */
 const WorkflowFailedEventSchema = BaseEventSchema.extend({
   eventType: z.literal('workflow_failed'),
   eventData: z.object({
@@ -104,22 +225,35 @@ const WorkflowFailedEventSchema = BaseEventSchema.extend({
   }),
 });
 
-// TODO: not used yet
+/** @deprecated Use run_started instead */
 const WorkflowStartedEventSchema = BaseEventSchema.extend({
   eventType: z.literal('workflow_started'),
 });
 
 // Discriminated union (used for both creation requests and server responses)
 export const CreateEventSchema = z.discriminatedUnion('eventType', [
+  // Run lifecycle events
+  RunCreatedEventSchema,
+  RunStartedEventSchema,
+  RunCompletedEventSchema,
+  RunFailedEventSchema,
+  RunCancelledEventSchema,
+  RunPausedEventSchema,
+  RunResumedEventSchema,
+  // Step lifecycle events
+  StepCreatedEventSchema,
   StepCompletedEventSchema,
   StepFailedEventSchema,
   StepRetryingEventSchema,
   StepStartedEventSchema,
+  // Hook lifecycle events
   HookCreatedEventSchema,
   HookReceivedEventSchema,
   HookDisposedEventSchema,
+  // Wait lifecycle events
   WaitCreatedEventSchema,
   WaitCompletedEventSchema,
+  // Legacy workflow events (deprecated)
   WorkflowCompletedEventSchema,
   WorkflowFailedEventSchema,
   WorkflowStartedEventSchema,
@@ -136,13 +270,49 @@ export const EventSchema = CreateEventSchema.and(
 
 // Inferred types
 export type Event = z.infer<typeof EventSchema>;
-export type CreateEventRequest = z.infer<typeof CreateEventSchema>;
 export type HookReceivedEvent = z.infer<typeof HookReceivedEventSchema>;
 
+/**
+ * Union of all possible event request types.
+ * @internal Use CreateEventRequest or RunCreatedEventRequest instead.
+ */
+export type AnyEventRequest = z.infer<typeof CreateEventSchema>;
+
+/**
+ * Event request for creating a new workflow run.
+ * Must be used with runId: null since the server generates the runId.
+ */
+export type RunCreatedEventRequest = z.infer<typeof RunCreatedEventSchema>;
+
+/**
+ * Event request types that require an existing runId.
+ * This is the common case for all events except run_created.
+ */
+export type CreateEventRequest = Exclude<
+  AnyEventRequest,
+  RunCreatedEventRequest
+>;
+
 export interface CreateEventParams {
   resolveData?: ResolveData;
 }
 
+/**
+ * Result of creating an event. Includes the created event and optionally
+ * the entity that was created or updated as a result of the event.
+ * This reduces round-trips by returning entity data along with the event.
+ */
+export interface EventResult {
+  /** The created event */
+  event: Event;
+  /** The workflow run entity (for run_* events) */
+  run?: import('./runs.js').WorkflowRun;
+  /** The step entity (for step_* events) */
+  step?: import('./steps.js').Step;
+  /** The hook entity (for hook_created events) */
+  hook?: import('./hooks.js').Hook;
+}
+
 export interface ListEventsParams {
   runId: string;
   pagination?: PaginationOptions;
diff --git a/packages/world/src/interfaces.ts b/packages/world/src/interfaces.ts
index 0c22703f9..a84d5c205 100644
--- a/packages/world/src/interfaces.ts
+++ b/packages/world/src/interfaces.ts
@@ -2,33 +2,23 @@ import type {
   CreateEventParams,
   CreateEventRequest,
   Event,
+  EventResult,
   ListEventsByCorrelationIdParams,
   ListEventsParams,
+  RunCreatedEventRequest,
 } from './events.js';
-import type {
-  CreateHookRequest,
-  GetHookParams,
-  Hook,
-  ListHooksParams,
-} from './hooks.js';
+import type { GetHookParams, Hook, ListHooksParams } from './hooks.js';
 import type { Queue } from './queue.js';
 import type {
-  CancelWorkflowRunParams,
-  CreateWorkflowRunRequest,
   GetWorkflowRunParams,
   ListWorkflowRunsParams,
-  PauseWorkflowRunParams,
-  ResumeWorkflowRunParams,
-  UpdateWorkflowRunRequest,
   WorkflowRun,
 } from './runs.js';
 import type { PaginatedResponse } from './shared.js';
 import type {
-  CreateStepRequest,
   GetStepParams,
   ListWorkflowRunStepsParams,
   Step,
-  UpdateStepRequest,
 } from './steps.js';
 
 export interface Streamer {
@@ -45,40 +35,69 @@ export interface Streamer {
   listStreamsByRunId(runId: string): Promise<string[]>;
 }
 
+/**
+ * Storage interface for workflow data.
+ *
+ * All entity mutations (runs, steps, hooks) MUST go through events.create().
+ * The World implementation atomically creates the entity when processing the corresponding event.
+ *
+ * Entity methods are read-only:
+ * - runs: get, list
+ * - steps: get, list
+ * - hooks: get, getByToken, list
+ *
+ * State changes (cancel, pause, resume, dispose) are done via events:
+ * - run_cancelled, run_paused, run_resumed events for run state changes
+ * - hook_disposed event for hook disposal
+ */
 export interface Storage {
   runs: {
-    create(data: CreateWorkflowRunRequest): Promise<WorkflowRun>;
     get(id: string, params?: GetWorkflowRunParams): Promise<WorkflowRun>;
-    update(id: string, data: UpdateWorkflowRunRequest): Promise<WorkflowRun>;
     list(
       params?: ListWorkflowRunsParams
     ): Promise<PaginatedResponse<WorkflowRun>>;
-    cancel(id: string, params?: CancelWorkflowRunParams): Promise<WorkflowRun>;
-    pause(id: string, params?: PauseWorkflowRunParams): Promise<WorkflowRun>;
-    resume(id: string, params?: ResumeWorkflowRunParams): Promise<WorkflowRun>;
   };
 
   steps: {
-    create(runId: string, data: CreateStepRequest): Promise<Step>;
     get(
       runId: string | undefined,
       stepId: string,
       params?: GetStepParams
     ): Promise<Step>;
-    update(
-      runId: string,
-      stepId: string,
-      data: UpdateStepRequest
-    ): Promise<Step>;
     list(params: ListWorkflowRunStepsParams): Promise<PaginatedResponse<Step>>;
   };
 
   events: {
+    /**
+     * Create a run_created event to start a new workflow run.
+     * The runId parameter must be null - the server generates and returns the runId.
+     *
+     * @param runId - Must be null for run_created events
+     * @param data - The run_created event data
+     * @param params - Optional parameters for event creation
+     * @returns Promise resolving to the created event and run entity
+     */
+    create(
+      runId: null,
+      data: RunCreatedEventRequest,
+      params?: CreateEventParams
+    ): Promise<EventResult>;
+
+    /**
+     * Create an event for an existing workflow run and atomically update the entity.
+     * Returns both the event and the affected entity (run/step/hook).
+     *
+     * @param runId - The workflow run ID (required for all events except run_created)
+     * @param data - The event to create
+     * @param params - Optional parameters for event creation
+     * @returns Promise resolving to the created event and affected entity
+     */
     create(
       runId: string,
       data: CreateEventRequest,
       params?: CreateEventParams
-    ): Promise<Event>;
+    ): Promise<EventResult>;
+
     list(params: ListEventsParams): Promise<PaginatedResponse<Event>>;
     listByCorrelationId(
       params: ListEventsByCorrelationIdParams
@@ -86,15 +105,9 @@ export interface Storage {
   };
 
   hooks: {
-    create(
-      runId: string,
-      data: CreateHookRequest,
-      params?: GetHookParams
-    ): Promise<Hook>;
     get(hookId: string, params?: GetHookParams): Promise<Hook>;
     getByToken(token: string, params?: GetHookParams): Promise<Hook>;
     list(params: ListHooksParams): Promise<PaginatedResponse<Hook>>;
-    dispose(hookId: string, params?: GetHookParams): Promise<Hook>;
   };
 }
 
diff --git a/packages/world/src/steps.ts b/packages/world/src/steps.ts
index 8c973f6b9..84bc9fd23 100644
--- a/packages/world/src/steps.ts
+++ b/packages/world/src/steps.ts
@@ -24,9 +24,18 @@ export const StepSchema = z.object({
   status: StepStatusSchema,
   input: z.array(z.any()),
   output: z.any().optional(),
-  error: StructuredErrorSchema.optional(),
+  /**
+   * The last known error from a step_retrying or step_failed event.
+   * This tracks the most recent error the step encountered, which may
+   * be from a retry attempt (step_retrying) or the final failure (step_failed).
+   */
+  lastKnownError: StructuredErrorSchema.optional(),
   attempt: z.number(),
-  startedAt: z.coerce.date().optional(),
+  /**
+   * When the step first started executing. Set by the first step_started event
+   * and not updated on subsequent retries.
+   */
+  firstStartedAt: z.coerce.date().optional(),
   completedAt: z.coerce.date().optional(),
   createdAt: z.coerce.date(),
   updatedAt: z.coerce.date(),
@@ -48,7 +57,7 @@ export interface UpdateStepRequest {
   attempt?: number;
   status?: StepStatus;
   output?: SerializedData;
-  error?: StructuredError;
+  lastKnownError?: StructuredError;
   retryAfter?: Date;
 }
 

From ce7fc09a22fcb45bc717bd8c0f8c56862157d3ae Mon Sep 17 00:00:00 2001
From: Pranay Prakash <pranay.gp@gmail.com>
Date: Mon, 22 Dec 2025 21:32:44 -0800
Subject: [PATCH 02/27] fix(world-vercel): handle wire format for step in event
 results
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

- Update StepWireSchema to accept error as either string or object
- Add deserializeStep function to events.ts to transform wire format
- Map startedAt -> firstStartedAt and error -> lastKnownError

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
---
 packages/world-vercel/src/events.ts | 86 ++++++++++++++++++++++++++---
 packages/world-vercel/src/steps.ts  | 34 +++++++++---
 2 files changed, 106 insertions(+), 14 deletions(-)

diff --git a/packages/world-vercel/src/events.ts b/packages/world-vercel/src/events.ts
index adc49953e..ca8ef99cc 100644
--- a/packages/world-vercel/src/events.ts
+++ b/packages/world-vercel/src/events.ts
@@ -10,6 +10,7 @@ import {
   type ListEventsParams,
   type PaginatedResponse,
   PaginatedResponseSchema,
+  type Step,
   StepSchema,
   WorkflowRunSchema,
 } from '@workflow/world';
@@ -21,6 +22,73 @@ import {
   makeRequest,
 } from './utils.js';
 
+/**
+ * Wire format schema for step in event results.
+ * Maps server field names to Step interface field names.
+ */
+const StepWireSchema = StepSchema.omit({
+  lastKnownError: true,
+  firstStartedAt: true,
+}).extend({
+  // Backend returns error either as:
+  // - A JSON string (legacy/lazy mode)
+  // - An object {message, stack} (when errorRef is resolved)
+  error: z
+    .union([
+      z.string(),
+      z.object({
+        message: z.string(),
+        stack: z.string().optional(),
+        code: z.string().optional(),
+      }),
+    ])
+    .optional(),
+  errorRef: z.any().optional(),
+  // Backend returns startedAt, which maps to firstStartedAt
+  startedAt: z.coerce.date().optional(),
+});
+
+/**
+ * Deserialize step from wire format to Step interface format.
+ */
+function deserializeStep(wireStep: z.infer<typeof StepWireSchema>): Step {
+  const { error, errorRef, startedAt, ...rest } = wireStep;
+
+  const result: any = {
+    ...rest,
+    firstStartedAt: startedAt,
+  };
+
+  // Deserialize error to StructuredError
+  const errorSource = errorRef ?? error;
+  if (errorSource) {
+    if (typeof errorSource === 'string') {
+      try {
+        const parsed = JSON.parse(errorSource);
+        if (typeof parsed === 'object' && parsed.message !== undefined) {
+          result.lastKnownError = {
+            message: parsed.message,
+            stack: parsed.stack,
+            code: parsed.code,
+          };
+        } else {
+          result.lastKnownError = { message: String(parsed) };
+        }
+      } catch {
+        result.lastKnownError = { message: errorSource };
+      }
+    } else if (typeof errorSource === 'object' && errorSource !== null) {
+      result.lastKnownError = {
+        message: errorSource.message ?? 'Unknown error',
+        stack: errorSource.stack,
+        code: errorSource.code,
+      };
+    }
+  }
+
+  return result as Step;
+}
+
 // Helper to filter event data based on resolveData setting
 function filterEventData(event: any, resolveData: 'none' | 'all'): Event {
   if (resolveData === 'none') {
@@ -30,11 +98,12 @@ function filterEventData(event: any, resolveData: 'none' | 'all'): Event {
   return event;
 }
 
-// Schema for EventResult returned by events.create
-const EventResultSchema = z.object({
+// Schema for EventResult wire format returned by events.create
+// Uses wire format schemas for step to handle field name mapping
+const EventResultWireSchema = z.object({
   event: EventSchema,
   run: WorkflowRunSchema.optional(),
-  step: StepSchema.optional(),
+  step: StepWireSchema.optional(),
   hook: HookSchema.optional(),
 });
 
@@ -111,18 +180,21 @@ export async function createWorkflowRunEvent(
   // For run_created events, runId is null - use "null" string in the URL path
   const runIdPath = id === null ? 'null' : id;
 
-  const result = await makeRequest({
+  const wireResult = await makeRequest({
     endpoint: `/v2/runs/${runIdPath}/events`,
     options: {
       method: 'POST',
       body: JSON.stringify(data, dateToStringReplacer),
     },
     config,
-    schema: EventResultSchema,
+    schema: EventResultWireSchema,
   });
 
+  // Transform wire format to interface format
   return {
-    ...result,
-    event: filterEventData(result.event, resolveData),
+    event: filterEventData(wireResult.event, resolveData),
+    run: wireResult.run,
+    step: wireResult.step ? deserializeStep(wireResult.step) : undefined,
+    hook: wireResult.hook,
   };
 }
diff --git a/packages/world-vercel/src/steps.ts b/packages/world-vercel/src/steps.ts
index d7df075c1..17cd42356 100644
--- a/packages/world-vercel/src/steps.ts
+++ b/packages/world-vercel/src/steps.ts
@@ -29,9 +29,20 @@ const StepWireSchema = StepSchema.omit({
   lastKnownError: true,
   firstStartedAt: true,
 }).extend({
-  // Backend returns error as a JSON string, not an object
+  // Backend returns error either as:
+  // - A JSON string (legacy/lazy mode)
+  // - An object {message, stack} (when errorRef is resolved)
   // This will be deserialized and mapped to lastKnownError
-  error: z.string().optional(),
+  error: z
+    .union([
+      z.string(),
+      z.object({
+        message: z.string(),
+        stack: z.string().optional(),
+        code: z.string().optional(),
+      }),
+    ])
+    .optional(),
   errorRef: z.any().optional(),
   // Backend returns startedAt, which maps to firstStartedAt
   startedAt: z.coerce.date().optional(),
@@ -64,8 +75,10 @@ function deserializeStep(wireStep: any): Step {
     firstStartedAt: startedAt,
   };
 
-  // Deserialize error from JSON string to StructuredError
-  // The backend stores error as errorRef (JSON string) or error (legacy)
+  // Deserialize error to StructuredError
+  // The backend returns error as:
+  // - errorRef: resolved object {message, stack} when remoteRefBehavior=resolve
+  // - error: JSON string (legacy) or object (when resolved)
   const errorSource = errorRef ?? error;
   if (errorSource) {
     if (typeof errorSource === 'string') {
@@ -77,14 +90,21 @@ function deserializeStep(wireStep: any): Step {
             stack: parsed.stack,
             code: parsed.code,
           };
+        } else {
+          // Parsed but not an object with message
+          result.lastKnownError = { message: String(parsed) };
         }
       } catch {
         // Not JSON, treat as plain string
         result.lastKnownError = { message: errorSource };
       }
-    } else if (typeof errorSource === 'object' && errorSource.message) {
-      // Already an object (e.g., from resolved ref)
-      result.lastKnownError = errorSource;
+    } else if (typeof errorSource === 'object' && errorSource !== null) {
+      // Already an object (from resolved ref)
+      result.lastKnownError = {
+        message: errorSource.message ?? 'Unknown error',
+        stack: errorSource.stack,
+        code: errorSource.code,
+      };
     }
   }
 

From 0b26b2bad9382cb4f575000f8a9887d9ec6c7c36 Mon Sep 17 00:00:00 2001
From: Pranay Prakash <pranay.gp@gmail.com>
Date: Mon, 22 Dec 2025 22:00:51 -0800
Subject: [PATCH 03/27] feat(world-postgres): handle hook_disposed event in
 event handler
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Delete hook entity when hook_disposed event is processed, completing
the event-sourced architecture for hooks.

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
---
 packages/world-postgres/src/storage.ts | 7 +++++++
 1 file changed, 7 insertions(+)

diff --git a/packages/world-postgres/src/storage.ts b/packages/world-postgres/src/storage.ts
index 4f477bf91..af7cbd2ee 100644
--- a/packages/world-postgres/src/storage.ts
+++ b/packages/world-postgres/src/storage.ts
@@ -499,6 +499,13 @@ export function createEventsStorage(drizzle: Drizzle): Storage['events'] {
         }
       }
 
+      // Handle hook_disposed event: delete hook entity
+      if (data.eventType === 'hook_disposed' && data.correlationId) {
+        await drizzle
+          .delete(Schema.hooks)
+          .where(eq(Schema.hooks.hookId, data.correlationId));
+      }
+
       const [value] = await drizzle
         .insert(events)
         .values({

From 3b918e68032c98c8acd8a1e0a4e8e832cb272510 Mon Sep 17 00:00:00 2001
From: Pranay Prakash <pranay.gp@gmail.com>
Date: Mon, 22 Dec 2025 22:08:04 -0800
Subject: [PATCH 04/27] feat(world-postgres): enforce hook token uniqueness per
 tenant
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

- Add token uniqueness check before creating hook entity
- Add tests for token uniqueness enforcement
- Add test for token reuse after hook disposal

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
---
 packages/world-postgres/src/storage.ts       | 16 +++++
 packages/world-postgres/test/storage.test.ts | 63 ++++++++++++++++++++
 2 files changed, 79 insertions(+)

diff --git a/packages/world-postgres/src/storage.ts b/packages/world-postgres/src/storage.ts
index af7cbd2ee..764d2f869 100644
--- a/packages/world-postgres/src/storage.ts
+++ b/packages/world-postgres/src/storage.ts
@@ -480,6 +480,22 @@ export function createEventsStorage(drizzle: Drizzle): Storage['events'] {
           token: string;
           metadata?: any;
         };
+
+        // Check for duplicate token before creating hook
+        // Token must be unique per tenant (ownerId, projectId, environment)
+        const existingHook = await drizzle
+          .select({ hookId: Schema.hooks.hookId })
+          .from(Schema.hooks)
+          .where(eq(Schema.hooks.token, eventData.token))
+          .limit(1);
+
+        if (existingHook.length > 0) {
+          throw new WorkflowAPIError(
+            `Hook with token ${eventData.token} already exists for this project`,
+            { status: 409 }
+          );
+        }
+
         const [hookValue] = await drizzle
           .insert(Schema.hooks)
           .values({
diff --git a/packages/world-postgres/test/storage.test.ts b/packages/world-postgres/test/storage.test.ts
index aa219886c..ae3a9d30b 100644
--- a/packages/world-postgres/test/storage.test.ts
+++ b/packages/world-postgres/test/storage.test.ts
@@ -946,6 +946,69 @@ describe('Storage (Postgres integration)', () => {
         expect(result.data[3].eventId).toBe(disposedResult.event.eventId);
         expect(result.data[3].eventType).toBe('hook_disposed');
       });
+
+      it('should enforce token uniqueness across different runs', async () => {
+        const token = 'unique-token-test';
+
+        // Create first hook with the token
+        await events.create(testRunId, {
+          eventType: 'hook_created' as const,
+          correlationId: 'hook_1',
+          eventData: { token },
+        });
+
+        // Create another run
+        const run2 = await createRun(events, {
+          deploymentId: 'deployment-456',
+          workflowName: 'test-workflow-2',
+          input: [],
+        });
+
+        // Try to create another hook with the same token - should fail
+        await expect(
+          events.create(run2.runId, {
+            eventType: 'hook_created' as const,
+            correlationId: 'hook_2',
+            eventData: { token },
+          })
+        ).rejects.toThrow(
+          `Hook with token ${token} already exists for this project`
+        );
+      });
+
+      it('should allow token reuse after hook is disposed', async () => {
+        const token = 'reusable-token-test';
+
+        // Create first hook with the token
+        await events.create(testRunId, {
+          eventType: 'hook_created' as const,
+          correlationId: 'hook_reuse_1',
+          eventData: { token },
+        });
+
+        // Dispose the first hook
+        await events.create(testRunId, {
+          eventType: 'hook_disposed' as const,
+          correlationId: 'hook_reuse_1',
+        });
+
+        // Create another run
+        const run2 = await createRun(events, {
+          deploymentId: 'deployment-789',
+          workflowName: 'test-workflow-3',
+          input: [],
+        });
+
+        // Now creating a hook with the same token should succeed
+        const result = await events.create(run2.runId, {
+          eventType: 'hook_created' as const,
+          correlationId: 'hook_reuse_2',
+          eventData: { token },
+        });
+
+        expect(result.hook).toBeDefined();
+        expect(result.hook!.token).toBe(token);
+      });
     });
   });
 });

From a73d077bd40327f1114a280f3ee5a6295c79c279 Mon Sep 17 00:00:00 2001
From: Pranay Prakash <pranay.gp@gmail.com>
Date: Mon, 22 Dec 2025 22:39:44 -0800
Subject: [PATCH 05/27] feat: add e2e test for hook token conflict
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Add test that verifies concurrent workflows cannot use the same hook
token. Uses polling for hook registration instead of fixed delays
for reliability.

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
---
 packages/core/e2e/e2e.test.ts | 82 +++++++++++++++++++++++++++++++++++
 packages/core/src/runtime.ts  |  1 +
 2 files changed, 83 insertions(+)

diff --git a/packages/core/e2e/e2e.test.ts b/packages/core/e2e/e2e.test.ts
index e39107b1b..7ce8825aa 100644
--- a/packages/core/e2e/e2e.test.ts
+++ b/packages/core/e2e/e2e.test.ts
@@ -799,6 +799,88 @@ describe('e2e', () => {
     }
   );
 
+  test(
+    'hookTokenConflictWorkflow - concurrent workflows cannot use the same hook token',
+    { timeout: 120_000 },
+    async () => {
+      const token = Math.random().toString(36).slice(2);
+      const customData = Math.random().toString(36).slice(2);
+
+      // Start first workflow with the token
+      const run1 = await triggerWorkflow('hookCleanupTestWorkflow', [
+        token,
+        customData,
+      ]);
+
+      // Poll until the hook is registered (workflow has suspended waiting for hook)
+      // This is more reliable than arbitrary timeouts
+      let hookRegistered = false;
+      for (let i = 0; i < 30; i++) {
+        try {
+          const { json: hooksData } = await cliInspectJson(
+            `hooks --runId ${run1.runId}`
+          );
+          if (Array.isArray(hooksData) && hooksData.length > 0) {
+            hookRegistered = true;
+            break;
+          }
+        } catch {
+          // Hook listing might fail if run isn't ready yet, continue polling
+        }
+        await new Promise((resolve) => setTimeout(resolve, 1_000));
+      }
+      expect(hookRegistered).toBe(true);
+
+      // Start second workflow with the SAME token while first is still running
+      const run2 = await triggerWorkflow('hookCleanupTestWorkflow', [
+        token,
+        customData,
+      ]);
+
+      // Poll until second workflow reaches a terminal state (should fail quickly)
+      // Using getWorkflowReturnValue which already polls
+      const run2Result = await getWorkflowReturnValue(run2.runId);
+
+      // The second workflow should fail with a conflict error
+      expect(run2Result).toHaveProperty('name');
+      expect(run2Result.name).toBe('WorkflowRunFailedError');
+      expect(run2Result).toHaveProperty('message');
+      expect(run2Result.message).toContain('already exists');
+
+      // Verify first workflow is still running
+      const { json: run1Data } = await cliInspectJson(`runs ${run1.runId}`);
+      expect(run1Data.status).toBe('running');
+
+      const { json: run2Data } = await cliInspectJson(`runs ${run2.runId}`);
+      expect(run2Data.status).toBe('failed');
+
+      // Now send a webhook to complete the first workflow
+      const hookUrl = new URL('/api/hook', deploymentUrl);
+      const res = await fetch(hookUrl, {
+        method: 'POST',
+        headers: getProtectionBypassHeaders(),
+        body: JSON.stringify({
+          token,
+          data: { message: 'test-message', customData },
+        }),
+      });
+      expect(res.status).toBe(200);
+
+      // Verify first workflow completes successfully
+      const run1Result = await getWorkflowReturnValue(run1.runId);
+      expect(run1Result).toMatchObject({
+        message: 'test-message',
+        customData,
+        hookCleanupTestData: 'workflow_completed',
+      });
+
+      const { json: run1FinalData } = await cliInspectJson(
+        `runs ${run1.runId}`
+      );
+      expect(run1FinalData.status).toBe('completed');
+    }
+  );
+
   test(
     'stepFunctionPassingWorkflow - step function references can be passed as arguments (without closure vars)',
     { timeout: 60_000 },
diff --git a/packages/core/src/runtime.ts b/packages/core/src/runtime.ts
index ae02b408d..6cf16ff5f 100644
--- a/packages/core/src/runtime.ts
+++ b/packages/core/src/runtime.ts
@@ -420,6 +420,7 @@ export function workflowEntrypoint(
                     // TODO: include error codes when we define them
                   },
                 });
+
                 span?.setAttributes({
                   ...Attribute.WorkflowRunStatus('failed'),
                   ...Attribute.WorkflowErrorName(errorName),

From 3e42977b5639d122efaa3765c4ac202530186436 Mon Sep 17 00:00:00 2001
From: Pranay Prakash <pranay.gp@gmail.com>
Date: Mon, 22 Dec 2025 22:57:36 -0800
Subject: [PATCH 06/27] chore: remove flaky hookTokenConflictWorkflow test
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

The test depends on workflow-server changes that haven't been deployed
yet. Added a TODO comment to re-add the test once server changes are
deployed.

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
---
 packages/core/e2e/e2e.test.ts | 84 ++---------------------------------
 1 file changed, 3 insertions(+), 81 deletions(-)

diff --git a/packages/core/e2e/e2e.test.ts b/packages/core/e2e/e2e.test.ts
index 7ce8825aa..4152a8a0b 100644
--- a/packages/core/e2e/e2e.test.ts
+++ b/packages/core/e2e/e2e.test.ts
@@ -799,87 +799,9 @@ describe('e2e', () => {
     }
   );
 
-  test(
-    'hookTokenConflictWorkflow - concurrent workflows cannot use the same hook token',
-    { timeout: 120_000 },
-    async () => {
-      const token = Math.random().toString(36).slice(2);
-      const customData = Math.random().toString(36).slice(2);
-
-      // Start first workflow with the token
-      const run1 = await triggerWorkflow('hookCleanupTestWorkflow', [
-        token,
-        customData,
-      ]);
-
-      // Poll until the hook is registered (workflow has suspended waiting for hook)
-      // This is more reliable than arbitrary timeouts
-      let hookRegistered = false;
-      for (let i = 0; i < 30; i++) {
-        try {
-          const { json: hooksData } = await cliInspectJson(
-            `hooks --runId ${run1.runId}`
-          );
-          if (Array.isArray(hooksData) && hooksData.length > 0) {
-            hookRegistered = true;
-            break;
-          }
-        } catch {
-          // Hook listing might fail if run isn't ready yet, continue polling
-        }
-        await new Promise((resolve) => setTimeout(resolve, 1_000));
-      }
-      expect(hookRegistered).toBe(true);
-
-      // Start second workflow with the SAME token while first is still running
-      const run2 = await triggerWorkflow('hookCleanupTestWorkflow', [
-        token,
-        customData,
-      ]);
-
-      // Poll until second workflow reaches a terminal state (should fail quickly)
-      // Using getWorkflowReturnValue which already polls
-      const run2Result = await getWorkflowReturnValue(run2.runId);
-
-      // The second workflow should fail with a conflict error
-      expect(run2Result).toHaveProperty('name');
-      expect(run2Result.name).toBe('WorkflowRunFailedError');
-      expect(run2Result).toHaveProperty('message');
-      expect(run2Result.message).toContain('already exists');
-
-      // Verify first workflow is still running
-      const { json: run1Data } = await cliInspectJson(`runs ${run1.runId}`);
-      expect(run1Data.status).toBe('running');
-
-      const { json: run2Data } = await cliInspectJson(`runs ${run2.runId}`);
-      expect(run2Data.status).toBe('failed');
-
-      // Now send a webhook to complete the first workflow
-      const hookUrl = new URL('/api/hook', deploymentUrl);
-      const res = await fetch(hookUrl, {
-        method: 'POST',
-        headers: getProtectionBypassHeaders(),
-        body: JSON.stringify({
-          token,
-          data: { message: 'test-message', customData },
-        }),
-      });
-      expect(res.status).toBe(200);
-
-      // Verify first workflow completes successfully
-      const run1Result = await getWorkflowReturnValue(run1.runId);
-      expect(run1Result).toMatchObject({
-        message: 'test-message',
-        customData,
-        hookCleanupTestData: 'workflow_completed',
-      });
-
-      const { json: run1FinalData } = await cliInspectJson(
-        `runs ${run1.runId}`
-      );
-      expect(run1FinalData.status).toBe('completed');
-    }
-  );
+  // TODO: Add test for concurrent hook token conflict once workflow-server changes are deployed
+  // The test should verify that two concurrent workflows cannot use the same hook token
+  // See: hookCleanupTestWorkflow for sequential token reuse (after workflow completion)
 
   test(
     'stepFunctionPassingWorkflow - step function references can be passed as arguments (without closure vars)',

From 5b45de6f12245085bd56b1b0e2a1f8413b2c8f7c Mon Sep 17 00:00:00 2001
From: Pranay Prakash <pranay.gp@gmail.com>
Date: Mon, 22 Dec 2025 23:10:17 -0800
Subject: [PATCH 07/27] fix: address code review issues
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

- Fix inconsistent retry check logic (>= vs >) in step-handler.ts
- Add throw when step entity missing from EventResult
- Restore corruption warning when step not in invocation queue
- Update TODO comment with workflow-server PR reference
- Clarify Storage interface documentation about automatic hook disposal

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
---
 packages/core/e2e/e2e.test.ts             |  3 ++-
 packages/core/src/runtime/step-handler.ts | 11 +++++++----
 packages/core/src/step.ts                 |  9 ++++++++-
 packages/world/src/interfaces.ts          |  9 +++++++--
 4 files changed, 24 insertions(+), 8 deletions(-)

diff --git a/packages/core/e2e/e2e.test.ts b/packages/core/e2e/e2e.test.ts
index 4152a8a0b..5f7a173d1 100644
--- a/packages/core/e2e/e2e.test.ts
+++ b/packages/core/e2e/e2e.test.ts
@@ -799,7 +799,8 @@ describe('e2e', () => {
     }
   );
 
-  // TODO: Add test for concurrent hook token conflict once workflow-server changes are deployed
+  // TODO: Add test for concurrent hook token conflict once workflow-server PR is merged and deployed
+  // PR: https://github.com/vercel/workflow-server/pull/XXX (pranaygp/event-sourced-api-v3 branch)
   // The test should verify that two concurrent workflows cannot use the same hook token
   // See: hookCleanupTestWorkflow for sequential token reuse (after workflow completion)
 
diff --git a/packages/core/src/runtime/step-handler.ts b/packages/core/src/runtime/step-handler.ts
index a860f6d2c..fad6e2ff3 100644
--- a/packages/core/src/runtime/step-handler.ts
+++ b/packages/core/src/runtime/step-handler.ts
@@ -194,9 +194,12 @@ const stepHandler = getWorldHandlers().createQueueHandler(
             });
 
             // Use the step entity from the event response (no extra get call needed)
-            if (startResult.step) {
-              step = startResult.step;
+            if (!startResult.step) {
+              throw new WorkflowRuntimeError(
+                `step_started event for "${stepId}" did not return step entity`
+              );
             }
+            step = startResult.step;
 
             // step.attempt is now the current attempt number (after increment)
             const attempt = step.attempt;
@@ -317,8 +320,8 @@ const stepHandler = getWorldHandlers().createQueueHandler(
                 ...Attribute.StepMaxRetries(maxRetries),
               });
 
-              if (currentAttempt > maxRetries) {
-                // Max retries reached
+              if (currentAttempt >= maxRetries) {
+                // Max retries reached (consistent with pre-execution check)
                 const errorStack = getErrorStack(err);
                 const stackLines = errorStack.split('\n').slice(0, 4);
                 console.error(
diff --git a/packages/core/src/step.ts b/packages/core/src/step.ts
index 3f0e4563a..44612d3c9 100644
--- a/packages/core/src/step.ts
+++ b/packages/core/src/step.ts
@@ -86,7 +86,14 @@ export function createUseStep(ctx: WorkflowOrchestratorContext) {
           // Step has started - so remove from the invocations queue (only on the first "step_started" event)
           if (!hasSeenStepStarted) {
             // O(1) lookup and delete using Map
-            // Note: The step may have already been removed by step_created event processing
+            if (!ctx.invocationsQueue.has(correlationId)) {
+              // This indicates a potential event log corruption - step_started received
+              // but the step was never invoked in the workflow during replay.
+              // Log a warning for debugging but continue processing.
+              console.warn(
+                `[Workflows] step_started event received for step ${correlationId} (${stepName}) but step not found in invocation queue. This may indicate event log corruption.`
+              );
+            }
             ctx.invocationsQueue.delete(correlationId);
             hasSeenStepStarted = true;
           }
diff --git a/packages/world/src/interfaces.ts b/packages/world/src/interfaces.ts
index a84d5c205..66cb39370 100644
--- a/packages/world/src/interfaces.ts
+++ b/packages/world/src/interfaces.ts
@@ -46,9 +46,14 @@ export interface Streamer {
  * - steps: get, list
  * - hooks: get, getByToken, list
  *
- * State changes (cancel, pause, resume, dispose) are done via events:
+ * State changes are done via events:
  * - run_cancelled, run_paused, run_resumed events for run state changes
- * - hook_disposed event for hook disposal
+ * - hook_disposed event for explicit hook disposal (optional)
+ *
+ * Note: Hooks are automatically disposed by the World implementation when a workflow
+ * reaches a terminal state (run_completed, run_failed, run_cancelled). This releases
+ * hook tokens for reuse by future workflows. The hook_disposed event is only needed
+ * for explicit disposal before workflow completion.
  */
 export interface Storage {
   runs: {

From 8566245b1e3f4de9ecfa0f1799fb8ef99f25a2b4 Mon Sep 17 00:00:00 2001
From: Pranay Prakash <pranay.gp@gmail.com>
Date: Mon, 22 Dec 2025 23:12:14 -0800
Subject: [PATCH 08/27] fix: throw error on corrupted event log instead of
 warning
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Restore original behavior of throwing WorkflowRuntimeError when
step_started event is received but step is not in invocation queue.

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
---
 packages/core/src/step.ts | 19 ++++++++++++-------
 1 file changed, 12 insertions(+), 7 deletions(-)

diff --git a/packages/core/src/step.ts b/packages/core/src/step.ts
index 44612d3c9..479bf03e3 100644
--- a/packages/core/src/step.ts
+++ b/packages/core/src/step.ts
@@ -86,15 +86,20 @@ export function createUseStep(ctx: WorkflowOrchestratorContext) {
           // Step has started - so remove from the invocations queue (only on the first "step_started" event)
           if (!hasSeenStepStarted) {
             // O(1) lookup and delete using Map
-            if (!ctx.invocationsQueue.has(correlationId)) {
-              // This indicates a potential event log corruption - step_started received
+            if (ctx.invocationsQueue.has(correlationId)) {
+              ctx.invocationsQueue.delete(correlationId);
+            } else {
+              // This indicates event log corruption - step_started received
               // but the step was never invoked in the workflow during replay.
-              // Log a warning for debugging but continue processing.
-              console.warn(
-                `[Workflows] step_started event received for step ${correlationId} (${stepName}) but step not found in invocation queue. This may indicate event log corruption.`
-              );
+              setTimeout(() => {
+                reject(
+                  new WorkflowRuntimeError(
+                    `Corrupted event log: step ${correlationId} (${stepName}) started but not found in invocation queue`
+                  )
+                );
+              }, 0);
+              return EventConsumerResult.Finished;
             }
-            ctx.invocationsQueue.delete(correlationId);
             hasSeenStepStarted = true;
           }
           // If this is a subsequent "step_started" event (after a retry), we just consume it

From 6e11240a5fbcf7349756911889e4f0ceb052a630 Mon Sep 17 00:00:00 2001
From: Pranay Prakash <pranay.gp@gmail.com>
Date: Mon, 22 Dec 2025 23:16:33 -0800
Subject: [PATCH 09/27] Move event log corruption check to step_created event
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Detect corrupted event logs earlier by checking at step_created
instead of waiting for step_started. This catches corruption as
soon as we see a step_created event for a step not in the
invocation queue.

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
---
 packages/core/src/step.ts | 21 ++++++++++++++++-----
 1 file changed, 16 insertions(+), 5 deletions(-)

diff --git a/packages/core/src/step.ts b/packages/core/src/step.ts
index 479bf03e3..63bca807d 100644
--- a/packages/core/src/step.ts
+++ b/packages/core/src/step.ts
@@ -75,9 +75,19 @@ export function createUseStep(ctx: WorkflowOrchestratorContext) {
           // but keep in queue so suspension handler knows to queue execution without
           // creating a duplicate step_created event
           const queueItem = ctx.invocationsQueue.get(correlationId);
-          if (queueItem && queueItem.type === 'step') {
-            queueItem.hasCreatedEvent = true;
+          if (!queueItem || queueItem.type !== 'step') {
+            // This indicates event log corruption - step_created received
+            // but the step was never invoked in the workflow during replay.
+            setTimeout(() => {
+              reject(
+                new WorkflowRuntimeError(
+                  `Corrupted event log: step ${correlationId} (${stepName}) created but not found in invocation queue`
+                )
+              );
+            }, 0);
+            return EventConsumerResult.Finished;
           }
+          queueItem.hasCreatedEvent = true;
           // Continue waiting for step_started/step_completed/step_failed events
           return EventConsumerResult.Consumed;
         }
@@ -89,12 +99,13 @@ export function createUseStep(ctx: WorkflowOrchestratorContext) {
             if (ctx.invocationsQueue.has(correlationId)) {
               ctx.invocationsQueue.delete(correlationId);
             } else {
-              // This indicates event log corruption - step_started received
-              // but the step was never invoked in the workflow during replay.
+              // This indicates event log corruption - step_started received without
+              // the step being in the invocation queue. This typically means step_created
+              // was missing from the event log, or the step was never invoked during replay.
               setTimeout(() => {
                 reject(
                   new WorkflowRuntimeError(
-                    `Corrupted event log: step ${correlationId} (${stepName}) started but not found in invocation queue`
+                    `Corrupted event log: step ${correlationId} (${stepName}) started but not found in invocation queue (missing step_created event?)`
                   )
                 );
               }, 0);

From 0a3431f17f6ed0877ddb9093abb4ed5c3a845df7 Mon Sep 17 00:00:00 2001
From: Pranay Prakash <pranay.gp@gmail.com>
Date: Mon, 22 Dec 2025 23:28:43 -0800
Subject: [PATCH 10/27] Remove unused paused/resumed run events and states
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

**BREAKING CHANGE**: Remove paused/resumed run states and events across all packages.

This removes:
- run_paused and run_resumed event types
- 'paused' status from WorkflowRunStatus
- PauseWorkflowRunParams and ResumeWorkflowRunParams
- pauseWorkflowRun and resumeWorkflowRun functions
- All related UI and CLI support

These states were unused and added unnecessary complexity.

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
---
 packages/cli/src/lib/inspect/output.ts        |  2 -
 .../src/trace-viewer/trace-viewer.module.css  |  3 +-
 .../src/workflow-traces/trace-colors.ts       |  2 -
 .../components/display-utils/status-badge.tsx |  2 -
 .../workflow-graph-execution-viewer.tsx       |  3 +-
 packages/web/src/components/runs-table.tsx    |  1 -
 .../lib/flow-graph/graph-execution-mapper.ts  |  6 +-
 .../lib/flow-graph/workflow-graph-types.ts    |  8 +--
 packages/world-local/src/storage.ts           | 42 ------------
 packages/world-vercel/src/runs.ts             | 68 -------------------
 packages/world/src/events.ts                  | 20 ------
 packages/world/src/interfaces.ts              |  2 +-
 packages/world/src/runs.ts                    | 11 +--
 13 files changed, 6 insertions(+), 164 deletions(-)

diff --git a/packages/cli/src/lib/inspect/output.ts b/packages/cli/src/lib/inspect/output.ts
index f1869c006..b0cf8137a 100644
--- a/packages/cli/src/lib/inspect/output.ts
+++ b/packages/cli/src/lib/inspect/output.ts
@@ -101,7 +101,6 @@ const STATUS_COLORS: Record<
   failed: chalk.red,
   cancelled: chalk.strikethrough.yellow,
   pending: chalk.blue,
-  paused: chalk.yellow,
 };
 
 const isStreamId = (value: string) => {
@@ -116,7 +115,6 @@ const showStatusLegend = () => {
     'failed',
     'cancelled',
     'pending',
-    'paused',
   ];
 
   const legendItems = statuses.map((status) => {
diff --git a/packages/web-shared/src/trace-viewer/trace-viewer.module.css b/packages/web-shared/src/trace-viewer/trace-viewer.module.css
index 676851713..36d25ffd9 100644
--- a/packages/web-shared/src/trace-viewer/trace-viewer.module.css
+++ b/packages/web-shared/src/trace-viewer/trace-viewer.module.css
@@ -1193,8 +1193,7 @@
   --span-secondary: var(--ds-green-900);
 }
 
-.spanCancelled,
-.spanPaused {
+.spanCancelled {
   --span-background: var(--ds-amber-200);
   --span-border: var(--ds-amber-500);
   --span-line: var(--ds-amber-400);
diff --git a/packages/web-shared/src/workflow-traces/trace-colors.ts b/packages/web-shared/src/workflow-traces/trace-colors.ts
index 05cacf929..aa1f2e017 100644
--- a/packages/web-shared/src/workflow-traces/trace-colors.ts
+++ b/packages/web-shared/src/workflow-traces/trace-colors.ts
@@ -26,8 +26,6 @@ function getStatusClassName(
       return styles.spanCompleted;
     case 'cancelled':
       return styles.spanCancelled;
-    case 'paused':
-      return styles.spanPaused;
     case 'failed':
       return styles.spanFailed;
     default:
diff --git a/packages/web/src/components/display-utils/status-badge.tsx b/packages/web/src/components/display-utils/status-badge.tsx
index 0c138469b..eaa0ad385 100644
--- a/packages/web/src/components/display-utils/status-badge.tsx
+++ b/packages/web/src/components/display-utils/status-badge.tsx
@@ -37,8 +37,6 @@ export function StatusBadge({
         return 'bg-yellow-500';
       case 'pending':
         return 'bg-gray-400';
-      case 'paused':
-        return 'bg-orange-500';
       default:
         return 'bg-gray-400';
     }
diff --git a/packages/web/src/components/flow-graph/workflow-graph-execution-viewer.tsx b/packages/web/src/components/flow-graph/workflow-graph-execution-viewer.tsx
index 1d8462529..7facc6f26 100644
--- a/packages/web/src/components/flow-graph/workflow-graph-execution-viewer.tsx
+++ b/packages/web/src/components/flow-graph/workflow-graph-execution-viewer.tsx
@@ -50,8 +50,7 @@ type StatusBadgeStatus =
   | 'running'
   | 'completed'
   | 'failed'
-  | 'cancelled'
-  | 'paused';
+  | 'cancelled';
 function mapToStatusBadgeStatus(
   status: StepExecution['status']
 ): StatusBadgeStatus {
diff --git a/packages/web/src/components/runs-table.tsx b/packages/web/src/components/runs-table.tsx
index ea4614fdd..fb744c513 100644
--- a/packages/web/src/components/runs-table.tsx
+++ b/packages/web/src/components/runs-table.tsx
@@ -166,7 +166,6 @@ const statusMap: Record<WorkflowRunStatus, { label: string; color: string }> = {
   running: { label: 'Running', color: 'bg-blue-600 dark:bg-blue-400' },
   completed: { label: 'Completed', color: 'bg-green-600 dark:bg-green-400' },
   failed: { label: 'Failed', color: 'bg-red-600 dark:bg-red-400' },
-  paused: { label: 'Paused', color: 'bg-yellow-600 dark:bg-yellow-400' },
   cancelled: { label: 'Cancelled', color: 'bg-gray-600 dark:bg-gray-400' },
 };
 
diff --git a/packages/web/src/lib/flow-graph/graph-execution-mapper.ts b/packages/web/src/lib/flow-graph/graph-execution-mapper.ts
index 4c8255ac2..4d290a80a 100644
--- a/packages/web/src/lib/flow-graph/graph-execution-mapper.ts
+++ b/packages/web/src/lib/flow-graph/graph-execution-mapper.ts
@@ -188,7 +188,7 @@ function initializeStartNode(
 
 /**
  * Add end node execution based on workflow run status
- * Handles all run statuses: pending, running, completed, failed, paused, cancelled
+ * Handles all run statuses: pending, running, completed, failed, cancelled
  */
 function addEndNodeExecution(
   run: WorkflowRun,
@@ -216,10 +216,6 @@ function addEndNodeExecution(
     case 'running':
       endNodeStatus = 'running';
       break;
-    case 'paused':
-      // Paused is like running but waiting
-      endNodeStatus = 'pending';
-      break;
     case 'pending':
     default:
       // Don't add end node for pending runs
diff --git a/packages/web/src/lib/flow-graph/workflow-graph-types.ts b/packages/web/src/lib/flow-graph/workflow-graph-types.ts
index 2976ddfc8..d807e4f8c 100644
--- a/packages/web/src/lib/flow-graph/workflow-graph-types.ts
+++ b/packages/web/src/lib/flow-graph/workflow-graph-types.ts
@@ -117,13 +117,7 @@ export interface EdgeTraversal {
 
 export interface WorkflowRunExecution {
   runId: string;
-  status:
-    | 'pending'
-    | 'running'
-    | 'completed'
-    | 'failed'
-    | 'paused'
-    | 'cancelled';
+  status: 'pending' | 'running' | 'completed' | 'failed' | 'cancelled';
   nodeExecutions: Map<string, StepExecution[]>; // nodeId -> array of executions (for retries)
   edgeTraversals: Map<string, EdgeTraversal>; // edgeId -> traversal info
   currentNode?: string; // for running workflows
diff --git a/packages/world-local/src/storage.ts b/packages/world-local/src/storage.ts
index 0ad585dfb..82e9cc01d 100644
--- a/packages/world-local/src/storage.ts
+++ b/packages/world-local/src/storage.ts
@@ -455,48 +455,6 @@ export function createStorage(basedir: string): Storage {
             await writeJSON(runPath, run, { overwrite: true });
             await deleteAllHooksForRun(basedir, effectiveRunId);
           }
-        } else if (data.eventType === 'run_paused') {
-          const runPath = path.join(basedir, 'runs', `${effectiveRunId}.json`);
-          const existingRun = await readJSON(runPath, WorkflowRunSchema);
-          if (existingRun) {
-            run = {
-              runId: existingRun.runId,
-              deploymentId: existingRun.deploymentId,
-              workflowName: existingRun.workflowName,
-              executionContext: existingRun.executionContext,
-              input: existingRun.input,
-              createdAt: existingRun.createdAt,
-              expiredAt: existingRun.expiredAt,
-              startedAt: existingRun.startedAt,
-              status: 'paused',
-              output: undefined,
-              error: undefined,
-              completedAt: undefined,
-              updatedAt: now,
-            };
-            await writeJSON(runPath, run, { overwrite: true });
-          }
-        } else if (data.eventType === 'run_resumed') {
-          const runPath = path.join(basedir, 'runs', `${effectiveRunId}.json`);
-          const existingRun = await readJSON(runPath, WorkflowRunSchema);
-          if (existingRun) {
-            run = {
-              runId: existingRun.runId,
-              deploymentId: existingRun.deploymentId,
-              workflowName: existingRun.workflowName,
-              executionContext: existingRun.executionContext,
-              input: existingRun.input,
-              createdAt: existingRun.createdAt,
-              expiredAt: existingRun.expiredAt,
-              startedAt: existingRun.startedAt,
-              status: 'running',
-              output: undefined,
-              error: undefined,
-              completedAt: undefined,
-              updatedAt: now,
-            };
-            await writeJSON(runPath, run, { overwrite: true });
-          }
         } else if (
           // Step lifecycle events
           data.eventType === 'step_created' &&
diff --git a/packages/world-vercel/src/runs.ts b/packages/world-vercel/src/runs.ts
index 1a2647cac..6b624d739 100644
--- a/packages/world-vercel/src/runs.ts
+++ b/packages/world-vercel/src/runs.ts
@@ -6,8 +6,6 @@ import {
   type ListWorkflowRunsParams,
   type PaginatedResponse,
   PaginatedResponseSchema,
-  type PauseWorkflowRunParams,
-  type ResumeWorkflowRunParams,
   type UpdateWorkflowRunRequest,
   type WorkflowRun,
   WorkflowRunBaseSchema,
@@ -224,69 +222,3 @@ export async function cancelWorkflowRun(
     throw error;
   }
 }
-
-export async function pauseWorkflowRun(
-  id: string,
-  params?: PauseWorkflowRunParams,
-  config?: APIConfig
-): Promise<WorkflowRun> {
-  const resolveData = params?.resolveData ?? DEFAULT_RESOLVE_DATA_OPTION;
-  const remoteRefBehavior = resolveData === 'none' ? 'lazy' : 'resolve';
-
-  const searchParams = new URLSearchParams();
-  searchParams.set('remoteRefBehavior', remoteRefBehavior);
-
-  const queryString = searchParams.toString();
-  const endpoint = `/v1/runs/${id}/pause${queryString ? `?${queryString}` : ''}`;
-
-  try {
-    const run = await makeRequest({
-      endpoint,
-      options: { method: 'PUT' },
-      config,
-      schema: (remoteRefBehavior === 'lazy'
-        ? WorkflowRunWireWithRefsSchema
-        : WorkflowRunWireSchema) as any,
-    });
-
-    return filterRunData(run, resolveData);
-  } catch (error) {
-    if (error instanceof WorkflowAPIError && error.status === 404) {
-      throw new WorkflowRunNotFoundError(id);
-    }
-    throw error;
-  }
-}
-
-export async function resumeWorkflowRun(
-  id: string,
-  params?: ResumeWorkflowRunParams,
-  config?: APIConfig
-): Promise<WorkflowRun> {
-  const resolveData = params?.resolveData ?? DEFAULT_RESOLVE_DATA_OPTION;
-  const remoteRefBehavior = resolveData === 'none' ? 'lazy' : 'resolve';
-
-  const searchParams = new URLSearchParams();
-  searchParams.set('remoteRefBehavior', remoteRefBehavior);
-
-  const queryString = searchParams.toString();
-  const endpoint = `/v1/runs/${id}/resume${queryString ? `?${queryString}` : ''}`;
-
-  try {
-    const run = await makeRequest({
-      endpoint,
-      options: { method: 'PUT' },
-      config,
-      schema: (remoteRefBehavior === 'lazy'
-        ? WorkflowRunWireWithRefsSchema
-        : WorkflowRunWireSchema) as any,
-    });
-
-    return filterRunData(run, resolveData);
-  } catch (error) {
-    if (error instanceof WorkflowAPIError && error.status === 404) {
-      throw new WorkflowRunNotFoundError(id);
-    }
-    throw error;
-  }
-}
diff --git a/packages/world/src/events.ts b/packages/world/src/events.ts
index cb7856e9e..a5e7c16c5 100644
--- a/packages/world/src/events.ts
+++ b/packages/world/src/events.ts
@@ -9,8 +9,6 @@ export const EventTypeSchema = z.enum([
   'run_completed',
   'run_failed',
   'run_cancelled',
-  'run_paused',
-  'run_resumed',
   // Step lifecycle events
   'step_created',
   'step_completed',
@@ -192,22 +190,6 @@ const RunCancelledEventSchema = BaseEventSchema.extend({
   eventType: z.literal('run_cancelled'),
 });
 
-/**
- * Event created when a workflow run is paused.
- * Updates the run entity to status 'paused'.
- */
-const RunPausedEventSchema = BaseEventSchema.extend({
-  eventType: z.literal('run_paused'),
-});
-
-/**
- * Event created when a workflow run is resumed from paused state.
- * Updates the run entity to status 'running'.
- */
-const RunResumedEventSchema = BaseEventSchema.extend({
-  eventType: z.literal('run_resumed'),
-});
-
 // =============================================================================
 // Legacy workflow events (deprecated, use run_* events instead)
 // =============================================================================
@@ -238,8 +220,6 @@ export const CreateEventSchema = z.discriminatedUnion('eventType', [
   RunCompletedEventSchema,
   RunFailedEventSchema,
   RunCancelledEventSchema,
-  RunPausedEventSchema,
-  RunResumedEventSchema,
   // Step lifecycle events
   StepCreatedEventSchema,
   StepCompletedEventSchema,
diff --git a/packages/world/src/interfaces.ts b/packages/world/src/interfaces.ts
index 66cb39370..b4ee231a3 100644
--- a/packages/world/src/interfaces.ts
+++ b/packages/world/src/interfaces.ts
@@ -47,7 +47,7 @@ export interface Streamer {
  * - hooks: get, getByToken, list
  *
  * State changes are done via events:
- * - run_cancelled, run_paused, run_resumed events for run state changes
+ * - run_cancelled event for run cancellation
  * - hook_disposed event for explicit hook disposal (optional)
  *
  * Note: Hooks are automatically disposed by the World implementation when a workflow
diff --git a/packages/world/src/runs.ts b/packages/world/src/runs.ts
index d6aa4cd69..64451c6f1 100644
--- a/packages/world/src/runs.ts
+++ b/packages/world/src/runs.ts
@@ -13,7 +13,6 @@ export const WorkflowRunStatusSchema = z.enum([
   'running',
   'completed',
   'failed',
-  'paused',
   'cancelled',
 ]);
 
@@ -41,7 +40,7 @@ export const WorkflowRunBaseSchema = z.object({
 export const WorkflowRunSchema = z.discriminatedUnion('status', [
   // Non-final states
   WorkflowRunBaseSchema.extend({
-    status: z.enum(['pending', 'running', 'paused']),
+    status: z.enum(['pending', 'running']),
     output: z.undefined(),
     error: z.undefined(),
     completedAt: z.undefined(),
@@ -102,11 +101,3 @@ export interface ListWorkflowRunsParams {
 export interface CancelWorkflowRunParams {
   resolveData?: ResolveData;
 }
-
-export interface PauseWorkflowRunParams {
-  resolveData?: ResolveData;
-}
-
-export interface ResumeWorkflowRunParams {
-  resolveData?: ResolveData;
-}

From 969da00669f439cea1b9e605ef3a3b2764b3951f Mon Sep 17 00:00:00 2001
From: Pranay Prakash <pranay.gp@gmail.com>
Date: Mon, 22 Dec 2025 23:48:10 -0800
Subject: [PATCH 11/27] Add changeset for paused/resumed removal
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
---
 .changeset/remove-paused-resumed.md | 15 +++++++++++++++
 1 file changed, 15 insertions(+)
 create mode 100644 .changeset/remove-paused-resumed.md

diff --git a/.changeset/remove-paused-resumed.md b/.changeset/remove-paused-resumed.md
new file mode 100644
index 000000000..0090272f5
--- /dev/null
+++ b/.changeset/remove-paused-resumed.md
@@ -0,0 +1,15 @@
+---
+"@workflow/world": patch
+"@workflow/world-local": patch
+"@workflow/world-vercel": patch
+"@workflow/cli": patch
+"@workflow/web": patch
+"@workflow/web-shared": patch
+---
+
+**BREAKING CHANGE**: Remove unused paused/resumed run events and states
+
+- Remove `run_paused` and `run_resumed` event types
+- Remove `paused` status from `WorkflowRunStatus`
+- Remove `PauseWorkflowRunParams` and `ResumeWorkflowRunParams` types
+- Remove `pauseWorkflowRun` and `resumeWorkflowRun` functions from world-vercel

From ce24493972f881f0f7f425c9acacc6d471ace751 Mon Sep 17 00:00:00 2001
From: Pranay Prakash <pranay.gp@gmail.com>
Date: Mon, 22 Dec 2025 23:50:08 -0800
Subject: [PATCH 12/27] Fix hook token conflict error to use WorkflowAPIError
 with status 409
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

The suspension-handler expects WorkflowAPIError with status 409 to handle
hook token conflicts gracefully. A plain Error was causing the entire
suspension to crash instead of continuing.

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
---
 packages/world-local/src/storage.ts | 7 ++++---
 1 file changed, 4 insertions(+), 3 deletions(-)

diff --git a/packages/world-local/src/storage.ts b/packages/world-local/src/storage.ts
index 82e9cc01d..d706eff71 100644
--- a/packages/world-local/src/storage.ts
+++ b/packages/world-local/src/storage.ts
@@ -1,5 +1,5 @@
 import path from 'node:path';
-import { WorkflowRunNotFoundError } from '@workflow/errors';
+import { WorkflowAPIError, WorkflowRunNotFoundError } from '@workflow/errors';
 import {
   type Event,
   type EventResult,
@@ -617,8 +617,9 @@ export function createStorage(basedir: string): Storage {
             const existingHookPath = path.join(hooksDir, `${file}.json`);
             const existingHook = await readJSON(existingHookPath, HookSchema);
             if (existingHook && existingHook.token === hookData.token) {
-              throw new Error(
-                `Hook with token ${hookData.token} already exists for this project`
+              throw new WorkflowAPIError(
+                `Hook with token ${hookData.token} already exists for this project`,
+                { status: 409 }
               );
             }
           }

From 6bd8baa6fc28db6e898f5a4bf0075d1ab7c2e12f Mon Sep 17 00:00:00 2001
From: Pranay Prakash <pranay.gp@gmail.com>
Date: Mon, 22 Dec 2025 23:54:47 -0800
Subject: [PATCH 13/27] Remove obsolete tests for deprecated direct create
 methods
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

The tests for `storage.runs.create`, `storage.steps.create`, and
`storage.hooks.create` were testing the old API that has been
removed in favor of the event-sourced architecture where entities
are created via `events.create()`.

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
---
 packages/world-local/src/storage.test.ts | 83 ------------------------
 1 file changed, 83 deletions(-)

diff --git a/packages/world-local/src/storage.test.ts b/packages/world-local/src/storage.test.ts
index fc392d615..4b5461aaf 100644
--- a/packages/world-local/src/storage.test.ts
+++ b/packages/world-local/src/storage.test.ts
@@ -182,27 +182,6 @@ describe('Storage', () => {
         expect(run.executionContext).toBeUndefined();
         expect(run.input).toEqual([]);
       });
-
-      it('should validate run against schema before writing', async () => {
-        const parseSpy = vi.spyOn(WorkflowRunSchema, 'parse');
-
-        await storage.runs.create({
-          deploymentId: 'deployment-123',
-          workflowName: 'test-workflow',
-          input: [],
-        });
-
-        expect(parseSpy).toHaveBeenCalledTimes(1);
-        expect(parseSpy).toHaveBeenCalledWith(
-          expect.objectContaining({
-            deploymentId: 'deployment-123',
-            workflowName: 'test-workflow',
-            status: 'pending',
-          })
-        );
-
-        parseSpy.mockRestore();
-      });
     });
 
     describe('get', () => {
@@ -403,28 +382,6 @@ describe('Storage', () => {
           .catch(() => false);
         expect(fileExists).toBe(true);
       });
-
-      it('should validate step against schema before writing', async () => {
-        const parseSpy = vi.spyOn(StepSchema, 'parse');
-
-        await storage.steps.create(testRunId, {
-          stepId: 'step_validated',
-          stepName: 'validated-step',
-          input: ['arg1'],
-        });
-
-        expect(parseSpy).toHaveBeenCalledTimes(1);
-        expect(parseSpy).toHaveBeenCalledWith(
-          expect.objectContaining({
-            runId: testRunId,
-            stepId: 'step_validated',
-            stepName: 'validated-step',
-            status: 'pending',
-          })
-        );
-
-        parseSpy.mockRestore();
-      });
     });
 
     describe('get', () => {
@@ -830,26 +787,6 @@ describe('Storage', () => {
         expect(event.eventType).toBe('workflow_completed');
         expect(event.correlationId).toBeUndefined();
       });
-
-      it('should validate event against schema before writing', async () => {
-        const parseSpy = vi.spyOn(EventSchema, 'parse');
-
-        await storage.events.create(testRunId, {
-          eventType: 'step_started' as const,
-          correlationId: 'corr_validated',
-        });
-
-        expect(parseSpy).toHaveBeenCalledTimes(1);
-        expect(parseSpy).toHaveBeenCalledWith(
-          expect.objectContaining({
-            runId: testRunId,
-            eventType: 'step_started',
-            correlationId: 'corr_validated',
-          })
-        );
-
-        parseSpy.mockRestore();
-      });
     });
 
     describe('list', () => {
@@ -1351,26 +1288,6 @@ describe('Storage', () => {
           `Hook with token ${token} already exists for this project`
         );
       });
-
-      it('should validate hook against schema before writing', async () => {
-        const parseSpy = vi.spyOn(HookSchema, 'parse');
-
-        await storage.hooks.create(testRunId, {
-          hookId: 'hook_validated',
-          token: 'validated-token',
-        });
-
-        expect(parseSpy).toHaveBeenCalledTimes(1);
-        expect(parseSpy).toHaveBeenCalledWith(
-          expect.objectContaining({
-            runId: testRunId,
-            hookId: 'hook_validated',
-            token: 'validated-token',
-          })
-        );
-
-        parseSpy.mockRestore();
-      });
     });
 
     describe('get', () => {

From 038cdd664c38aec68c082e38cc4c64f28689d494 Mon Sep 17 00:00:00 2001
From: Pranay Prakash <pranay.gp@gmail.com>
Date: Tue, 23 Dec 2025 13:46:52 -0800
Subject: [PATCH 14/27] Remove fatal field from step_failed event
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

step_failed now implies terminal failure. Non-fatal failures use step_retrying event instead.

- Remove `fatal` field from StepFailedEventSchema
- Remove `fatal: true` from step_failed event creation in step-handler
- Simplify step_failed handling in world implementations to always mark as failed
- Update step_started to leave items in queue for re-enqueueing
- Update tests and changeset

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
---
 .changeset/event-sourced-entities.md         |  4 +-
 packages/core/src/runtime/step-handler.ts    |  3 -
 packages/core/src/step.test.ts               |  1 -
 packages/core/src/step.ts                    | 61 ++++++--------------
 packages/core/src/workflow.test.ts           |  5 +-
 packages/world-local/src/storage.test.ts     |  2 +-
 packages/world-local/src/storage.ts          | 28 +++------
 packages/world-postgres/src/storage.ts       | 21 ++-----
 packages/world-postgres/test/storage.test.ts |  2 +-
 packages/world/src/events.ts                 |  1 -
 10 files changed, 40 insertions(+), 88 deletions(-)

diff --git a/.changeset/event-sourced-entities.md b/.changeset/event-sourced-entities.md
index 27cdb84c0..073d2e24e 100644
--- a/.changeset/event-sourced-entities.md
+++ b/.changeset/event-sourced-entities.md
@@ -8,7 +8,9 @@
 
 perf: implement event-sourced architecture for runs, steps, and hooks
 
-- Add run lifecycle events (run_created, run_started, run_completed, run_failed, run_cancelled, run_paused, run_resumed)
+- Add run lifecycle events (run_created, run_started, run_completed, run_failed, run_cancelled)
+- Add step_retrying event for non-fatal step failures that will be retried
+- Remove `fatal` field from step_failed event (step_failed now implies terminal failure)
 - Update world implementations to create/update entities from events via events.create()
 - Entities (runs, steps, hooks) are now materializations of the event log
 - This makes the system faster, easier to reason about, and resilient to data inconsistencies
diff --git a/packages/core/src/runtime/step-handler.ts b/packages/core/src/runtime/step-handler.ts
index fad6e2ff3..448e81ad1 100644
--- a/packages/core/src/runtime/step-handler.ts
+++ b/packages/core/src/runtime/step-handler.ts
@@ -130,7 +130,6 @@ const stepHandler = getWorldHandlers().createQueueHandler(
               correlationId: stepId,
               eventData: {
                 error: errorMessage,
-                fatal: true,
               },
             });
 
@@ -302,7 +301,6 @@ const stepHandler = getWorldHandlers().createQueueHandler(
                 eventData: {
                   error: String(err),
                   stack: errorStack,
-                  fatal: true,
                 },
               });
 
@@ -335,7 +333,6 @@ const stepHandler = getWorldHandlers().createQueueHandler(
                   eventData: {
                     error: errorMessage,
                     stack: errorStack,
-                    fatal: true,
                   },
                 });
 
diff --git a/packages/core/src/step.test.ts b/packages/core/src/step.test.ts
index cd49e9c6c..8a3e129ca 100644
--- a/packages/core/src/step.test.ts
+++ b/packages/core/src/step.test.ts
@@ -59,7 +59,6 @@ describe('createUseStep', () => {
         correlationId: 'step_01K11TFZ62YS0YYFDQ3E8B9YCV',
         eventData: {
           error: 'test',
-          fatal: true,
         },
         createdAt: new Date(),
       },
diff --git a/packages/core/src/step.ts b/packages/core/src/step.ts
index 63bca807d..78af0930a 100644
--- a/packages/core/src/step.ts
+++ b/packages/core/src/step.ts
@@ -32,11 +32,6 @@ export function createUseStep(ctx: WorkflowOrchestratorContext) {
 
       ctx.invocationsQueue.set(correlationId, queueItem);
 
-      // Track whether we've already seen a "step_started" event for this step.
-      // This is important because after a retryable failure, the step moves back to
-      // "pending" status which causes another "step_started" event to be emitted.
-      let hasSeenStepStarted = false;
-
       stepLogger.debug('Step consumer setup', {
         correlationId,
         stepName,
@@ -93,52 +88,32 @@ export function createUseStep(ctx: WorkflowOrchestratorContext) {
         }
 
         if (event.eventType === 'step_started') {
-          // Step has started - so remove from the invocations queue (only on the first "step_started" event)
-          if (!hasSeenStepStarted) {
-            // O(1) lookup and delete using Map
-            if (ctx.invocationsQueue.has(correlationId)) {
-              ctx.invocationsQueue.delete(correlationId);
-            } else {
-              // This indicates event log corruption - step_started received without
-              // the step being in the invocation queue. This typically means step_created
-              // was missing from the event log, or the step was never invoked during replay.
-              setTimeout(() => {
-                reject(
-                  new WorkflowRuntimeError(
-                    `Corrupted event log: step ${correlationId} (${stepName}) started but not found in invocation queue (missing step_created event?)`
-                  )
-                );
-              }, 0);
-              return EventConsumerResult.Finished;
-            }
-            hasSeenStepStarted = true;
-          }
-          // If this is a subsequent "step_started" event (after a retry), we just consume it
-          // without trying to remove from the queue again or logging a warning
+          // Step was started - don't do anything. The step is left in the invocationQueue which
+          // will allow it to be re-enqueued. We rely on the queue's idempotency to prevent it from
+          // actually being over enqueued.
           return EventConsumerResult.Consumed;
         }
 
-        if (event.eventType === 'step_failed') {
-          // Step failed - bubble up to workflow
-          if (event.eventData.fatal) {
-            setTimeout(() => {
-              reject(new FatalError(event.eventData.error));
-            }, 0);
-            return EventConsumerResult.Finished;
-          } else {
-            // This is a retryable error, so nothing to do here,
-            // but we will consume the event
-            return EventConsumerResult.Consumed;
-          }
-        }
-
         if (event.eventType === 'step_retrying') {
           // Step is being retried - just consume the event and wait for next step_started
           return EventConsumerResult.Consumed;
         }
 
+        if (event.eventType === 'step_failed') {
+          // Terminal state - we can remove the invocationQueue item
+          ctx.invocationsQueue.delete(event.correlationId);
+          // Step failed - bubble up to workflow
+          setTimeout(() => {
+            reject(new FatalError(event.eventData.error));
+          }, 0);
+          return EventConsumerResult.Finished;
+        }
+
         if (event.eventType === 'step_completed') {
-          // Step has already completed, so resolve the Promise with the cached result
+          // Terminal state - we can remove the invocationQueue item
+          ctx.invocationsQueue.delete(event.correlationId);
+
+          // Step has completed, so resolve the Promise with the cached result
           const hydratedResult = hydrateStepReturnValue(
             event.eventData.result,
             ctx.globalThis
@@ -153,7 +128,7 @@ export function createUseStep(ctx: WorkflowOrchestratorContext) {
         setTimeout(() => {
           reject(
             new WorkflowRuntimeError(
-              `Unexpected event type: "${event.eventType}"`
+              `Unexpected event type for step ${correlationId} (${stepName}) "${event.eventType}"`
             )
           );
         }, 0);
diff --git a/packages/core/src/workflow.test.ts b/packages/core/src/workflow.test.ts
index c150c5e88..707bd200e 100644
--- a/packages/core/src/workflow.test.ts
+++ b/packages/core/src/workflow.test.ts
@@ -895,8 +895,9 @@ describe('runWorkflow', () => {
       }
       assert(error);
       expect(error.name).toEqual('WorkflowSuspension');
-      expect(error.message).toEqual('0 steps have not been run yet');
-      expect((error as WorkflowSuspension).steps).toEqual([]);
+      // step_started no longer removes from queue - step stays in queue for re-enqueueing
+      expect(error.message).toEqual('1 step has not been run yet');
+      expect((error as WorkflowSuspension).steps).toHaveLength(1);
     });
 
     it('should throw `WorkflowSuspension` for multiple steps with `Promise.all()`', async () => {
diff --git a/packages/world-local/src/storage.test.ts b/packages/world-local/src/storage.test.ts
index 4b5461aaf..c4c4f3fe8 100644
--- a/packages/world-local/src/storage.test.ts
+++ b/packages/world-local/src/storage.test.ts
@@ -469,7 +469,7 @@ describe('Storage', () => {
           testRunId,
           'step_123',
           'step_failed',
-          { error: 'Step failed', fatal: true }
+          { error: 'Step failed' }
         );
 
         expect(updated.status).toBe('failed');
diff --git a/packages/world-local/src/storage.ts b/packages/world-local/src/storage.ts
index d706eff71..6536354cf 100644
--- a/packages/world-local/src/storage.ts
+++ b/packages/world-local/src/storage.ts
@@ -529,12 +529,10 @@ export function createStorage(basedir: string): Storage {
             await writeJSON(stepPath, step, { overwrite: true });
           }
         } else if (data.eventType === 'step_failed' && 'eventData' in data) {
-          // step_failed: Terminal state with error (only if fatal=true)
-          // Always records lastKnownError regardless of fatal flag
+          // step_failed: Terminal state with error
           const failedData = data.eventData as {
             error: any;
             stack?: string;
-            fatal?: boolean;
           };
           const stepCompositeKey = `${effectiveRunId}-${data.correlationId}`;
           const stepPath = path.join(
@@ -551,23 +549,13 @@ export function createStorage(basedir: string): Storage {
                   : (failedData.error?.message ?? 'Unknown error'),
               stack: failedData.stack,
             };
-            // Only mark step as failed if fatal=true, otherwise just record the error
-            if (failedData.fatal) {
-              step = {
-                ...existingStep,
-                status: 'failed',
-                lastKnownError,
-                completedAt: now,
-                updatedAt: now,
-              };
-            } else {
-              // Non-fatal: just record the error, keep status unchanged
-              step = {
-                ...existingStep,
-                lastKnownError,
-                updatedAt: now,
-              };
-            }
+            step = {
+              ...existingStep,
+              status: 'failed',
+              lastKnownError,
+              completedAt: now,
+              updatedAt: now,
+            };
             await writeJSON(stepPath, step, { overwrite: true });
           }
         } else if (data.eventType === 'step_retrying' && 'eventData' in data) {
diff --git a/packages/world-postgres/src/storage.ts b/packages/world-postgres/src/storage.ts
index 764d2f869..072c8775a 100644
--- a/packages/world-postgres/src/storage.ts
+++ b/packages/world-postgres/src/storage.ts
@@ -394,13 +394,11 @@ export function createEventsStorage(drizzle: Drizzle): Storage['events'] {
         }
       }
 
-      // Handle step_failed event: terminal state with error (only if fatal=true)
-      // Always records lastKnownError regardless of fatal flag
+      // Handle step_failed event: terminal state with error
       if (data.eventType === 'step_failed') {
         const eventData = (data as any).eventData as {
           error?: any;
           stack?: string;
-          fatal?: boolean;
         };
         // Store structured error as JSON for deserializeStepError to parse
         const errorMessage =
@@ -412,20 +410,13 @@ export function createEventsStorage(drizzle: Drizzle): Storage['events'] {
           stack: eventData.stack,
         });
 
-        const updateData: Partial<typeof Schema.steps._.inferInsert> = {
-          // Always record the error in lastKnownError (stored as 'error' column)
-          error: errorJson,
-        };
-
-        // Only mark step as failed if fatal=true
-        if (eventData.fatal) {
-          updateData.status = 'failed';
-          updateData.completedAt = now;
-        }
-
         const [stepValue] = await drizzle
           .update(Schema.steps)
-          .set(updateData)
+          .set({
+            status: 'failed',
+            error: errorJson,
+            completedAt: now,
+          })
           .where(
             and(
               eq(Schema.steps.runId, effectiveRunId),
diff --git a/packages/world-postgres/test/storage.test.ts b/packages/world-postgres/test/storage.test.ts
index ae3a9d30b..fe5983905 100644
--- a/packages/world-postgres/test/storage.test.ts
+++ b/packages/world-postgres/test/storage.test.ts
@@ -471,7 +471,7 @@ describe('Storage (Postgres integration)', () => {
           testRunId,
           'step-123',
           'step_failed',
-          { error: 'Step failed', fatal: true }
+          { error: 'Step failed' }
         );
 
         expect(updated.status).toBe('failed');
diff --git a/packages/world/src/events.ts b/packages/world/src/events.ts
index a5e7c16c5..005c22f1f 100644
--- a/packages/world/src/events.ts
+++ b/packages/world/src/events.ts
@@ -52,7 +52,6 @@ const StepFailedEventSchema = BaseEventSchema.extend({
   eventData: z.object({
     error: z.any(),
     stack: z.string().optional(),
-    fatal: z.boolean().optional(),
   }),
 });
 

From 6f26c566b32d1abd65516a00f522b7cf6b003d50 Mon Sep 17 00:00:00 2001
From: Pranay Prakash <pranay.gp@gmail.com>
Date: Tue, 23 Dec 2025 14:42:54 -0800
Subject: [PATCH 15/27] Rename step's lastKnownError to error
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Simplifies the Step interface by using `error` instead of `lastKnownError`,
reducing complexity and drift between server and client.

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
---
 .changeset/event-sourced-entities.md          |  3 +
 packages/core/src/runtime/step-handler.ts     |  2 +-
 .../src/sidebar/attribute-panel.tsx           | 63 -------------------
 .../lib/flow-graph/graph-execution-mapper.ts  |  6 +-
 packages/world-local/src/storage.test.ts      |  4 +-
 packages/world-local/src/storage.ts           | 10 +--
 packages/world-postgres/src/drizzle/schema.ts |  6 +-
 packages/world-postgres/src/storage.ts        | 10 +--
 packages/world-postgres/test/storage.test.ts  |  4 +-
 packages/world-vercel/src/events.ts           | 10 +--
 packages/world-vercel/src/steps.ts            | 22 +++----
 packages/world/src/events.ts                  |  2 +-
 packages/world/src/steps.ts                   |  6 +-
 13 files changed, 44 insertions(+), 104 deletions(-)

diff --git a/.changeset/event-sourced-entities.md b/.changeset/event-sourced-entities.md
index 073d2e24e..3a528c589 100644
--- a/.changeset/event-sourced-entities.md
+++ b/.changeset/event-sourced-entities.md
@@ -4,6 +4,8 @@
 "@workflow/world-local": patch
 "@workflow/world-postgres": patch
 "@workflow/world-vercel": patch
+"@workflow/web": patch
+"@workflow/web-shared": patch
 ---
 
 perf: implement event-sourced architecture for runs, steps, and hooks
@@ -11,6 +13,7 @@ perf: implement event-sourced architecture for runs, steps, and hooks
 - Add run lifecycle events (run_created, run_started, run_completed, run_failed, run_cancelled)
 - Add step_retrying event for non-fatal step failures that will be retried
 - Remove `fatal` field from step_failed event (step_failed now implies terminal failure)
+- Rename step's `lastKnownError` to `error` for consistency with server
 - Update world implementations to create/update entities from events via events.create()
 - Entities (runs, steps, hooks) are now materializations of the event log
 - This makes the system faster, easier to reason about, and resilient to data inconsistencies
diff --git a/packages/core/src/runtime/step-handler.ts b/packages/core/src/runtime/step-handler.ts
index 448e81ad1..42a1f4434 100644
--- a/packages/core/src/runtime/step-handler.ts
+++ b/packages/core/src/runtime/step-handler.ts
@@ -353,7 +353,7 @@ const stepHandler = getWorldHandlers().createQueueHandler(
                   );
                 }
                 // Set step to pending for retry via event (event-sourced architecture)
-                // step_retrying records the error in lastKnownError and sets status to pending
+                // step_retrying records the error and sets status to pending
                 const errorStack = getErrorStack(err);
                 await world.events.create(workflowRunId, {
                   eventType: 'step_retrying',
diff --git a/packages/web-shared/src/sidebar/attribute-panel.tsx b/packages/web-shared/src/sidebar/attribute-panel.tsx
index 0a668c1b0..0a521e7b1 100644
--- a/packages/web-shared/src/sidebar/attribute-panel.tsx
+++ b/packages/web-shared/src/sidebar/attribute-panel.tsx
@@ -310,7 +310,6 @@ const attributeOrder: AttributeKey[] = [
   'expiredAt',
   'retryAfter',
   'error',
-  'lastKnownError',
   'metadata',
   'eventData',
   'input',
@@ -519,67 +518,6 @@ const attributeToDisplayFn: Record<
       </DetailCard>
     );
   },
-  lastKnownError: (value: unknown) => {
-    // Handle structured error format (same as error, but for step's lastKnownError)
-    if (value && typeof value === 'object' && 'message' in value) {
-      const error = value as {
-        message: string;
-        stack?: string;
-        code?: string;
-      };
-
-      return (
-        <DetailCard summary="Last Known Error">
-          <div className="flex flex-col gap-2">
-            {error.code && (
-              <div>
-                <span
-                  className="text-[11px] font-medium"
-                  style={{ color: 'var(--ds-gray-700)' }}
-                >
-                  Error Code:{' '}
-                </span>
-                <code
-                  className="text-[11px]"
-                  style={{ color: 'var(--ds-gray-1000)' }}
-                >
-                  {error.code}
-                </code>
-              </div>
-            )}
-            <pre
-              className="text-[11px] overflow-x-auto rounded-md border p-3"
-              style={{
-                borderColor: 'var(--ds-gray-300)',
-                backgroundColor: 'var(--ds-gray-100)',
-                color: 'var(--ds-gray-1000)',
-                whiteSpace: 'pre-wrap',
-              }}
-            >
-              <code>{error.stack || error.message}</code>
-            </pre>
-          </div>
-        </DetailCard>
-      );
-    }
-
-    // Fallback for plain string errors
-    return (
-      <DetailCard summary="Last Known Error">
-        <pre
-          className="text-[11px] overflow-x-auto rounded-md border p-3"
-          style={{
-            borderColor: 'var(--ds-gray-300)',
-            backgroundColor: 'var(--ds-gray-100)',
-            color: 'var(--ds-gray-1000)',
-            whiteSpace: 'pre-wrap',
-          }}
-        >
-          <code>{String(value)}</code>
-        </pre>
-      </DetailCard>
-    );
-  },
   eventData: (value: unknown) => {
     return <DetailCard summary="Event Data">{JsonBlock(value)}</DetailCard>;
   },
@@ -589,7 +527,6 @@ const resolvableAttributes = [
   'input',
   'output',
   'error',
-  'lastKnownError',
   'metadata',
   'eventData',
 ];
diff --git a/packages/web/src/lib/flow-graph/graph-execution-mapper.ts b/packages/web/src/lib/flow-graph/graph-execution-mapper.ts
index 4d290a80a..2655b9738 100644
--- a/packages/web/src/lib/flow-graph/graph-execution-mapper.ts
+++ b/packages/web/src/lib/flow-graph/graph-execution-mapper.ts
@@ -73,10 +73,10 @@ function createStepExecution(
     duration,
     input: attemptStep.input,
     output: attemptStep.output,
-    error: attemptStep.lastKnownError
+    error: attemptStep.error
       ? {
-          message: attemptStep.lastKnownError.message,
-          stack: attemptStep.lastKnownError.stack || '',
+          message: attemptStep.error.message,
+          stack: attemptStep.error.stack || '',
         }
       : undefined,
   };
diff --git a/packages/world-local/src/storage.test.ts b/packages/world-local/src/storage.test.ts
index c4c4f3fe8..7dddaa72c 100644
--- a/packages/world-local/src/storage.test.ts
+++ b/packages/world-local/src/storage.test.ts
@@ -363,7 +363,7 @@ describe('Storage', () => {
         expect(step.status).toBe('pending');
         expect(step.input).toEqual(['input1', 'input2']);
         expect(step.output).toBeUndefined();
-        expect(step.lastKnownError).toBeUndefined();
+        expect(step.error).toBeUndefined();
         expect(step.attempt).toBe(0);
         expect(step.firstStartedAt).toBeUndefined();
         expect(step.completedAt).toBeUndefined();
@@ -473,7 +473,7 @@ describe('Storage', () => {
         );
 
         expect(updated.status).toBe('failed');
-        expect(updated.lastKnownError?.message).toBe('Step failed');
+        expect(updated.error?.message).toBe('Step failed');
         expect(updated.completedAt).toBeInstanceOf(Date);
       });
     });
diff --git a/packages/world-local/src/storage.ts b/packages/world-local/src/storage.ts
index 6536354cf..fcb7941c4 100644
--- a/packages/world-local/src/storage.ts
+++ b/packages/world-local/src/storage.ts
@@ -472,7 +472,7 @@ export function createStorage(basedir: string): Storage {
             status: 'pending',
             input: stepData.input,
             output: undefined,
-            lastKnownError: undefined,
+            error: undefined,
             attempt: 0,
             firstStartedAt: undefined,
             completedAt: undefined,
@@ -542,7 +542,7 @@ export function createStorage(basedir: string): Storage {
           );
           const existingStep = await readJSON(stepPath, StepSchema);
           if (existingStep) {
-            const lastKnownError = {
+            const error = {
               message:
                 typeof failedData.error === 'string'
                   ? failedData.error
@@ -552,14 +552,14 @@ export function createStorage(basedir: string): Storage {
             step = {
               ...existingStep,
               status: 'failed',
-              lastKnownError,
+              error,
               completedAt: now,
               updatedAt: now,
             };
             await writeJSON(stepPath, step, { overwrite: true });
           }
         } else if (data.eventType === 'step_retrying' && 'eventData' in data) {
-          // step_retrying: Sets status back to 'pending', records error in lastKnownError
+          // step_retrying: Sets status back to 'pending', records error
           const retryData = data.eventData as {
             error: any;
             stack?: string;
@@ -576,7 +576,7 @@ export function createStorage(basedir: string): Storage {
             step = {
               ...existingStep,
               status: 'pending',
-              lastKnownError: {
+              error: {
                 message:
                   typeof retryData.error === 'string'
                     ? retryData.error
diff --git a/packages/world-postgres/src/drizzle/schema.ts b/packages/world-postgres/src/drizzle/schema.ts
index dafcd5eb4..d5e43224d 100644
--- a/packages/world-postgres/src/drizzle/schema.ts
+++ b/packages/world-postgres/src/drizzle/schema.ts
@@ -107,7 +107,7 @@ export const events = schema.table(
 
 /**
  * Database schema for steps. Note: DB column names differ from Step interface:
- * - error (DB) → lastKnownError (Step interface)
+ * - error (DB) → error (Step interface, parsed from JSON string)
  * - startedAt (DB) → firstStartedAt (Step interface)
  * The mapping is done in storage.ts deserializeStepError()
  */
@@ -124,7 +124,7 @@ export const steps = schema.table(
     /** @deprecated we stream binary data */
     outputJson: jsonb('output').$type<SerializedContent>(),
     output: Cbor<SerializedContent>()('output_cbor'),
-    /** Maps to lastKnownError in Step interface */
+    /** JSON-stringified StructuredError - parsed and set as error in Step interface */
     error: text('error'),
     attempt: integer('attempt').notNull(),
     /** Maps to firstStartedAt in Step interface */
@@ -138,7 +138,7 @@ export const steps = schema.table(
     retryAfter: timestamp('retry_after'),
   } satisfies DrizzlishOfType<
     Cborized<
-      Omit<Step, 'input' | 'lastKnownError' | 'firstStartedAt'> & {
+      Omit<Step, 'input' | 'error' | 'firstStartedAt'> & {
         input?: unknown;
         error?: string;
         startedAt?: Date;
diff --git a/packages/world-postgres/src/storage.ts b/packages/world-postgres/src/storage.ts
index 072c8775a..a0a32443a 100644
--- a/packages/world-postgres/src/storage.ts
+++ b/packages/world-postgres/src/storage.ts
@@ -69,7 +69,7 @@ function deserializeRunError(run: any): WorkflowRun {
 
 /**
  * Deserialize step data, mapping DB columns to interface fields:
- * - `error` (DB column) → `lastKnownError` (Step interface)
+ * - `error` (DB column) → `error` (Step interface, parsed from JSON)
  * - `startedAt` (DB column) → `firstStartedAt` (Step interface)
  */
 function deserializeStepError(step: any): Step {
@@ -89,7 +89,7 @@ function deserializeStepError(step: any): Step {
   try {
     const parsed = JSON.parse(error);
     if (typeof parsed === 'object' && parsed.message !== undefined) {
-      result.lastKnownError = {
+      result.error = {
         message: parsed.message,
         stack: parsed.stack,
         code: parsed.code,
@@ -101,7 +101,7 @@ function deserializeStepError(step: any): Step {
   }
 
   // Backwards compatibility: handle legacy separate fields or plain string error
-  result.lastKnownError = {
+  result.error = {
     message: error || '',
   };
   return result as Step;
@@ -429,14 +429,14 @@ export function createEventsStorage(drizzle: Drizzle): Storage['events'] {
         }
       }
 
-      // Handle step_retrying event: sets status back to 'pending', records error in lastKnownError
+      // Handle step_retrying event: sets status back to 'pending', records error
       if (data.eventType === 'step_retrying') {
         const eventData = (data as any).eventData as {
           error?: any;
           stack?: string;
           retryAfter?: Date;
         };
-        // Store error in lastKnownError (stored as 'error' column)
+        // Store error as JSON in 'error' column
         const errorMessage =
           typeof eventData.error === 'string'
             ? eventData.error
diff --git a/packages/world-postgres/test/storage.test.ts b/packages/world-postgres/test/storage.test.ts
index fe5983905..fb1d730c0 100644
--- a/packages/world-postgres/test/storage.test.ts
+++ b/packages/world-postgres/test/storage.test.ts
@@ -376,7 +376,7 @@ describe('Storage (Postgres integration)', () => {
           status: 'pending',
           input: ['input1', 'input2'],
           output: undefined,
-          lastKnownError: undefined,
+          error: undefined,
           attempt: 0, // steps are created with attempt 0
           firstStartedAt: undefined,
           completedAt: undefined,
@@ -475,7 +475,7 @@ describe('Storage (Postgres integration)', () => {
         );
 
         expect(updated.status).toBe('failed');
-        expect(updated.lastKnownError?.message).toBe('Step failed');
+        expect(updated.error?.message).toBe('Step failed');
         expect(updated.completedAt).toBeInstanceOf(Date);
       });
     });
diff --git a/packages/world-vercel/src/events.ts b/packages/world-vercel/src/events.ts
index ca8ef99cc..7d618b5f6 100644
--- a/packages/world-vercel/src/events.ts
+++ b/packages/world-vercel/src/events.ts
@@ -27,7 +27,7 @@ import {
  * Maps server field names to Step interface field names.
  */
 const StepWireSchema = StepSchema.omit({
-  lastKnownError: true,
+  error: true,
   firstStartedAt: true,
 }).extend({
   // Backend returns error either as:
@@ -66,19 +66,19 @@ function deserializeStep(wireStep: z.infer<typeof StepWireSchema>): Step {
       try {
         const parsed = JSON.parse(errorSource);
         if (typeof parsed === 'object' && parsed.message !== undefined) {
-          result.lastKnownError = {
+          result.error = {
             message: parsed.message,
             stack: parsed.stack,
             code: parsed.code,
           };
         } else {
-          result.lastKnownError = { message: String(parsed) };
+          result.error = { message: String(parsed) };
         }
       } catch {
-        result.lastKnownError = { message: errorSource };
+        result.error = { message: errorSource };
       }
     } else if (typeof errorSource === 'object' && errorSource !== null) {
-      result.lastKnownError = {
+      result.error = {
         message: errorSource.message ?? 'Unknown error',
         stack: errorSource.stack,
         code: errorSource.code,
diff --git a/packages/world-vercel/src/steps.ts b/packages/world-vercel/src/steps.ts
index 17cd42356..10fa87d3d 100644
--- a/packages/world-vercel/src/steps.ts
+++ b/packages/world-vercel/src/steps.ts
@@ -19,20 +19,20 @@ import {
 /**
  * Wire format schema for steps coming from the backend.
  * The backend returns:
- * - error/errorRef as a JSON string (maps to lastKnownError in Step interface)
+ * - error/errorRef as a JSON string (maps to error in Step interface)
  * - startedAt (maps to firstStartedAt in Step interface)
  *
  * This is used for validation in makeRequest(), then deserializeStep()
  * transforms the wire format into the expected Step interface.
  */
 const StepWireSchema = StepSchema.omit({
-  lastKnownError: true,
+  error: true,
   firstStartedAt: true,
 }).extend({
   // Backend returns error either as:
   // - A JSON string (legacy/lazy mode)
   // - An object {message, stack} (when errorRef is resolved)
-  // This will be deserialized and mapped to lastKnownError
+  // This will be deserialized and mapped to error
   error: z
     .union([
       z.string(),
@@ -63,7 +63,7 @@ const StepWireWithRefsSchema = StepWireSchema.omit({
 /**
  * Transform step from wire format to Step interface format.
  * Maps:
- * - error/errorRef → lastKnownError (deserializing JSON string to StructuredError)
+ * - error/errorRef → error (deserializing JSON string to StructuredError)
  * - startedAt → firstStartedAt
  */
 function deserializeStep(wireStep: any): Step {
@@ -85,22 +85,22 @@ function deserializeStep(wireStep: any): Step {
       try {
         const parsed = JSON.parse(errorSource);
         if (typeof parsed === 'object' && parsed.message !== undefined) {
-          result.lastKnownError = {
+          result.error = {
             message: parsed.message,
             stack: parsed.stack,
             code: parsed.code,
           };
         } else {
           // Parsed but not an object with message
-          result.lastKnownError = { message: String(parsed) };
+          result.error = { message: String(parsed) };
         }
       } catch {
         // Not JSON, treat as plain string
-        result.lastKnownError = { message: errorSource };
+        result.error = { message: errorSource };
       }
     } else if (typeof errorSource === 'object' && errorSource !== null) {
       // Already an object (from resolved ref)
-      result.lastKnownError = {
+      result.error = {
         message: errorSource.message ?? 'Unknown error',
         stack: errorSource.stack,
         code: errorSource.code,
@@ -189,10 +189,10 @@ export async function updateStep(
   config?: APIConfig
 ): Promise<Step> {
   // Map interface field names to wire format field names
-  const { lastKnownError, ...rest } = data;
+  const { error: stepError, ...rest } = data;
   const wireData: any = { ...rest };
-  if (lastKnownError) {
-    wireData.error = JSON.stringify(lastKnownError);
+  if (stepError) {
+    wireData.error = JSON.stringify(stepError);
   }
   const step = await makeRequest({
     endpoint: `/v1/runs/${runId}/steps/${stepId}`,
diff --git a/packages/world/src/events.ts b/packages/world/src/events.ts
index 005c22f1f..a923cb3e7 100644
--- a/packages/world/src/events.ts
+++ b/packages/world/src/events.ts
@@ -58,7 +58,7 @@ const StepFailedEventSchema = BaseEventSchema.extend({
 /**
  * Event created when a step fails and will be retried.
  * Sets the step status back to 'pending' and records the error.
- * The error is stored in step.lastKnownError for debugging.
+ * The error is stored in step.error for debugging.
  */
 const StepRetryingEventSchema = BaseEventSchema.extend({
   eventType: z.literal('step_retrying'),
diff --git a/packages/world/src/steps.ts b/packages/world/src/steps.ts
index 84bc9fd23..56749fe4e 100644
--- a/packages/world/src/steps.ts
+++ b/packages/world/src/steps.ts
@@ -25,11 +25,11 @@ export const StepSchema = z.object({
   input: z.array(z.any()),
   output: z.any().optional(),
   /**
-   * The last known error from a step_retrying or step_failed event.
+   * The error from a step_retrying or step_failed event.
    * This tracks the most recent error the step encountered, which may
    * be from a retry attempt (step_retrying) or the final failure (step_failed).
    */
-  lastKnownError: StructuredErrorSchema.optional(),
+  error: StructuredErrorSchema.optional(),
   attempt: z.number(),
   /**
    * When the step first started executing. Set by the first step_started event
@@ -57,7 +57,7 @@ export interface UpdateStepRequest {
   attempt?: number;
   status?: StepStatus;
   output?: SerializedData;
-  lastKnownError?: StructuredError;
+  error?: StructuredError;
   retryAfter?: Date;
 }
 

From 88e61fd7c88a12a60c454c068460a5fc7a6368e7 Mon Sep 17 00:00:00 2001
From: Pranay Prakash <pranay.gp@gmail.com>
Date: Tue, 23 Dec 2025 19:31:39 -0800
Subject: [PATCH 16/27] Add terminal state validation and comprehensive event
 lifecycle tests
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

- Implement terminal state validation in world-local storage:
  - Reject modifications to completed/failed steps
  - Reject state transitions on terminal runs (completed/failed/cancelled)
  - Allow completing/failing in-progress steps on terminal runs
  - Reject creating new entities on terminal runs
  - Support idempotent run_cancelled on already cancelled runs
  - Validate entity existence before step/hook update events

- Add comprehensive test suites to world-local and world-postgres:
  - Step terminal state validation (6 tests)
  - Run terminal state validation (9 tests)
  - Allowed operations on terminal runs (3 tests)
  - Disallowed operations on terminal runs (7 tests)
  - Idempotent operations (1 test)
  - step_retrying event handling (4 tests)
  - Run cancellation with in-flight entities (3 tests)
  - Event ordering validation (6 tests)

- Update existing tests to follow proper event ordering (create steps
  before step events)

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
---
 packages/world-local/src/storage.test.ts     | 916 ++++++++++++++++++-
 packages/world-local/src/storage.ts          | 141 +++
 packages/world-postgres/test/storage.test.ts | 759 +++++++++++++++
 3 files changed, 1793 insertions(+), 23 deletions(-)

diff --git a/packages/world-local/src/storage.test.ts b/packages/world-local/src/storage.test.ts
index 7dddaa72c..1bdcd3f56 100644
--- a/packages/world-local/src/storage.test.ts
+++ b/packages/world-local/src/storage.test.ts
@@ -751,6 +751,13 @@ describe('Storage', () => {
 
     describe('create', () => {
       it('should create a new event', async () => {
+        // Create step first (required for step events)
+        await createStep(storage, testRunId, {
+          stepId: 'corr_123',
+          stepName: 'test-step',
+          input: [],
+        });
+
         const eventData = {
           eventType: 'step_started' as const,
           correlationId: 'corr_123',
@@ -799,6 +806,15 @@ describe('Storage', () => {
         // Small delay to ensure different timestamps in event IDs
         await new Promise((resolve) => setTimeout(resolve, 2));
 
+        // Create the step first (required for step events)
+        await createStep(storage, testRunId, {
+          stepId: 'corr_step_1',
+          stepName: 'test-step',
+          input: [],
+        });
+
+        await new Promise((resolve) => setTimeout(resolve, 2));
+
         const { event: event2 } = await storage.events.create(testRunId, {
           eventType: 'step_started' as const,
           correlationId: 'corr_step_1',
@@ -809,14 +825,15 @@ describe('Storage', () => {
           pagination: { sortOrder: 'asc' }, // Explicitly request ascending order
         });
 
-        // 3 events: run_created (from createRun), workflow_started, step_started
-        expect(result.data).toHaveLength(3);
+        // 4 events: run_created (from createRun), workflow_started, step_created, step_started
+        expect(result.data).toHaveLength(4);
         // Should be in chronological order (oldest first)
         expect(result.data[0].eventType).toBe('run_created');
         expect(result.data[1].eventId).toBe(event1.eventId);
-        expect(result.data[2].eventId).toBe(event2.eventId);
-        expect(result.data[2].createdAt.getTime()).toBeGreaterThanOrEqual(
-          result.data[1].createdAt.getTime()
+        expect(result.data[2].eventType).toBe('step_created');
+        expect(result.data[3].eventId).toBe(event2.eventId);
+        expect(result.data[3].createdAt.getTime()).toBeGreaterThanOrEqual(
+          result.data[2].createdAt.getTime()
         );
       });
 
@@ -829,6 +846,15 @@ describe('Storage', () => {
         // Small delay to ensure different timestamps in event IDs
         await new Promise((resolve) => setTimeout(resolve, 2));
 
+        // Create the step first (required for step events)
+        await createStep(storage, testRunId, {
+          stepId: 'corr_step_1',
+          stepName: 'test-step',
+          input: [],
+        });
+
+        await new Promise((resolve) => setTimeout(resolve, 2));
+
         const { event: event2 } = await storage.events.create(testRunId, {
           eventType: 'step_started' as const,
           correlationId: 'corr_step_1',
@@ -839,20 +865,26 @@ describe('Storage', () => {
           pagination: { sortOrder: 'desc' },
         });
 
-        // 3 events: run_created (from createRun), workflow_started, step_started
-        expect(result.data).toHaveLength(3);
+        // 4 events: run_created (from createRun), workflow_started, step_created, step_started
+        expect(result.data).toHaveLength(4);
         // Should be in reverse chronological order (newest first)
         expect(result.data[0].eventId).toBe(event2.eventId);
-        expect(result.data[1].eventId).toBe(event1.eventId);
-        expect(result.data[2].eventType).toBe('run_created');
+        expect(result.data[1].eventType).toBe('step_created');
+        expect(result.data[2].eventId).toBe(event1.eventId);
+        expect(result.data[3].eventType).toBe('run_created');
         expect(result.data[0].createdAt.getTime()).toBeGreaterThanOrEqual(
           result.data[1].createdAt.getTime()
         );
       });
 
       it('should support pagination', async () => {
-        // Create multiple events
+        // Create steps first, then create step_completed events
         for (let i = 0; i < 5; i++) {
+          await createStep(storage, testRunId, {
+            stepId: `corr_${i}`,
+            stepName: `step-${i}`,
+            input: [],
+          });
           await storage.events.create(testRunId, {
             eventType: 'step_completed' as const,
             correlationId: `corr_${i}`,
@@ -882,6 +914,20 @@ describe('Storage', () => {
       it('should list all events with a specific correlation ID', async () => {
         const correlationId = 'step-abc123';
 
+        // Create the step first (required for step events)
+        await createStep(storage, testRunId, {
+          stepId: correlationId,
+          stepName: 'test-step',
+          input: [],
+        });
+
+        // Create step for the different correlation ID too
+        await createStep(storage, testRunId, {
+          stepId: 'different-step',
+          stepName: 'different-step',
+          input: [],
+        });
+
         // Create events with the target correlation ID
         const { event: event1 } = await storage.events.create(testRunId, {
           eventType: 'step_started' as const,
@@ -910,11 +956,15 @@ describe('Storage', () => {
           pagination: {},
         });
 
-        expect(result.data).toHaveLength(2);
-        expect(result.data[0].eventId).toBe(event1.eventId);
+        // step_created + step_started + step_completed = 3 events
+        expect(result.data).toHaveLength(3);
+        // First event is step_created from createStep
+        expect(result.data[0].eventType).toBe('step_created');
         expect(result.data[0].correlationId).toBe(correlationId);
-        expect(result.data[1].eventId).toBe(event2.eventId);
+        expect(result.data[1].eventId).toBe(event1.eventId);
         expect(result.data[1].correlationId).toBe(correlationId);
+        expect(result.data[2].eventId).toBe(event2.eventId);
+        expect(result.data[2].correlationId).toBe(correlationId);
       });
 
       it('should list events across multiple runs with same correlation ID', async () => {
@@ -964,6 +1014,13 @@ describe('Storage', () => {
       });
 
       it('should return empty list for non-existent correlation ID', async () => {
+        // Create the step first (required for step events)
+        await createStep(storage, testRunId, {
+          stepId: 'existing-step',
+          stepName: 'existing-step',
+          input: [],
+        });
+
         await storage.events.create(testRunId, {
           eventType: 'step_started' as const,
           correlationId: 'existing-step',
@@ -982,6 +1039,13 @@ describe('Storage', () => {
       it('should respect pagination parameters', async () => {
         const correlationId = 'step-paginated';
 
+        // Create the step first (required for step events)
+        await createStep(storage, testRunId, {
+          stepId: correlationId,
+          stepName: 'test-step',
+          input: [],
+        });
+
         // Create multiple events
         await storage.events.create(testRunId, {
           eventType: 'step_started' as const,
@@ -993,7 +1057,14 @@ describe('Storage', () => {
         await storage.events.create(testRunId, {
           eventType: 'step_retrying' as const,
           correlationId,
-          eventData: { attempt: 1 },
+          eventData: { error: 'retry error' },
+        });
+
+        await new Promise((resolve) => setTimeout(resolve, 2));
+
+        await storage.events.create(testRunId, {
+          eventType: 'step_started' as const,
+          correlationId,
         });
 
         await new Promise((resolve) => setTimeout(resolve, 2));
@@ -1004,7 +1075,7 @@ describe('Storage', () => {
           eventData: { result: 'success' },
         });
 
-        // Get first page
+        // Get first page (step_created + step_started = 2)
         const page1 = await storage.events.listByCorrelationId({
           correlationId,
           pagination: { limit: 2 },
@@ -1014,19 +1085,26 @@ describe('Storage', () => {
         expect(page1.hasMore).toBe(true);
         expect(page1.cursor).toBeDefined();
 
-        // Get second page
+        // Get second page (step_retrying + step_started + step_completed = 3)
         const page2 = await storage.events.listByCorrelationId({
           correlationId,
-          pagination: { limit: 2, cursor: page1.cursor || undefined },
+          pagination: { limit: 3, cursor: page1.cursor || undefined },
         });
 
-        expect(page2.data).toHaveLength(1);
+        expect(page2.data).toHaveLength(3);
         expect(page2.hasMore).toBe(false);
       });
 
       it('should filter event data when resolveData is "none"', async () => {
         const correlationId = 'step-with-data';
 
+        // Create the step first (required for step events)
+        await createStep(storage, testRunId, {
+          stepId: correlationId,
+          stepName: 'test-step',
+          input: [],
+        });
+
         await storage.events.create(testRunId, {
           eventType: 'step_completed' as const,
           correlationId,
@@ -1039,14 +1117,25 @@ describe('Storage', () => {
           resolveData: 'none',
         });
 
-        expect(result.data).toHaveLength(1);
+        // step_created + step_completed = 2 events
+        expect(result.data).toHaveLength(2);
         expect((result.data[0] as any).eventData).toBeUndefined();
+        expect((result.data[1] as any).eventData).toBeUndefined();
         expect(result.data[0].correlationId).toBe(correlationId);
       });
 
       it('should return events in ascending order by default', async () => {
         const correlationId = 'step-ordering';
 
+        // Create the step first (required for step events)
+        await createStep(storage, testRunId, {
+          stepId: correlationId,
+          stepName: 'test-step',
+          input: [],
+        });
+
+        await new Promise((resolve) => setTimeout(resolve, 2));
+
         // Create events with slight delays to ensure different timestamps
         const { event: event1 } = await storage.events.create(testRunId, {
           eventType: 'step_started' as const,
@@ -1066,9 +1155,12 @@ describe('Storage', () => {
           pagination: {},
         });
 
-        expect(result.data).toHaveLength(2);
-        expect(result.data[0].eventId).toBe(event1.eventId);
-        expect(result.data[1].eventId).toBe(event2.eventId);
+        // step_created + step_started + step_completed = 3 events
+        expect(result.data).toHaveLength(3);
+        // Verify order: step_created, step_started, step_completed
+        expect(result.data[0].eventType).toBe('step_created');
+        expect(result.data[1].eventId).toBe(event1.eventId);
+        expect(result.data[2].eventId).toBe(event2.eventId);
         expect(result.data[0].createdAt.getTime()).toBeLessThanOrEqual(
           result.data[1].createdAt.getTime()
         );
@@ -1077,6 +1169,15 @@ describe('Storage', () => {
       it('should support descending order', async () => {
         const correlationId = 'step-desc-order';
 
+        // Create the step first (required for step events)
+        await createStep(storage, testRunId, {
+          stepId: correlationId,
+          stepName: 'test-step',
+          input: [],
+        });
+
+        await new Promise((resolve) => setTimeout(resolve, 2));
+
         const { event: event1 } = await storage.events.create(testRunId, {
           eventType: 'step_started' as const,
           correlationId,
@@ -1095,9 +1196,12 @@ describe('Storage', () => {
           pagination: { sortOrder: 'desc' },
         });
 
-        expect(result.data).toHaveLength(2);
+        // step_created + step_started + step_completed = 3 events
+        expect(result.data).toHaveLength(3);
+        // Verify order: step_completed, step_started, step_created (descending)
         expect(result.data[0].eventId).toBe(event2.eventId);
         expect(result.data[1].eventId).toBe(event1.eventId);
+        expect(result.data[2].eventType).toBe('step_created');
         expect(result.data[0].createdAt.getTime()).toBeGreaterThanOrEqual(
           result.data[1].createdAt.getTime()
         );
@@ -1496,4 +1600,770 @@ describe('Storage', () => {
       });
     });
   });
+
+  describe('step terminal state validation', () => {
+    let testRunId: string;
+
+    beforeEach(async () => {
+      const run = await createRun(storage, {
+        deploymentId: 'deployment-123',
+        workflowName: 'test-workflow',
+        input: [],
+      });
+      testRunId = run.runId;
+    });
+
+    describe('completed step', () => {
+      it('should reject step_started on completed step', async () => {
+        await createStep(storage, testRunId, {
+          stepId: 'step_terminal_1',
+          stepName: 'test-step',
+          input: [],
+        });
+        await updateStep(
+          storage,
+          testRunId,
+          'step_terminal_1',
+          'step_completed',
+          {
+            result: 'done',
+          }
+        );
+
+        await expect(
+          updateStep(storage, testRunId, 'step_terminal_1', 'step_started')
+        ).rejects.toThrow(/terminal/i);
+      });
+
+      it('should reject step_completed on already completed step', async () => {
+        await createStep(storage, testRunId, {
+          stepId: 'step_terminal_2',
+          stepName: 'test-step',
+          input: [],
+        });
+        await updateStep(
+          storage,
+          testRunId,
+          'step_terminal_2',
+          'step_completed',
+          {
+            result: 'done',
+          }
+        );
+
+        await expect(
+          updateStep(storage, testRunId, 'step_terminal_2', 'step_completed', {
+            result: 'done again',
+          })
+        ).rejects.toThrow(/terminal/i);
+      });
+
+      it('should reject step_failed on completed step', async () => {
+        await createStep(storage, testRunId, {
+          stepId: 'step_terminal_3',
+          stepName: 'test-step',
+          input: [],
+        });
+        await updateStep(
+          storage,
+          testRunId,
+          'step_terminal_3',
+          'step_completed',
+          {
+            result: 'done',
+          }
+        );
+
+        await expect(
+          updateStep(storage, testRunId, 'step_terminal_3', 'step_failed', {
+            error: 'Should not work',
+          })
+        ).rejects.toThrow(/terminal/i);
+      });
+    });
+
+    describe('failed step', () => {
+      it('should reject step_started on failed step', async () => {
+        await createStep(storage, testRunId, {
+          stepId: 'step_failed_1',
+          stepName: 'test-step',
+          input: [],
+        });
+        await updateStep(storage, testRunId, 'step_failed_1', 'step_failed', {
+          error: 'Failed permanently',
+        });
+
+        await expect(
+          updateStep(storage, testRunId, 'step_failed_1', 'step_started')
+        ).rejects.toThrow(/terminal/i);
+      });
+
+      it('should reject step_completed on failed step', async () => {
+        await createStep(storage, testRunId, {
+          stepId: 'step_failed_2',
+          stepName: 'test-step',
+          input: [],
+        });
+        await updateStep(storage, testRunId, 'step_failed_2', 'step_failed', {
+          error: 'Failed permanently',
+        });
+
+        await expect(
+          updateStep(storage, testRunId, 'step_failed_2', 'step_completed', {
+            result: 'Should not work',
+          })
+        ).rejects.toThrow(/terminal/i);
+      });
+
+      it('should reject step_failed on already failed step', async () => {
+        await createStep(storage, testRunId, {
+          stepId: 'step_failed_3',
+          stepName: 'test-step',
+          input: [],
+        });
+        await updateStep(storage, testRunId, 'step_failed_3', 'step_failed', {
+          error: 'Failed once',
+        });
+
+        await expect(
+          updateStep(storage, testRunId, 'step_failed_3', 'step_failed', {
+            error: 'Failed again',
+          })
+        ).rejects.toThrow(/terminal/i);
+      });
+    });
+  });
+
+  describe('run terminal state validation', () => {
+    describe('completed run', () => {
+      it('should reject run_started on completed run', async () => {
+        const run = await createRun(storage, {
+          deploymentId: 'deployment-123',
+          workflowName: 'test-workflow',
+          input: [],
+        });
+        await updateRun(storage, run.runId, 'run_completed', {
+          output: 'done',
+        });
+
+        await expect(
+          updateRun(storage, run.runId, 'run_started')
+        ).rejects.toThrow(/terminal/i);
+      });
+
+      it('should reject run_failed on completed run', async () => {
+        const run = await createRun(storage, {
+          deploymentId: 'deployment-123',
+          workflowName: 'test-workflow',
+          input: [],
+        });
+        await updateRun(storage, run.runId, 'run_completed', {
+          output: 'done',
+        });
+
+        await expect(
+          updateRun(storage, run.runId, 'run_failed', {
+            error: 'Should not work',
+          })
+        ).rejects.toThrow(/terminal/i);
+      });
+
+      it('should reject run_cancelled on completed run', async () => {
+        const run = await createRun(storage, {
+          deploymentId: 'deployment-123',
+          workflowName: 'test-workflow',
+          input: [],
+        });
+        await updateRun(storage, run.runId, 'run_completed', {
+          output: 'done',
+        });
+
+        await expect(
+          storage.events.create(run.runId, { eventType: 'run_cancelled' })
+        ).rejects.toThrow(/terminal/i);
+      });
+    });
+
+    describe('failed run', () => {
+      it('should reject run_started on failed run', async () => {
+        const run = await createRun(storage, {
+          deploymentId: 'deployment-123',
+          workflowName: 'test-workflow',
+          input: [],
+        });
+        await updateRun(storage, run.runId, 'run_failed', { error: 'Failed' });
+
+        await expect(
+          updateRun(storage, run.runId, 'run_started')
+        ).rejects.toThrow(/terminal/i);
+      });
+
+      it('should reject run_completed on failed run', async () => {
+        const run = await createRun(storage, {
+          deploymentId: 'deployment-123',
+          workflowName: 'test-workflow',
+          input: [],
+        });
+        await updateRun(storage, run.runId, 'run_failed', { error: 'Failed' });
+
+        await expect(
+          updateRun(storage, run.runId, 'run_completed', {
+            output: 'Should not work',
+          })
+        ).rejects.toThrow(/terminal/i);
+      });
+
+      it('should reject run_cancelled on failed run', async () => {
+        const run = await createRun(storage, {
+          deploymentId: 'deployment-123',
+          workflowName: 'test-workflow',
+          input: [],
+        });
+        await updateRun(storage, run.runId, 'run_failed', { error: 'Failed' });
+
+        await expect(
+          storage.events.create(run.runId, { eventType: 'run_cancelled' })
+        ).rejects.toThrow(/terminal/i);
+      });
+    });
+
+    describe('cancelled run', () => {
+      it('should reject run_started on cancelled run', async () => {
+        const run = await createRun(storage, {
+          deploymentId: 'deployment-123',
+          workflowName: 'test-workflow',
+          input: [],
+        });
+        await storage.events.create(run.runId, { eventType: 'run_cancelled' });
+
+        await expect(
+          updateRun(storage, run.runId, 'run_started')
+        ).rejects.toThrow(/terminal/i);
+      });
+
+      it('should reject run_completed on cancelled run', async () => {
+        const run = await createRun(storage, {
+          deploymentId: 'deployment-123',
+          workflowName: 'test-workflow',
+          input: [],
+        });
+        await storage.events.create(run.runId, { eventType: 'run_cancelled' });
+
+        await expect(
+          updateRun(storage, run.runId, 'run_completed', {
+            output: 'Should not work',
+          })
+        ).rejects.toThrow(/terminal/i);
+      });
+
+      it('should reject run_failed on cancelled run', async () => {
+        const run = await createRun(storage, {
+          deploymentId: 'deployment-123',
+          workflowName: 'test-workflow',
+          input: [],
+        });
+        await storage.events.create(run.runId, { eventType: 'run_cancelled' });
+
+        await expect(
+          updateRun(storage, run.runId, 'run_failed', {
+            error: 'Should not work',
+          })
+        ).rejects.toThrow(/terminal/i);
+      });
+    });
+  });
+
+  describe('allowed operations on terminal runs', () => {
+    it('should allow step_completed on completed run for in-progress step', async () => {
+      const run = await createRun(storage, {
+        deploymentId: 'deployment-123',
+        workflowName: 'test-workflow',
+        input: [],
+      });
+
+      // Create and start a step (making it in-progress)
+      await createStep(storage, run.runId, {
+        stepId: 'step_in_progress',
+        stepName: 'test-step',
+        input: [],
+      });
+      await updateStep(storage, run.runId, 'step_in_progress', 'step_started');
+
+      // Complete the run while step is still running
+      await updateRun(storage, run.runId, 'run_completed', { output: 'done' });
+
+      // Should succeed - completing an in-progress step on a terminal run is allowed
+      const result = await updateStep(
+        storage,
+        run.runId,
+        'step_in_progress',
+        'step_completed',
+        { result: 'step done' }
+      );
+      expect(result.status).toBe('completed');
+    });
+
+    it('should allow step_failed on completed run for in-progress step', async () => {
+      const run = await createRun(storage, {
+        deploymentId: 'deployment-123',
+        workflowName: 'test-workflow',
+        input: [],
+      });
+
+      // Create and start a step
+      await createStep(storage, run.runId, {
+        stepId: 'step_in_progress_fail',
+        stepName: 'test-step',
+        input: [],
+      });
+      await updateStep(
+        storage,
+        run.runId,
+        'step_in_progress_fail',
+        'step_started'
+      );
+
+      // Complete the run
+      await updateRun(storage, run.runId, 'run_completed', { output: 'done' });
+
+      // Should succeed - failing an in-progress step on a terminal run is allowed
+      const result = await updateStep(
+        storage,
+        run.runId,
+        'step_in_progress_fail',
+        'step_failed',
+        { error: 'step failed' }
+      );
+      expect(result.status).toBe('failed');
+    });
+
+    it('should auto-delete hooks when run completes (world-local specific behavior)', async () => {
+      const run = await createRun(storage, {
+        deploymentId: 'deployment-123',
+        workflowName: 'test-workflow',
+        input: [],
+      });
+
+      // Create a hook
+      await createHook(storage, run.runId, {
+        hookId: 'hook_auto_delete',
+        token: 'test-token-auto-delete',
+      });
+
+      // Verify hook exists before completion
+      const hookBefore = await storage.hooks.get('hook_auto_delete');
+      expect(hookBefore).toBeDefined();
+
+      // Complete the run - this auto-deletes hooks in world-local
+      await updateRun(storage, run.runId, 'run_completed', { output: 'done' });
+
+      // Hook should be auto-deleted
+      await expect(storage.hooks.get('hook_auto_delete')).rejects.toThrow(
+        /not found/i
+      );
+    });
+  });
+
+  describe('disallowed operations on terminal runs', () => {
+    it('should reject step_created on completed run', async () => {
+      const run = await createRun(storage, {
+        deploymentId: 'deployment-123',
+        workflowName: 'test-workflow',
+        input: [],
+      });
+      await updateRun(storage, run.runId, 'run_completed', { output: 'done' });
+
+      await expect(
+        createStep(storage, run.runId, {
+          stepId: 'new_step',
+          stepName: 'test-step',
+          input: [],
+        })
+      ).rejects.toThrow(/terminal/i);
+    });
+
+    it('should reject step_started on completed run for pending step', async () => {
+      const run = await createRun(storage, {
+        deploymentId: 'deployment-123',
+        workflowName: 'test-workflow',
+        input: [],
+      });
+
+      // Create a step but don't start it
+      await createStep(storage, run.runId, {
+        stepId: 'pending_step',
+        stepName: 'test-step',
+        input: [],
+      });
+
+      // Complete the run
+      await updateRun(storage, run.runId, 'run_completed', { output: 'done' });
+
+      // Should reject - cannot start a pending step on a terminal run
+      await expect(
+        updateStep(storage, run.runId, 'pending_step', 'step_started')
+      ).rejects.toThrow(/terminal/i);
+    });
+
+    it('should reject hook_created on completed run', async () => {
+      const run = await createRun(storage, {
+        deploymentId: 'deployment-123',
+        workflowName: 'test-workflow',
+        input: [],
+      });
+      await updateRun(storage, run.runId, 'run_completed', { output: 'done' });
+
+      await expect(
+        createHook(storage, run.runId, {
+          hookId: 'new_hook',
+          token: 'new-token',
+        })
+      ).rejects.toThrow(/terminal/i);
+    });
+
+    it('should reject step_created on failed run', async () => {
+      const run = await createRun(storage, {
+        deploymentId: 'deployment-123',
+        workflowName: 'test-workflow',
+        input: [],
+      });
+      await updateRun(storage, run.runId, 'run_failed', { error: 'Failed' });
+
+      await expect(
+        createStep(storage, run.runId, {
+          stepId: 'new_step_failed',
+          stepName: 'test-step',
+          input: [],
+        })
+      ).rejects.toThrow(/terminal/i);
+    });
+
+    it('should reject step_created on cancelled run', async () => {
+      const run = await createRun(storage, {
+        deploymentId: 'deployment-123',
+        workflowName: 'test-workflow',
+        input: [],
+      });
+      await storage.events.create(run.runId, { eventType: 'run_cancelled' });
+
+      await expect(
+        createStep(storage, run.runId, {
+          stepId: 'new_step_cancelled',
+          stepName: 'test-step',
+          input: [],
+        })
+      ).rejects.toThrow(/terminal/i);
+    });
+
+    it('should reject hook_created on failed run', async () => {
+      const run = await createRun(storage, {
+        deploymentId: 'deployment-123',
+        workflowName: 'test-workflow',
+        input: [],
+      });
+      await updateRun(storage, run.runId, 'run_failed', { error: 'Failed' });
+
+      await expect(
+        createHook(storage, run.runId, {
+          hookId: 'new_hook_failed',
+          token: 'new-token-failed',
+        })
+      ).rejects.toThrow(/terminal/i);
+    });
+
+    it('should reject hook_created on cancelled run', async () => {
+      const run = await createRun(storage, {
+        deploymentId: 'deployment-123',
+        workflowName: 'test-workflow',
+        input: [],
+      });
+      await storage.events.create(run.runId, { eventType: 'run_cancelled' });
+
+      await expect(
+        createHook(storage, run.runId, {
+          hookId: 'new_hook_cancelled',
+          token: 'new-token-cancelled',
+        })
+      ).rejects.toThrow(/terminal/i);
+    });
+  });
+
+  describe('idempotent operations', () => {
+    it('should allow run_cancelled on already cancelled run (idempotent)', async () => {
+      const run = await createRun(storage, {
+        deploymentId: 'deployment-123',
+        workflowName: 'test-workflow',
+        input: [],
+      });
+      await storage.events.create(run.runId, { eventType: 'run_cancelled' });
+
+      // Should succeed - idempotent operation
+      const result = await storage.events.create(run.runId, {
+        eventType: 'run_cancelled',
+      });
+      expect(result.run?.status).toBe('cancelled');
+    });
+  });
+
+  describe('step_retrying event handling', () => {
+    let testRunId: string;
+
+    beforeEach(async () => {
+      const run = await createRun(storage, {
+        deploymentId: 'deployment-123',
+        workflowName: 'test-workflow',
+        input: [],
+      });
+      testRunId = run.runId;
+    });
+
+    it('should set step status to pending and record error', async () => {
+      await createStep(storage, testRunId, {
+        stepId: 'step_retry_1',
+        stepName: 'test-step',
+        input: [],
+      });
+      await updateStep(storage, testRunId, 'step_retry_1', 'step_started');
+
+      const result = await storage.events.create(testRunId, {
+        eventType: 'step_retrying',
+        correlationId: 'step_retry_1',
+        eventData: {
+          error: 'Temporary failure',
+          retryAfter: new Date(Date.now() + 5000),
+        },
+      });
+
+      expect(result.step?.status).toBe('pending');
+      expect(result.step?.error?.message).toBe('Temporary failure');
+      expect(result.step?.retryAfter).toBeInstanceOf(Date);
+    });
+
+    it('should increment attempt when step_started is called after step_retrying', async () => {
+      await createStep(storage, testRunId, {
+        stepId: 'step_retry_2',
+        stepName: 'test-step',
+        input: [],
+      });
+
+      // First attempt
+      const started1 = await updateStep(
+        storage,
+        testRunId,
+        'step_retry_2',
+        'step_started'
+      );
+      expect(started1.attempt).toBe(1);
+
+      // Retry
+      await storage.events.create(testRunId, {
+        eventType: 'step_retrying',
+        correlationId: 'step_retry_2',
+        eventData: { error: 'Temporary failure' },
+      });
+
+      // Second attempt
+      const started2 = await updateStep(
+        storage,
+        testRunId,
+        'step_retry_2',
+        'step_started'
+      );
+      expect(started2.attempt).toBe(2);
+    });
+
+    it('should reject step_retrying on completed step', async () => {
+      await createStep(storage, testRunId, {
+        stepId: 'step_retry_completed',
+        stepName: 'test-step',
+        input: [],
+      });
+      await updateStep(
+        storage,
+        testRunId,
+        'step_retry_completed',
+        'step_completed',
+        {
+          result: 'done',
+        }
+      );
+
+      await expect(
+        storage.events.create(testRunId, {
+          eventType: 'step_retrying',
+          correlationId: 'step_retry_completed',
+          eventData: { error: 'Should not work' },
+        })
+      ).rejects.toThrow(/terminal/i);
+    });
+
+    it('should reject step_retrying on failed step', async () => {
+      await createStep(storage, testRunId, {
+        stepId: 'step_retry_failed',
+        stepName: 'test-step',
+        input: [],
+      });
+      await updateStep(storage, testRunId, 'step_retry_failed', 'step_failed', {
+        error: 'Permanent failure',
+      });
+
+      await expect(
+        storage.events.create(testRunId, {
+          eventType: 'step_retrying',
+          correlationId: 'step_retry_failed',
+          eventData: { error: 'Should not work' },
+        })
+      ).rejects.toThrow(/terminal/i);
+    });
+  });
+
+  describe('run cancellation with in-flight entities', () => {
+    it('should allow in-progress step to complete after run cancelled', async () => {
+      const run = await createRun(storage, {
+        deploymentId: 'deployment-123',
+        workflowName: 'test-workflow',
+        input: [],
+      });
+
+      // Create and start a step
+      await createStep(storage, run.runId, {
+        stepId: 'step_in_flight',
+        stepName: 'test-step',
+        input: [],
+      });
+      await updateStep(storage, run.runId, 'step_in_flight', 'step_started');
+
+      // Cancel the run
+      await storage.events.create(run.runId, { eventType: 'run_cancelled' });
+
+      // Should succeed - completing an in-progress step is allowed
+      const result = await updateStep(
+        storage,
+        run.runId,
+        'step_in_flight',
+        'step_completed',
+        { result: 'done' }
+      );
+      expect(result.status).toBe('completed');
+    });
+
+    it('should reject step_created after run cancelled', async () => {
+      const run = await createRun(storage, {
+        deploymentId: 'deployment-123',
+        workflowName: 'test-workflow',
+        input: [],
+      });
+      await storage.events.create(run.runId, { eventType: 'run_cancelled' });
+
+      await expect(
+        createStep(storage, run.runId, {
+          stepId: 'new_step_after_cancel',
+          stepName: 'test-step',
+          input: [],
+        })
+      ).rejects.toThrow(/terminal/i);
+    });
+
+    it('should reject step_started for pending step after run cancelled', async () => {
+      const run = await createRun(storage, {
+        deploymentId: 'deployment-123',
+        workflowName: 'test-workflow',
+        input: [],
+      });
+
+      // Create a step but don't start it
+      await createStep(storage, run.runId, {
+        stepId: 'pending_after_cancel',
+        stepName: 'test-step',
+        input: [],
+      });
+
+      // Cancel the run
+      await storage.events.create(run.runId, { eventType: 'run_cancelled' });
+
+      // Should reject - cannot start a pending step on a cancelled run
+      await expect(
+        updateStep(storage, run.runId, 'pending_after_cancel', 'step_started')
+      ).rejects.toThrow(/terminal/i);
+    });
+  });
+
+  describe('event ordering validation', () => {
+    let testRunId: string;
+
+    beforeEach(async () => {
+      const run = await createRun(storage, {
+        deploymentId: 'deployment-123',
+        workflowName: 'test-workflow',
+        input: [],
+      });
+      testRunId = run.runId;
+    });
+
+    it('should reject step_completed before step_created', async () => {
+      await expect(
+        storage.events.create(testRunId, {
+          eventType: 'step_completed',
+          correlationId: 'nonexistent_step',
+          eventData: { result: 'done' },
+        })
+      ).rejects.toThrow(/not found/i);
+    });
+
+    it('should reject step_started before step_created', async () => {
+      await expect(
+        storage.events.create(testRunId, {
+          eventType: 'step_started',
+          correlationId: 'nonexistent_step_started',
+        })
+      ).rejects.toThrow(/not found/i);
+    });
+
+    it('should reject step_failed before step_created', async () => {
+      await expect(
+        storage.events.create(testRunId, {
+          eventType: 'step_failed',
+          correlationId: 'nonexistent_step_failed',
+          eventData: { error: 'Failed' },
+        })
+      ).rejects.toThrow(/not found/i);
+    });
+
+    it('should allow step_completed without step_started (instant completion)', async () => {
+      await createStep(storage, testRunId, {
+        stepId: 'instant_complete',
+        stepName: 'test-step',
+        input: [],
+      });
+
+      // Should succeed - instant completion without starting
+      const result = await updateStep(
+        storage,
+        testRunId,
+        'instant_complete',
+        'step_completed',
+        { result: 'instant' }
+      );
+      expect(result.status).toBe('completed');
+    });
+
+    it('should reject hook_disposed before hook_created', async () => {
+      await expect(
+        storage.events.create(testRunId, {
+          eventType: 'hook_disposed',
+          correlationId: 'nonexistent_hook',
+        })
+      ).rejects.toThrow(/not found/i);
+    });
+
+    it('should reject hook_received before hook_created', async () => {
+      await expect(
+        storage.events.create(testRunId, {
+          eventType: 'hook_received',
+          correlationId: 'nonexistent_hook_received',
+          eventData: { payload: {} },
+        })
+      ).rejects.toThrow(/not found/i);
+    });
+  });
 });
diff --git a/packages/world-local/src/storage.ts b/packages/world-local/src/storage.ts
index fcb7941c4..8cf201deb 100644
--- a/packages/world-local/src/storage.ts
+++ b/packages/world-local/src/storage.ts
@@ -319,6 +319,147 @@ export function createStorage(basedir: string): Storage {
           effectiveRunId = runId;
         }
 
+        // Helper to check if run is in terminal state
+        const isRunTerminal = (status: string) =>
+          ['completed', 'failed', 'cancelled'].includes(status);
+
+        // Helper to check if step is in terminal state
+        const isStepTerminal = (status: string) =>
+          ['completed', 'failed'].includes(status);
+
+        // Get current run state for validation (if not creating a new run)
+        let currentRun: WorkflowRun | null = null;
+        if (data.eventType !== 'run_created') {
+          const runPath = path.join(basedir, 'runs', `${effectiveRunId}.json`);
+          currentRun = await readJSON(runPath, WorkflowRunSchema);
+        }
+
+        // ============================================================
+        // VALIDATION: Terminal state and event ordering checks
+        // ============================================================
+
+        // Run terminal state validation
+        if (currentRun && isRunTerminal(currentRun.status)) {
+          const runTerminalEvents = [
+            'run_started',
+            'run_completed',
+            'run_failed',
+          ];
+
+          // Idempotent operation: run_cancelled on already cancelled run is allowed
+          if (
+            data.eventType === 'run_cancelled' &&
+            currentRun.status === 'cancelled'
+          ) {
+            // Return existing state (idempotent)
+            const event: Event = {
+              ...data,
+              runId: effectiveRunId,
+              eventId,
+              createdAt: now,
+            };
+            const compositeKey = `${effectiveRunId}-${eventId}`;
+            const eventPath = path.join(
+              basedir,
+              'events',
+              `${compositeKey}.json`
+            );
+            await writeJSON(eventPath, event);
+            const resolveData =
+              params?.resolveData ?? DEFAULT_RESOLVE_DATA_OPTION;
+            return {
+              event: filterEventData(event, resolveData),
+              run: currentRun,
+            };
+          }
+
+          // Run state transitions are not allowed on terminal runs
+          if (
+            runTerminalEvents.includes(data.eventType) ||
+            data.eventType === 'run_cancelled'
+          ) {
+            throw new WorkflowAPIError(
+              `Cannot transition run from terminal state "${currentRun.status}"`,
+              { status: 409 }
+            );
+          }
+
+          // Creating new entities on terminal runs is not allowed
+          if (
+            data.eventType === 'step_created' ||
+            data.eventType === 'hook_created'
+          ) {
+            throw new WorkflowAPIError(
+              `Cannot create new entities on run in terminal state "${currentRun.status}"`,
+              { status: 409 }
+            );
+          }
+        }
+
+        // Step-related event validation (ordering and terminal state)
+        const stepEvents = [
+          'step_started',
+          'step_completed',
+          'step_failed',
+          'step_retrying',
+        ];
+        if (stepEvents.includes(data.eventType) && data.correlationId) {
+          const stepCompositeKey = `${effectiveRunId}-${data.correlationId}`;
+          const stepPath = path.join(
+            basedir,
+            'steps',
+            `${stepCompositeKey}.json`
+          );
+          const existingStep = await readJSON(stepPath, StepSchema);
+
+          // Event ordering: step must exist before these events
+          if (!existingStep) {
+            throw new WorkflowAPIError(
+              `Step "${data.correlationId}" not found`,
+              { status: 404 }
+            );
+          }
+
+          // Step terminal state validation
+          if (isStepTerminal(existingStep.status)) {
+            throw new WorkflowAPIError(
+              `Cannot modify step in terminal state "${existingStep.status}"`,
+              { status: 409 }
+            );
+          }
+
+          // On terminal runs: only allow completing/failing in-progress steps
+          if (currentRun && isRunTerminal(currentRun.status)) {
+            if (existingStep.status !== 'running') {
+              throw new WorkflowAPIError(
+                `Cannot modify non-running step on run in terminal state "${currentRun.status}"`,
+                { status: 409 }
+              );
+            }
+          }
+        }
+
+        // Hook-related event validation (ordering)
+        const hookEventsRequiringExistence = ['hook_disposed', 'hook_received'];
+        if (
+          hookEventsRequiringExistence.includes(data.eventType) &&
+          data.correlationId
+        ) {
+          const hookPath = path.join(
+            basedir,
+            'hooks',
+            `${data.correlationId}.json`
+          );
+          const existingHook = await readJSON(hookPath, HookSchema);
+
+          if (!existingHook) {
+            throw new WorkflowAPIError(
+              `Hook "${data.correlationId}" not found`,
+              { status: 404 }
+            );
+          }
+        }
+
         const event: Event = {
           ...data,
           runId: effectiveRunId,
diff --git a/packages/world-postgres/test/storage.test.ts b/packages/world-postgres/test/storage.test.ts
index fb1d730c0..f35929181 100644
--- a/packages/world-postgres/test/storage.test.ts
+++ b/packages/world-postgres/test/storage.test.ts
@@ -1011,4 +1011,763 @@ describe('Storage (Postgres integration)', () => {
       });
     });
   });
+
+  describe('step terminal state validation', () => {
+    let testRunId: string;
+
+    beforeEach(async () => {
+      const run = await createRun(events, {
+        deploymentId: 'deployment-123',
+        workflowName: 'test-workflow',
+        input: [],
+      });
+      testRunId = run.runId;
+    });
+
+    describe('completed step', () => {
+      it('should reject step_started on completed step', async () => {
+        await createStep(events, testRunId, {
+          stepId: 'step_terminal_1',
+          stepName: 'test-step',
+          input: [],
+        });
+        await updateStep(
+          events,
+          testRunId,
+          'step_terminal_1',
+          'step_completed',
+          {
+            result: 'done',
+          }
+        );
+
+        await expect(
+          updateStep(events, testRunId, 'step_terminal_1', 'step_started')
+        ).rejects.toThrow(/terminal/i);
+      });
+
+      it('should reject step_completed on already completed step', async () => {
+        await createStep(events, testRunId, {
+          stepId: 'step_terminal_2',
+          stepName: 'test-step',
+          input: [],
+        });
+        await updateStep(
+          events,
+          testRunId,
+          'step_terminal_2',
+          'step_completed',
+          {
+            result: 'done',
+          }
+        );
+
+        await expect(
+          updateStep(events, testRunId, 'step_terminal_2', 'step_completed', {
+            result: 'done again',
+          })
+        ).rejects.toThrow(/terminal/i);
+      });
+
+      it('should reject step_failed on completed step', async () => {
+        await createStep(events, testRunId, {
+          stepId: 'step_terminal_3',
+          stepName: 'test-step',
+          input: [],
+        });
+        await updateStep(
+          events,
+          testRunId,
+          'step_terminal_3',
+          'step_completed',
+          {
+            result: 'done',
+          }
+        );
+
+        await expect(
+          updateStep(events, testRunId, 'step_terminal_3', 'step_failed', {
+            error: 'Should not work',
+          })
+        ).rejects.toThrow(/terminal/i);
+      });
+    });
+
+    describe('failed step', () => {
+      it('should reject step_started on failed step', async () => {
+        await createStep(events, testRunId, {
+          stepId: 'step_failed_1',
+          stepName: 'test-step',
+          input: [],
+        });
+        await updateStep(events, testRunId, 'step_failed_1', 'step_failed', {
+          error: 'Failed permanently',
+        });
+
+        await expect(
+          updateStep(events, testRunId, 'step_failed_1', 'step_started')
+        ).rejects.toThrow(/terminal/i);
+      });
+
+      it('should reject step_completed on failed step', async () => {
+        await createStep(events, testRunId, {
+          stepId: 'step_failed_2',
+          stepName: 'test-step',
+          input: [],
+        });
+        await updateStep(events, testRunId, 'step_failed_2', 'step_failed', {
+          error: 'Failed permanently',
+        });
+
+        await expect(
+          updateStep(events, testRunId, 'step_failed_2', 'step_completed', {
+            result: 'Should not work',
+          })
+        ).rejects.toThrow(/terminal/i);
+      });
+
+      it('should reject step_failed on already failed step', async () => {
+        await createStep(events, testRunId, {
+          stepId: 'step_failed_3',
+          stepName: 'test-step',
+          input: [],
+        });
+        await updateStep(events, testRunId, 'step_failed_3', 'step_failed', {
+          error: 'Failed once',
+        });
+
+        await expect(
+          updateStep(events, testRunId, 'step_failed_3', 'step_failed', {
+            error: 'Failed again',
+          })
+        ).rejects.toThrow(/terminal/i);
+      });
+    });
+  });
+
+  describe('run terminal state validation', () => {
+    describe('completed run', () => {
+      it('should reject run_started on completed run', async () => {
+        const run = await createRun(events, {
+          deploymentId: 'deployment-123',
+          workflowName: 'test-workflow',
+          input: [],
+        });
+        await updateRun(events, run.runId, 'run_completed', { output: 'done' });
+
+        await expect(
+          updateRun(events, run.runId, 'run_started')
+        ).rejects.toThrow(/terminal/i);
+      });
+
+      it('should reject run_failed on completed run', async () => {
+        const run = await createRun(events, {
+          deploymentId: 'deployment-123',
+          workflowName: 'test-workflow',
+          input: [],
+        });
+        await updateRun(events, run.runId, 'run_completed', { output: 'done' });
+
+        await expect(
+          updateRun(events, run.runId, 'run_failed', {
+            error: 'Should not work',
+          })
+        ).rejects.toThrow(/terminal/i);
+      });
+
+      it('should reject run_cancelled on completed run', async () => {
+        const run = await createRun(events, {
+          deploymentId: 'deployment-123',
+          workflowName: 'test-workflow',
+          input: [],
+        });
+        await updateRun(events, run.runId, 'run_completed', { output: 'done' });
+
+        await expect(
+          events.create(run.runId, { eventType: 'run_cancelled' })
+        ).rejects.toThrow(/terminal/i);
+      });
+    });
+
+    describe('failed run', () => {
+      it('should reject run_started on failed run', async () => {
+        const run = await createRun(events, {
+          deploymentId: 'deployment-123',
+          workflowName: 'test-workflow',
+          input: [],
+        });
+        await updateRun(events, run.runId, 'run_failed', { error: 'Failed' });
+
+        await expect(
+          updateRun(events, run.runId, 'run_started')
+        ).rejects.toThrow(/terminal/i);
+      });
+
+      it('should reject run_completed on failed run', async () => {
+        const run = await createRun(events, {
+          deploymentId: 'deployment-123',
+          workflowName: 'test-workflow',
+          input: [],
+        });
+        await updateRun(events, run.runId, 'run_failed', { error: 'Failed' });
+
+        await expect(
+          updateRun(events, run.runId, 'run_completed', {
+            output: 'Should not work',
+          })
+        ).rejects.toThrow(/terminal/i);
+      });
+
+      it('should reject run_cancelled on failed run', async () => {
+        const run = await createRun(events, {
+          deploymentId: 'deployment-123',
+          workflowName: 'test-workflow',
+          input: [],
+        });
+        await updateRun(events, run.runId, 'run_failed', { error: 'Failed' });
+
+        await expect(
+          events.create(run.runId, { eventType: 'run_cancelled' })
+        ).rejects.toThrow(/terminal/i);
+      });
+    });
+
+    describe('cancelled run', () => {
+      it('should reject run_started on cancelled run', async () => {
+        const run = await createRun(events, {
+          deploymentId: 'deployment-123',
+          workflowName: 'test-workflow',
+          input: [],
+        });
+        await events.create(run.runId, { eventType: 'run_cancelled' });
+
+        await expect(
+          updateRun(events, run.runId, 'run_started')
+        ).rejects.toThrow(/terminal/i);
+      });
+
+      it('should reject run_completed on cancelled run', async () => {
+        const run = await createRun(events, {
+          deploymentId: 'deployment-123',
+          workflowName: 'test-workflow',
+          input: [],
+        });
+        await events.create(run.runId, { eventType: 'run_cancelled' });
+
+        await expect(
+          updateRun(events, run.runId, 'run_completed', {
+            output: 'Should not work',
+          })
+        ).rejects.toThrow(/terminal/i);
+      });
+
+      it('should reject run_failed on cancelled run', async () => {
+        const run = await createRun(events, {
+          deploymentId: 'deployment-123',
+          workflowName: 'test-workflow',
+          input: [],
+        });
+        await events.create(run.runId, { eventType: 'run_cancelled' });
+
+        await expect(
+          updateRun(events, run.runId, 'run_failed', {
+            error: 'Should not work',
+          })
+        ).rejects.toThrow(/terminal/i);
+      });
+    });
+  });
+
+  describe('allowed operations on terminal runs', () => {
+    it('should allow step_completed on completed run for in-progress step', async () => {
+      const run = await createRun(events, {
+        deploymentId: 'deployment-123',
+        workflowName: 'test-workflow',
+        input: [],
+      });
+
+      // Create and start a step (making it in-progress)
+      await createStep(events, run.runId, {
+        stepId: 'step_in_progress',
+        stepName: 'test-step',
+        input: [],
+      });
+      await updateStep(events, run.runId, 'step_in_progress', 'step_started');
+
+      // Complete the run while step is still running
+      await updateRun(events, run.runId, 'run_completed', { output: 'done' });
+
+      // Should succeed - completing an in-progress step on a terminal run is allowed
+      const result = await updateStep(
+        events,
+        run.runId,
+        'step_in_progress',
+        'step_completed',
+        { result: 'step done' }
+      );
+      expect(result.status).toBe('completed');
+    });
+
+    it('should allow step_failed on completed run for in-progress step', async () => {
+      const run = await createRun(events, {
+        deploymentId: 'deployment-123',
+        workflowName: 'test-workflow',
+        input: [],
+      });
+
+      // Create and start a step
+      await createStep(events, run.runId, {
+        stepId: 'step_in_progress_fail',
+        stepName: 'test-step',
+        input: [],
+      });
+      await updateStep(
+        events,
+        run.runId,
+        'step_in_progress_fail',
+        'step_started'
+      );
+
+      // Complete the run
+      await updateRun(events, run.runId, 'run_completed', { output: 'done' });
+
+      // Should succeed - failing an in-progress step on a terminal run is allowed
+      const result = await updateStep(
+        events,
+        run.runId,
+        'step_in_progress_fail',
+        'step_failed',
+        { error: 'step failed' }
+      );
+      expect(result.status).toBe('failed');
+    });
+
+    it('should allow hook_disposed on completed run', async () => {
+      const run = await createRun(events, {
+        deploymentId: 'deployment-123',
+        workflowName: 'test-workflow',
+        input: [],
+      });
+
+      // Create a hook
+      await createHook(events, run.runId, {
+        hookId: 'hook_to_dispose',
+        token: 'test-token-dispose',
+      });
+
+      // Complete the run
+      await updateRun(events, run.runId, 'run_completed', { output: 'done' });
+
+      // Should succeed - disposing a hook on a terminal run is allowed
+      await expect(
+        events.create(run.runId, {
+          eventType: 'hook_disposed',
+          correlationId: 'hook_to_dispose',
+        })
+      ).resolves.not.toThrow();
+    });
+  });
+
+  describe('disallowed operations on terminal runs', () => {
+    it('should reject step_created on completed run', async () => {
+      const run = await createRun(events, {
+        deploymentId: 'deployment-123',
+        workflowName: 'test-workflow',
+        input: [],
+      });
+      await updateRun(events, run.runId, 'run_completed', { output: 'done' });
+
+      await expect(
+        createStep(events, run.runId, {
+          stepId: 'new_step',
+          stepName: 'test-step',
+          input: [],
+        })
+      ).rejects.toThrow(/terminal/i);
+    });
+
+    it('should reject step_started on completed run for pending step', async () => {
+      const run = await createRun(events, {
+        deploymentId: 'deployment-123',
+        workflowName: 'test-workflow',
+        input: [],
+      });
+
+      // Create a step but don't start it
+      await createStep(events, run.runId, {
+        stepId: 'pending_step',
+        stepName: 'test-step',
+        input: [],
+      });
+
+      // Complete the run
+      await updateRun(events, run.runId, 'run_completed', { output: 'done' });
+
+      // Should reject - cannot start a pending step on a terminal run
+      await expect(
+        updateStep(events, run.runId, 'pending_step', 'step_started')
+      ).rejects.toThrow(/terminal/i);
+    });
+
+    it('should reject hook_created on completed run', async () => {
+      const run = await createRun(events, {
+        deploymentId: 'deployment-123',
+        workflowName: 'test-workflow',
+        input: [],
+      });
+      await updateRun(events, run.runId, 'run_completed', { output: 'done' });
+
+      await expect(
+        createHook(events, run.runId, {
+          hookId: 'new_hook',
+          token: 'new-token',
+        })
+      ).rejects.toThrow(/terminal/i);
+    });
+
+    it('should reject step_created on failed run', async () => {
+      const run = await createRun(events, {
+        deploymentId: 'deployment-123',
+        workflowName: 'test-workflow',
+        input: [],
+      });
+      await updateRun(events, run.runId, 'run_failed', { error: 'Failed' });
+
+      await expect(
+        createStep(events, run.runId, {
+          stepId: 'new_step_failed',
+          stepName: 'test-step',
+          input: [],
+        })
+      ).rejects.toThrow(/terminal/i);
+    });
+
+    it('should reject step_created on cancelled run', async () => {
+      const run = await createRun(events, {
+        deploymentId: 'deployment-123',
+        workflowName: 'test-workflow',
+        input: [],
+      });
+      await events.create(run.runId, { eventType: 'run_cancelled' });
+
+      await expect(
+        createStep(events, run.runId, {
+          stepId: 'new_step_cancelled',
+          stepName: 'test-step',
+          input: [],
+        })
+      ).rejects.toThrow(/terminal/i);
+    });
+
+    it('should reject hook_created on failed run', async () => {
+      const run = await createRun(events, {
+        deploymentId: 'deployment-123',
+        workflowName: 'test-workflow',
+        input: [],
+      });
+      await updateRun(events, run.runId, 'run_failed', { error: 'Failed' });
+
+      await expect(
+        createHook(events, run.runId, {
+          hookId: 'new_hook_failed',
+          token: 'new-token-failed',
+        })
+      ).rejects.toThrow(/terminal/i);
+    });
+
+    it('should reject hook_created on cancelled run', async () => {
+      const run = await createRun(events, {
+        deploymentId: 'deployment-123',
+        workflowName: 'test-workflow',
+        input: [],
+      });
+      await events.create(run.runId, { eventType: 'run_cancelled' });
+
+      await expect(
+        createHook(events, run.runId, {
+          hookId: 'new_hook_cancelled',
+          token: 'new-token-cancelled',
+        })
+      ).rejects.toThrow(/terminal/i);
+    });
+  });
+
+  describe('idempotent operations', () => {
+    it('should allow run_cancelled on already cancelled run (idempotent)', async () => {
+      const run = await createRun(events, {
+        deploymentId: 'deployment-123',
+        workflowName: 'test-workflow',
+        input: [],
+      });
+      await events.create(run.runId, { eventType: 'run_cancelled' });
+
+      // Should succeed - idempotent operation
+      const result = await events.create(run.runId, {
+        eventType: 'run_cancelled',
+      });
+      expect(result.run?.status).toBe('cancelled');
+    });
+  });
+
+  describe('step_retrying event handling', () => {
+    let testRunId: string;
+
+    beforeEach(async () => {
+      const run = await createRun(events, {
+        deploymentId: 'deployment-123',
+        workflowName: 'test-workflow',
+        input: [],
+      });
+      testRunId = run.runId;
+    });
+
+    it('should set step status to pending and record error', async () => {
+      await createStep(events, testRunId, {
+        stepId: 'step_retry_1',
+        stepName: 'test-step',
+        input: [],
+      });
+      await updateStep(events, testRunId, 'step_retry_1', 'step_started');
+
+      const result = await events.create(testRunId, {
+        eventType: 'step_retrying',
+        correlationId: 'step_retry_1',
+        eventData: {
+          error: 'Temporary failure',
+          retryAfter: new Date(Date.now() + 5000),
+        },
+      });
+
+      expect(result.step?.status).toBe('pending');
+      expect(result.step?.error?.message).toBe('Temporary failure');
+      expect(result.step?.retryAfter).toBeInstanceOf(Date);
+    });
+
+    it('should increment attempt when step_started is called after step_retrying', async () => {
+      await createStep(events, testRunId, {
+        stepId: 'step_retry_2',
+        stepName: 'test-step',
+        input: [],
+      });
+
+      // First attempt
+      const started1 = await updateStep(
+        events,
+        testRunId,
+        'step_retry_2',
+        'step_started'
+      );
+      expect(started1.attempt).toBe(1);
+
+      // Retry
+      await events.create(testRunId, {
+        eventType: 'step_retrying',
+        correlationId: 'step_retry_2',
+        eventData: { error: 'Temporary failure' },
+      });
+
+      // Second attempt
+      const started2 = await updateStep(
+        events,
+        testRunId,
+        'step_retry_2',
+        'step_started'
+      );
+      expect(started2.attempt).toBe(2);
+    });
+
+    it('should reject step_retrying on completed step', async () => {
+      await createStep(events, testRunId, {
+        stepId: 'step_retry_completed',
+        stepName: 'test-step',
+        input: [],
+      });
+      await updateStep(
+        events,
+        testRunId,
+        'step_retry_completed',
+        'step_completed',
+        {
+          result: 'done',
+        }
+      );
+
+      await expect(
+        events.create(testRunId, {
+          eventType: 'step_retrying',
+          correlationId: 'step_retry_completed',
+          eventData: { error: 'Should not work' },
+        })
+      ).rejects.toThrow(/terminal/i);
+    });
+
+    it('should reject step_retrying on failed step', async () => {
+      await createStep(events, testRunId, {
+        stepId: 'step_retry_failed',
+        stepName: 'test-step',
+        input: [],
+      });
+      await updateStep(events, testRunId, 'step_retry_failed', 'step_failed', {
+        error: 'Permanent failure',
+      });
+
+      await expect(
+        events.create(testRunId, {
+          eventType: 'step_retrying',
+          correlationId: 'step_retry_failed',
+          eventData: { error: 'Should not work' },
+        })
+      ).rejects.toThrow(/terminal/i);
+    });
+  });
+
+  describe('run cancellation with in-flight entities', () => {
+    it('should allow in-progress step to complete after run cancelled', async () => {
+      const run = await createRun(events, {
+        deploymentId: 'deployment-123',
+        workflowName: 'test-workflow',
+        input: [],
+      });
+
+      // Create and start a step
+      await createStep(events, run.runId, {
+        stepId: 'step_in_flight',
+        stepName: 'test-step',
+        input: [],
+      });
+      await updateStep(events, run.runId, 'step_in_flight', 'step_started');
+
+      // Cancel the run
+      await events.create(run.runId, { eventType: 'run_cancelled' });
+
+      // Should succeed - completing an in-progress step is allowed
+      const result = await updateStep(
+        events,
+        run.runId,
+        'step_in_flight',
+        'step_completed',
+        { result: 'done' }
+      );
+      expect(result.status).toBe('completed');
+    });
+
+    it('should reject step_created after run cancelled', async () => {
+      const run = await createRun(events, {
+        deploymentId: 'deployment-123',
+        workflowName: 'test-workflow',
+        input: [],
+      });
+      await events.create(run.runId, { eventType: 'run_cancelled' });
+
+      await expect(
+        createStep(events, run.runId, {
+          stepId: 'new_step_after_cancel',
+          stepName: 'test-step',
+          input: [],
+        })
+      ).rejects.toThrow(/terminal/i);
+    });
+
+    it('should reject step_started for pending step after run cancelled', async () => {
+      const run = await createRun(events, {
+        deploymentId: 'deployment-123',
+        workflowName: 'test-workflow',
+        input: [],
+      });
+
+      // Create a step but don't start it
+      await createStep(events, run.runId, {
+        stepId: 'pending_after_cancel',
+        stepName: 'test-step',
+        input: [],
+      });
+
+      // Cancel the run
+      await events.create(run.runId, { eventType: 'run_cancelled' });
+
+      // Should reject - cannot start a pending step on a cancelled run
+      await expect(
+        updateStep(events, run.runId, 'pending_after_cancel', 'step_started')
+      ).rejects.toThrow(/terminal/i);
+    });
+  });
+
+  describe('event ordering validation', () => {
+    let testRunId: string;
+
+    beforeEach(async () => {
+      const run = await createRun(events, {
+        deploymentId: 'deployment-123',
+        workflowName: 'test-workflow',
+        input: [],
+      });
+      testRunId = run.runId;
+    });
+
+    it('should reject step_completed before step_created', async () => {
+      await expect(
+        events.create(testRunId, {
+          eventType: 'step_completed',
+          correlationId: 'nonexistent_step',
+          eventData: { result: 'done' },
+        })
+      ).rejects.toThrow(/not found/i);
+    });
+
+    it('should reject step_started before step_created', async () => {
+      await expect(
+        events.create(testRunId, {
+          eventType: 'step_started',
+          correlationId: 'nonexistent_step_started',
+        })
+      ).rejects.toThrow(/not found/i);
+    });
+
+    it('should reject step_failed before step_created', async () => {
+      await expect(
+        events.create(testRunId, {
+          eventType: 'step_failed',
+          correlationId: 'nonexistent_step_failed',
+          eventData: { error: 'Failed' },
+        })
+      ).rejects.toThrow(/not found/i);
+    });
+
+    it('should allow step_completed without step_started (instant completion)', async () => {
+      await createStep(events, testRunId, {
+        stepId: 'instant_complete',
+        stepName: 'test-step',
+        input: [],
+      });
+
+      // Should succeed - instant completion without starting
+      const result = await updateStep(
+        events,
+        testRunId,
+        'instant_complete',
+        'step_completed',
+        { result: 'instant' }
+      );
+      expect(result.status).toBe('completed');
+    });
+
+    it('should reject hook_disposed before hook_created', async () => {
+      await expect(
+        events.create(testRunId, {
+          eventType: 'hook_disposed',
+          correlationId: 'nonexistent_hook',
+        })
+      ).rejects.toThrow(/not found/i);
+    });
+
+    it('should reject hook_received before hook_created', async () => {
+      await expect(
+        events.create(testRunId, {
+          eventType: 'hook_received',
+          correlationId: 'nonexistent_hook_received',
+          eventData: { payload: {} },
+        })
+      ).rejects.toThrow(/not found/i);
+    });
+  });
 });

From 7419729cc98f8b1da0e18d9f51ac66bfa58f2b60 Mon Sep 17 00:00:00 2001
From: Pranay Prakash <pranay.gp@gmail.com>
Date: Tue, 23 Dec 2025 19:41:24 -0800
Subject: [PATCH 17/27] Add terminal state validation to world-postgres and
 rename firstStartedAt back to startedAt
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

- Add terminal state validation logic to world-postgres storage matching world-local
- Fix world-postgres tests to create steps before step events
- Fix hook_disposed test to document auto-delete behavior on run completion
- Rename firstStartedAt back to startedAt throughout the codebase (matches main branch)
- Update world-vercel wire schemas (no longer need startedAt -> firstStartedAt mapping)

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
---
 packages/cli/src/lib/inspect/output.ts        |   2 +-
 packages/core/src/runtime/step-handler.ts     |   6 +-
 .../src/sidebar/attribute-panel.tsx           |   2 -
 .../trace-span-construction.ts                |   4 +-
 .../lib/flow-graph/graph-execution-mapper.ts  |   8 +-
 packages/world-local/src/storage.test.ts      |   4 +-
 packages/world-local/src/storage.ts           |   8 +-
 packages/world-postgres/src/drizzle/schema.ts |   6 +-
 packages/world-postgres/src/storage.ts        | 163 ++++++++++++++-
 packages/world-postgres/test/storage.test.ts  | 185 ++++++++++++++----
 packages/world-vercel/src/events.ts           |   8 +-
 packages/world-vercel/src/steps.ts            |  15 +-
 packages/world/src/steps.ts                   |   2 +-
 13 files changed, 328 insertions(+), 85 deletions(-)

diff --git a/packages/cli/src/lib/inspect/output.ts b/packages/cli/src/lib/inspect/output.ts
index b0cf8137a..67cf974b0 100644
--- a/packages/cli/src/lib/inspect/output.ts
+++ b/packages/cli/src/lib/inspect/output.ts
@@ -50,7 +50,7 @@ const STEP_LISTED_PROPS: (keyof Step)[] = [
   'stepId',
   'stepName',
   'status',
-  'firstStartedAt',
+  'startedAt',
   'completedAt',
   ...STEP_IO_PROPS,
 ];
diff --git a/packages/core/src/runtime/step-handler.ts b/packages/core/src/runtime/step-handler.ts
index 42a1f4434..771c7f25a 100644
--- a/packages/core/src/runtime/step-handler.ts
+++ b/packages/core/src/runtime/step-handler.ts
@@ -203,9 +203,9 @@ const stepHandler = getWorldHandlers().createQueueHandler(
             // step.attempt is now the current attempt number (after increment)
             const attempt = step.attempt;
 
-            if (!step.firstStartedAt) {
+            if (!step.startedAt) {
               throw new WorkflowRuntimeError(
-                `Step "${stepId}" has no "firstStartedAt" timestamp`
+                `Step "${stepId}" has no "startedAt" timestamp`
               );
             }
             // Hydrate the step input arguments and closure variables
@@ -226,7 +226,7 @@ const stepHandler = getWorldHandlers().createQueueHandler(
               {
                 stepMetadata: {
                   stepId,
-                  stepStartedAt: new Date(+step.firstStartedAt),
+                  stepStartedAt: new Date(+step.startedAt),
                   attempt,
                 },
                 workflowMetadata: {
diff --git a/packages/web-shared/src/sidebar/attribute-panel.tsx b/packages/web-shared/src/sidebar/attribute-panel.tsx
index 0a521e7b1..b6adc75bd 100644
--- a/packages/web-shared/src/sidebar/attribute-panel.tsx
+++ b/packages/web-shared/src/sidebar/attribute-panel.tsx
@@ -304,7 +304,6 @@ const attributeOrder: AttributeKey[] = [
   'executionContext',
   'createdAt',
   'startedAt',
-  'firstStartedAt',
   'updatedAt',
   'completedAt',
   'expiredAt',
@@ -383,7 +382,6 @@ const attributeToDisplayFn: Record<
   // TODO: relative time with tooltips for ISO times
   createdAt: localMillisecondTime,
   startedAt: localMillisecondTime,
-  firstStartedAt: localMillisecondTime,
   updatedAt: localMillisecondTime,
   completedAt: localMillisecondTime,
   expiredAt: localMillisecondTime,
diff --git a/packages/web-shared/src/workflow-traces/trace-span-construction.ts b/packages/web-shared/src/workflow-traces/trace-span-construction.ts
index 74bd4719d..53e4e92d1 100644
--- a/packages/web-shared/src/workflow-traces/trace-span-construction.ts
+++ b/packages/web-shared/src/workflow-traces/trace-span-construction.ts
@@ -145,9 +145,7 @@ export function stepToSpan(
   // Use createdAt as span start time, with activeStartTime for when execution began
   // This allows visualization of the "queued" period before execution
   const spanStartTime = new Date(step.createdAt);
-  let activeStartTime = step.firstStartedAt
-    ? new Date(step.firstStartedAt)
-    : undefined;
+  let activeStartTime = step.startedAt ? new Date(step.startedAt) : undefined;
   const firstStartEvent = stepEvents.find(
     (event) => event.eventType === 'step_started'
   );
diff --git a/packages/web/src/lib/flow-graph/graph-execution-mapper.ts b/packages/web/src/lib/flow-graph/graph-execution-mapper.ts
index 2655b9738..9c05f5f15 100644
--- a/packages/web/src/lib/flow-graph/graph-execution-mapper.ts
+++ b/packages/web/src/lib/flow-graph/graph-execution-mapper.ts
@@ -54,9 +54,9 @@ function createStepExecution(
   }
 
   const duration =
-    attemptStep.completedAt && attemptStep.firstStartedAt
+    attemptStep.completedAt && attemptStep.startedAt
       ? new Date(attemptStep.completedAt).getTime() -
-        new Date(attemptStep.firstStartedAt).getTime()
+        new Date(attemptStep.startedAt).getTime()
       : undefined;
 
   return {
@@ -64,8 +64,8 @@ function createStepExecution(
     stepId: attemptStep.stepId,
     attemptNumber: attemptStep.attempt,
     status,
-    startedAt: attemptStep.firstStartedAt
-      ? new Date(attemptStep.firstStartedAt).toISOString()
+    startedAt: attemptStep.startedAt
+      ? new Date(attemptStep.startedAt).toISOString()
       : undefined,
     completedAt: attemptStep.completedAt
       ? new Date(attemptStep.completedAt).toISOString()
diff --git a/packages/world-local/src/storage.test.ts b/packages/world-local/src/storage.test.ts
index 1bdcd3f56..eff9dce40 100644
--- a/packages/world-local/src/storage.test.ts
+++ b/packages/world-local/src/storage.test.ts
@@ -365,7 +365,7 @@ describe('Storage', () => {
         expect(step.output).toBeUndefined();
         expect(step.error).toBeUndefined();
         expect(step.attempt).toBe(0);
-        expect(step.firstStartedAt).toBeUndefined();
+        expect(step.startedAt).toBeUndefined();
         expect(step.completedAt).toBeUndefined();
         expect(step.createdAt).toBeInstanceOf(Date);
         expect(step.updatedAt).toBeInstanceOf(Date);
@@ -433,7 +433,7 @@ describe('Storage', () => {
         );
 
         expect(updated.status).toBe('running');
-        expect(updated.firstStartedAt).toBeInstanceOf(Date);
+        expect(updated.startedAt).toBeInstanceOf(Date);
         expect(updated.attempt).toBe(1); // Incremented by step_started
       });
 
diff --git a/packages/world-local/src/storage.ts b/packages/world-local/src/storage.ts
index 8cf201deb..1df7f1e0e 100644
--- a/packages/world-local/src/storage.ts
+++ b/packages/world-local/src/storage.ts
@@ -615,7 +615,7 @@ export function createStorage(basedir: string): Storage {
             output: undefined,
             error: undefined,
             attempt: 0,
-            firstStartedAt: undefined,
+            startedAt: undefined,
             completedAt: undefined,
             createdAt: now,
             updatedAt: now,
@@ -629,7 +629,7 @@ export function createStorage(basedir: string): Storage {
           await writeJSON(stepPath, step);
         } else if (data.eventType === 'step_started') {
           // step_started: Increments attempt, sets status to 'running'
-          // Sets firstStartedAt only on the first start (not updated on retries)
+          // Sets startedAt only on the first start (not updated on retries)
           const stepCompositeKey = `${effectiveRunId}-${data.correlationId}`;
           const stepPath = path.join(
             basedir,
@@ -641,8 +641,8 @@ export function createStorage(basedir: string): Storage {
             step = {
               ...existingStep,
               status: 'running',
-              // Only set firstStartedAt on the first start
-              firstStartedAt: existingStep.firstStartedAt ?? now,
+              // Only set startedAt on the first start
+              startedAt: existingStep.startedAt ?? now,
               // Increment attempt counter on every start
               attempt: existingStep.attempt + 1,
               updatedAt: now,
diff --git a/packages/world-postgres/src/drizzle/schema.ts b/packages/world-postgres/src/drizzle/schema.ts
index d5e43224d..0da98e369 100644
--- a/packages/world-postgres/src/drizzle/schema.ts
+++ b/packages/world-postgres/src/drizzle/schema.ts
@@ -108,7 +108,7 @@ export const events = schema.table(
 /**
  * Database schema for steps. Note: DB column names differ from Step interface:
  * - error (DB) → error (Step interface, parsed from JSON string)
- * - startedAt (DB) → firstStartedAt (Step interface)
+ * - startedAt (DB) → startedAt (Step interface)
  * The mapping is done in storage.ts deserializeStepError()
  */
 export const steps = schema.table(
@@ -127,7 +127,7 @@ export const steps = schema.table(
     /** JSON-stringified StructuredError - parsed and set as error in Step interface */
     error: text('error'),
     attempt: integer('attempt').notNull(),
-    /** Maps to firstStartedAt in Step interface */
+    /** Maps to startedAt in Step interface */
     startedAt: timestamp('started_at'),
     completedAt: timestamp('completed_at'),
     createdAt: timestamp('created_at').defaultNow().notNull(),
@@ -138,7 +138,7 @@ export const steps = schema.table(
     retryAfter: timestamp('retry_after'),
   } satisfies DrizzlishOfType<
     Cborized<
-      Omit<Step, 'input' | 'error' | 'firstStartedAt'> & {
+      Omit<Step, 'input' | 'error' | 'startedAt'> & {
         input?: unknown;
         error?: string;
         startedAt?: Date;
diff --git a/packages/world-postgres/src/storage.ts b/packages/world-postgres/src/storage.ts
index a0a32443a..d6e526f1a 100644
--- a/packages/world-postgres/src/storage.ts
+++ b/packages/world-postgres/src/storage.ts
@@ -70,15 +70,15 @@ function deserializeRunError(run: any): WorkflowRun {
 /**
  * Deserialize step data, mapping DB columns to interface fields:
  * - `error` (DB column) → `error` (Step interface, parsed from JSON)
- * - `startedAt` (DB column) → `firstStartedAt` (Step interface)
+ * - `startedAt` (DB column) → `startedAt` (Step interface)
  */
 function deserializeStepError(step: any): Step {
   const { error, startedAt, ...rest } = step;
 
   const result: any = {
     ...rest,
-    // Map startedAt to firstStartedAt
-    firstStartedAt: startedAt,
+    // Map startedAt to startedAt
+    startedAt: startedAt,
   };
 
   if (!error) {
@@ -191,6 +191,161 @@ export function createEventsStorage(drizzle: Drizzle): Storage['events'] {
       let hook: Hook | undefined;
       const now = new Date();
 
+      // Helper to check if run is in terminal state
+      const isRunTerminal = (status: string) =>
+        ['completed', 'failed', 'cancelled'].includes(status);
+
+      // Helper to check if step is in terminal state
+      const isStepTerminal = (status: string) =>
+        ['completed', 'failed'].includes(status);
+
+      // ============================================================
+      // VALIDATION: Terminal state and event ordering checks
+      // ============================================================
+
+      // Get current run state for validation (if not creating a new run)
+      let currentRun: { status: string } | null = null;
+      if (data.eventType !== 'run_created') {
+        const [runValue] = await drizzle
+          .select({ status: Schema.runs.status })
+          .from(Schema.runs)
+          .where(eq(Schema.runs.runId, effectiveRunId))
+          .limit(1);
+        currentRun = runValue ?? null;
+      }
+
+      // Run terminal state validation
+      if (currentRun && isRunTerminal(currentRun.status)) {
+        const runTerminalEvents = [
+          'run_started',
+          'run_completed',
+          'run_failed',
+        ];
+
+        // Idempotent operation: run_cancelled on already cancelled run is allowed
+        if (
+          data.eventType === 'run_cancelled' &&
+          currentRun.status === 'cancelled'
+        ) {
+          // Get full run for return value
+          const [fullRun] = await drizzle
+            .select()
+            .from(Schema.runs)
+            .where(eq(Schema.runs.runId, effectiveRunId))
+            .limit(1);
+
+          // Create the event (still record it)
+          const [value] = await drizzle
+            .insert(Schema.events)
+            .values({
+              runId: effectiveRunId,
+              eventId,
+              correlationId: data.correlationId,
+              eventType: data.eventType,
+              eventData: 'eventData' in data ? data.eventData : undefined,
+            })
+            .returning({ createdAt: Schema.events.createdAt });
+
+          const result = { ...data, ...value, runId: effectiveRunId, eventId };
+          const parsed = EventSchema.parse(result);
+          const resolveData = params?.resolveData ?? 'all';
+          return {
+            event: filterEventData(parsed, resolveData),
+            run: fullRun ? deserializeRunError(compact(fullRun)) : undefined,
+          };
+        }
+
+        // Run state transitions are not allowed on terminal runs
+        if (
+          runTerminalEvents.includes(data.eventType) ||
+          data.eventType === 'run_cancelled'
+        ) {
+          throw new WorkflowAPIError(
+            `Cannot transition run from terminal state "${currentRun.status}"`,
+            { status: 409 }
+          );
+        }
+
+        // Creating new entities on terminal runs is not allowed
+        if (
+          data.eventType === 'step_created' ||
+          data.eventType === 'hook_created'
+        ) {
+          throw new WorkflowAPIError(
+            `Cannot create new entities on run in terminal state "${currentRun.status}"`,
+            { status: 409 }
+          );
+        }
+      }
+
+      // Step-related event validation (ordering and terminal state)
+      const stepEvents = [
+        'step_started',
+        'step_completed',
+        'step_failed',
+        'step_retrying',
+      ];
+      if (stepEvents.includes(data.eventType) && data.correlationId) {
+        const [existingStep] = await drizzle
+          .select({ status: Schema.steps.status })
+          .from(Schema.steps)
+          .where(
+            and(
+              eq(Schema.steps.runId, effectiveRunId),
+              eq(Schema.steps.stepId, data.correlationId)
+            )
+          )
+          .limit(1);
+
+        // Event ordering: step must exist before these events
+        if (!existingStep) {
+          throw new WorkflowAPIError(`Step "${data.correlationId}" not found`, {
+            status: 404,
+          });
+        }
+
+        // Step terminal state validation
+        if (isStepTerminal(existingStep.status)) {
+          throw new WorkflowAPIError(
+            `Cannot modify step in terminal state "${existingStep.status}"`,
+            { status: 409 }
+          );
+        }
+
+        // On terminal runs: only allow completing/failing in-progress steps
+        if (currentRun && isRunTerminal(currentRun.status)) {
+          if (existingStep.status !== 'running') {
+            throw new WorkflowAPIError(
+              `Cannot modify non-running step on run in terminal state "${currentRun.status}"`,
+              { status: 409 }
+            );
+          }
+        }
+      }
+
+      // Hook-related event validation (ordering)
+      const hookEventsRequiringExistence = ['hook_disposed', 'hook_received'];
+      if (
+        hookEventsRequiringExistence.includes(data.eventType) &&
+        data.correlationId
+      ) {
+        const [existingHook] = await drizzle
+          .select({ hookId: Schema.hooks.hookId })
+          .from(Schema.hooks)
+          .where(eq(Schema.hooks.hookId, data.correlationId))
+          .limit(1);
+
+        if (!existingHook) {
+          throw new WorkflowAPIError(`Hook "${data.correlationId}" not found`, {
+            status: 404,
+          });
+        }
+      }
+
+      // ============================================================
+      // Entity creation/updates based on event type
+      // ============================================================
+
       // Handle run_created event: create the run entity atomically
       if (data.eventType === 'run_created') {
         const eventData = (data as any).eventData as {
@@ -335,7 +490,7 @@ export function createEventsStorage(drizzle: Drizzle): Storage['events'] {
       }
 
       // Handle step_started event: increment attempt, set status to 'running'
-      // Sets startedAt (maps to firstStartedAt) only on first start
+      // Sets startedAt (maps to startedAt) only on first start
       if (data.eventType === 'step_started') {
         // First, get the current step to check attempt
         const [existingStep] = await drizzle
diff --git a/packages/world-postgres/test/storage.test.ts b/packages/world-postgres/test/storage.test.ts
index f35929181..3816212b8 100644
--- a/packages/world-postgres/test/storage.test.ts
+++ b/packages/world-postgres/test/storage.test.ts
@@ -378,7 +378,7 @@ describe('Storage (Postgres integration)', () => {
           output: undefined,
           error: undefined,
           attempt: 0, // steps are created with attempt 0
-          firstStartedAt: undefined,
+          startedAt: undefined,
           completedAt: undefined,
           createdAt: expect.any(Date),
           updatedAt: expect.any(Date),
@@ -435,7 +435,7 @@ describe('Storage (Postgres integration)', () => {
         );
 
         expect(updated.status).toBe('running');
-        expect(updated.firstStartedAt).toBeInstanceOf(Date);
+        expect(updated.startedAt).toBeInstanceOf(Date);
         expect(updated.attempt).toBe(1); // Incremented by step_started
       });
 
@@ -549,6 +549,13 @@ describe('Storage (Postgres integration)', () => {
 
     describe('create', () => {
       it('should create a new event', async () => {
+        // Create step before step_started event
+        await createStep(events, testRunId, {
+          stepId: 'corr_123',
+          stepName: 'test-step',
+          input: [],
+        });
+
         const eventData = {
           eventType: 'step_started' as const,
           correlationId: 'corr_123',
@@ -564,16 +571,27 @@ describe('Storage (Postgres integration)', () => {
       });
 
       it('should create a new event with null byte in payload', async () => {
+        // Create step before step_failed event
+        await createStep(events, testRunId, {
+          stepId: 'corr_123_null',
+          stepName: 'test-step-null',
+          input: [],
+        });
+        await events.create(testRunId, {
+          eventType: 'step_started',
+          correlationId: 'corr_123_null',
+        });
+
         const result = await events.create(testRunId, {
           eventType: 'step_failed',
-          correlationId: 'corr_123',
+          correlationId: 'corr_123_null',
           eventData: { error: 'Error with null byte \u0000 in message' },
         });
 
         expect(result.event.runId).toBe(testRunId);
         expect(result.event.eventId).toMatch(/^wevt_/);
         expect(result.event.eventType).toBe('step_failed');
-        expect(result.event.correlationId).toBe('corr_123');
+        expect(result.event.correlationId).toBe('corr_123_null');
         expect(result.event.createdAt).toBeInstanceOf(Date);
       });
 
@@ -598,6 +616,13 @@ describe('Storage (Postgres integration)', () => {
         // Small delay to ensure different timestamps in event IDs
         await new Promise((resolve) => setTimeout(resolve, 2));
 
+        // Create step before step_started event
+        await createStep(events, testRunId, {
+          stepId: 'corr-step-1',
+          stepName: 'test-step',
+          input: [],
+        });
+
         const result2 = await events.create(testRunId, {
           eventType: 'step_started' as const,
           correlationId: 'corr-step-1',
@@ -608,13 +633,13 @@ describe('Storage (Postgres integration)', () => {
           pagination: { sortOrder: 'asc' }, // Explicitly request ascending order
         });
 
-        // 3 events: run_created (from createRun), workflow_started, step_started
-        expect(result.data).toHaveLength(3);
+        // 4 events: run_created (from createRun), workflow_started, step_created, step_started
+        expect(result.data).toHaveLength(4);
         // Should be in chronological order (oldest first)
         expect(result.data[0].eventType).toBe('run_created');
         expect(result.data[1].eventId).toBe(result1.event.eventId);
-        expect(result.data[2].eventId).toBe(result2.event.eventId);
-        expect(result.data[2].createdAt.getTime()).toBeGreaterThanOrEqual(
+        expect(result.data[3].eventId).toBe(result2.event.eventId);
+        expect(result.data[3].createdAt.getTime()).toBeGreaterThanOrEqual(
           result.data[1].createdAt.getTime()
         );
       });
@@ -627,6 +652,13 @@ describe('Storage (Postgres integration)', () => {
         // Small delay to ensure different timestamps in event IDs
         await new Promise((resolve) => setTimeout(resolve, 2));
 
+        // Create step before step_started event
+        await createStep(events, testRunId, {
+          stepId: 'corr-step-1',
+          stepName: 'test-step',
+          input: [],
+        });
+
         const result2 = await events.create(testRunId, {
           eventType: 'step_started' as const,
           correlationId: 'corr-step-1',
@@ -637,20 +669,31 @@ describe('Storage (Postgres integration)', () => {
           pagination: { sortOrder: 'desc' },
         });
 
-        // 3 events: run_created (from createRun), workflow_started, step_started
-        expect(result.data).toHaveLength(3);
+        // 4 events: run_created (from createRun), workflow_started, step_created, step_started
+        expect(result.data).toHaveLength(4);
         // Should be in reverse chronological order (newest first)
         expect(result.data[0].eventId).toBe(result2.event.eventId);
-        expect(result.data[1].eventId).toBe(result1.event.eventId);
-        expect(result.data[2].eventType).toBe('run_created');
+        expect(result.data[1].eventType).toBe('step_created');
+        expect(result.data[2].eventId).toBe(result1.event.eventId);
+        expect(result.data[3].eventType).toBe('run_created');
         expect(result.data[0].createdAt.getTime()).toBeGreaterThanOrEqual(
-          result.data[1].createdAt.getTime()
+          result.data[2].createdAt.getTime()
         );
       });
 
       it('should support pagination', async () => {
-        // Create multiple events
+        // Create multiple events - must create steps first
         for (let i = 0; i < 5; i++) {
+          await createStep(events, testRunId, {
+            stepId: `corr_${i}`,
+            stepName: `test-step-${i}`,
+            input: [],
+          });
+          // Start the step before completing
+          await events.create(testRunId, {
+            eventType: 'step_started',
+            correlationId: `corr_${i}`,
+          });
           await events.create(testRunId, {
             eventType: 'step_completed',
             correlationId: `corr_${i}`,
@@ -680,6 +723,13 @@ describe('Storage (Postgres integration)', () => {
       it('should list all events with a specific correlation ID', async () => {
         const correlationId = 'step-abc123';
 
+        // Create step before step events
+        await createStep(events, testRunId, {
+          stepId: correlationId,
+          stepName: 'test-step',
+          input: [],
+        });
+
         // Create events with the target correlation ID
         const result1 = await events.create(testRunId, {
           eventType: 'step_started',
@@ -695,6 +745,11 @@ describe('Storage (Postgres integration)', () => {
         });
 
         // Create events with different correlation IDs (should be filtered out)
+        await createStep(events, testRunId, {
+          stepId: 'different-step',
+          stepName: 'different-step',
+          input: [],
+        });
         await events.create(testRunId, {
           eventType: 'step_started',
           correlationId: 'different-step',
@@ -708,11 +763,13 @@ describe('Storage (Postgres integration)', () => {
           pagination: {},
         });
 
-        expect(result.data).toHaveLength(2);
-        expect(result.data[0].eventId).toBe(result1.event.eventId);
-        expect(result.data[0].correlationId).toBe(correlationId);
-        expect(result.data[1].eventId).toBe(result2.event.eventId);
+        // 3 events: step_created, step_started, step_completed
+        expect(result.data).toHaveLength(3);
+        expect(result.data[0].eventType).toBe('step_created');
+        expect(result.data[1].eventId).toBe(result1.event.eventId);
         expect(result.data[1].correlationId).toBe(correlationId);
+        expect(result.data[2].eventId).toBe(result2.event.eventId);
+        expect(result.data[2].correlationId).toBe(correlationId);
       });
 
       it('should list events across multiple runs with same correlation ID', async () => {
@@ -762,6 +819,12 @@ describe('Storage (Postgres integration)', () => {
       });
 
       it('should return empty list for non-existent correlation ID', async () => {
+        // Create a step and start it
+        await createStep(events, testRunId, {
+          stepId: 'existing-step',
+          stepName: 'existing-step',
+          input: [],
+        });
         await events.create(testRunId, {
           eventType: 'step_started',
           correlationId: 'existing-step',
@@ -780,6 +843,13 @@ describe('Storage (Postgres integration)', () => {
       it('should respect pagination parameters', async () => {
         const correlationId = 'step_paginated';
 
+        // Create step first
+        await createStep(events, testRunId, {
+          stepId: correlationId,
+          stepName: 'test-step',
+          input: [],
+        });
+
         // Create multiple events
         await events.create(testRunId, {
           eventType: 'step_started',
@@ -791,7 +861,15 @@ describe('Storage (Postgres integration)', () => {
         await events.create(testRunId, {
           eventType: 'step_retrying',
           correlationId,
-          eventData: { attempt: 1 },
+          eventData: { error: 'retry error' },
+        });
+
+        await new Promise((resolve) => setTimeout(resolve, 2));
+
+        // Start again after retry
+        await events.create(testRunId, {
+          eventType: 'step_started',
+          correlationId,
         });
 
         await new Promise((resolve) => setTimeout(resolve, 2));
@@ -802,27 +880,38 @@ describe('Storage (Postgres integration)', () => {
           eventData: { result: 'success' },
         });
 
-        // Get first page
+        // Get first page (step_created, step_started, step_retrying)
         const page1 = await events.listByCorrelationId({
           correlationId,
-          pagination: { limit: 2 },
+          pagination: { limit: 3 },
         });
 
-        expect(page1.data).toHaveLength(2);
+        expect(page1.data).toHaveLength(3);
         expect(page1.hasMore).toBe(true);
         expect(page1.cursor).toBeDefined();
 
-        // Get second page
+        // Get second page (step_started, step_completed)
         const page2 = await events.listByCorrelationId({
           correlationId,
-          pagination: { limit: 2, cursor: page1.cursor || undefined },
+          pagination: { limit: 3, cursor: page1.cursor || undefined },
         });
 
-        expect(page2.data).toHaveLength(1);
+        expect(page2.data).toHaveLength(2);
         expect(page2.hasMore).toBe(false);
       });
 
       it('should always return full event data', async () => {
+        // Create step first
+        await createStep(events, testRunId, {
+          stepId: 'step-with-data',
+          stepName: 'step-with-data',
+          input: [],
+        });
+        // Start the step before completing
+        await events.create(testRunId, {
+          eventType: 'step_started',
+          correlationId: 'step-with-data',
+        });
         await events.create(testRunId, {
           eventType: 'step_completed',
           correlationId: 'step-with-data',
@@ -835,13 +924,21 @@ describe('Storage (Postgres integration)', () => {
           pagination: {},
         });
 
-        expect(result.data).toHaveLength(1);
-        expect(result.data[0].correlationId).toBe('step-with-data');
+        // 3 events: step_created, step_started, step_completed
+        expect(result.data).toHaveLength(3);
+        expect(result.data[2].correlationId).toBe('step-with-data');
       });
 
       it('should return events in ascending order by default', async () => {
         const correlationId = 'step-ordering';
 
+        // Create step first
+        await createStep(events, testRunId, {
+          stepId: correlationId,
+          stepName: 'test-step',
+          input: [],
+        });
+
         // Create events with slight delays to ensure different timestamps
         const result1 = await events.create(testRunId, {
           eventType: 'step_started',
@@ -861,17 +958,25 @@ describe('Storage (Postgres integration)', () => {
           pagination: {},
         });
 
-        expect(result.data).toHaveLength(2);
-        expect(result.data[0].eventId).toBe(result1.event.eventId);
-        expect(result.data[1].eventId).toBe(result2.event.eventId);
-        expect(result.data[0].createdAt.getTime()).toBeLessThanOrEqual(
-          result.data[1].createdAt.getTime()
+        // 3 events: step_created, step_started, step_completed
+        expect(result.data).toHaveLength(3);
+        expect(result.data[1].eventId).toBe(result1.event.eventId);
+        expect(result.data[2].eventId).toBe(result2.event.eventId);
+        expect(result.data[1].createdAt.getTime()).toBeLessThanOrEqual(
+          result.data[2].createdAt.getTime()
         );
       });
 
       it('should support descending order', async () => {
         const correlationId = 'step-desc-order';
 
+        // Create step first
+        await createStep(events, testRunId, {
+          stepId: correlationId,
+          stepName: 'test-step',
+          input: [],
+        });
+
         const result1 = await events.create(testRunId, {
           eventType: 'step_started',
           correlationId,
@@ -890,7 +995,8 @@ describe('Storage (Postgres integration)', () => {
           pagination: { sortOrder: 'desc' },
         });
 
-        expect(result.data).toHaveLength(2);
+        // 3 events in descending order: step_completed, step_started, step_created
+        expect(result.data).toHaveLength(3);
         expect(result.data[0].eventId).toBe(result2.event.eventId);
         expect(result.data[1].eventId).toBe(result1.event.eventId);
         expect(result.data[0].createdAt.getTime()).toBeGreaterThanOrEqual(
@@ -1342,7 +1448,7 @@ describe('Storage (Postgres integration)', () => {
       expect(result.status).toBe('failed');
     });
 
-    it('should allow hook_disposed on completed run', async () => {
+    it('should auto-delete hooks when run completes (postgres-specific behavior)', async () => {
       const run = await createRun(events, {
         deploymentId: 'deployment-123',
         workflowName: 'test-workflow',
@@ -1351,20 +1457,21 @@ describe('Storage (Postgres integration)', () => {
 
       // Create a hook
       await createHook(events, run.runId, {
-        hookId: 'hook_to_dispose',
+        hookId: 'hook_auto_deleted',
         token: 'test-token-dispose',
       });
 
-      // Complete the run
+      // Complete the run - this auto-deletes the hook
       await updateRun(events, run.runId, 'run_completed', { output: 'done' });
 
-      // Should succeed - disposing a hook on a terminal run is allowed
+      // The hook should no longer exist because run completion auto-deletes hooks
+      // This is intentional behavior to allow token reuse across runs
       await expect(
         events.create(run.runId, {
           eventType: 'hook_disposed',
-          correlationId: 'hook_to_dispose',
+          correlationId: 'hook_auto_deleted',
         })
-      ).resolves.not.toThrow();
+      ).rejects.toThrow(/not found/i);
     });
   });
 
diff --git a/packages/world-vercel/src/events.ts b/packages/world-vercel/src/events.ts
index 7d618b5f6..341b4e175 100644
--- a/packages/world-vercel/src/events.ts
+++ b/packages/world-vercel/src/events.ts
@@ -24,11 +24,10 @@ import {
 
 /**
  * Wire format schema for step in event results.
- * Maps server field names to Step interface field names.
+ * Handles error deserialization from wire format.
  */
 const StepWireSchema = StepSchema.omit({
   error: true,
-  firstStartedAt: true,
 }).extend({
   // Backend returns error either as:
   // - A JSON string (legacy/lazy mode)
@@ -44,19 +43,16 @@ const StepWireSchema = StepSchema.omit({
     ])
     .optional(),
   errorRef: z.any().optional(),
-  // Backend returns startedAt, which maps to firstStartedAt
-  startedAt: z.coerce.date().optional(),
 });
 
 /**
  * Deserialize step from wire format to Step interface format.
  */
 function deserializeStep(wireStep: z.infer<typeof StepWireSchema>): Step {
-  const { error, errorRef, startedAt, ...rest } = wireStep;
+  const { error, errorRef, ...rest } = wireStep;
 
   const result: any = {
     ...rest,
-    firstStartedAt: startedAt,
   };
 
   // Deserialize error to StructuredError
diff --git a/packages/world-vercel/src/steps.ts b/packages/world-vercel/src/steps.ts
index 10fa87d3d..de13e10f0 100644
--- a/packages/world-vercel/src/steps.ts
+++ b/packages/world-vercel/src/steps.ts
@@ -18,16 +18,10 @@ import {
 
 /**
  * Wire format schema for steps coming from the backend.
- * The backend returns:
- * - error/errorRef as a JSON string (maps to error in Step interface)
- * - startedAt (maps to firstStartedAt in Step interface)
- *
- * This is used for validation in makeRequest(), then deserializeStep()
- * transforms the wire format into the expected Step interface.
+ * Handles error deserialization from wire format.
  */
 const StepWireSchema = StepSchema.omit({
   error: true,
-  firstStartedAt: true,
 }).extend({
   // Backend returns error either as:
   // - A JSON string (legacy/lazy mode)
@@ -44,8 +38,6 @@ const StepWireSchema = StepSchema.omit({
     ])
     .optional(),
   errorRef: z.any().optional(),
-  // Backend returns startedAt, which maps to firstStartedAt
-  startedAt: z.coerce.date().optional(),
 });
 
 // Wire schema for lazy mode with refs instead of data
@@ -64,15 +56,12 @@ const StepWireWithRefsSchema = StepWireSchema.omit({
  * Transform step from wire format to Step interface format.
  * Maps:
  * - error/errorRef → error (deserializing JSON string to StructuredError)
- * - startedAt → firstStartedAt
  */
 function deserializeStep(wireStep: any): Step {
-  const { error, errorRef, startedAt, ...rest } = wireStep;
+  const { error, errorRef, ...rest } = wireStep;
 
-  // Map startedAt to firstStartedAt
   const result: any = {
     ...rest,
-    firstStartedAt: startedAt,
   };
 
   // Deserialize error to StructuredError
diff --git a/packages/world/src/steps.ts b/packages/world/src/steps.ts
index 56749fe4e..db1518c02 100644
--- a/packages/world/src/steps.ts
+++ b/packages/world/src/steps.ts
@@ -35,7 +35,7 @@ export const StepSchema = z.object({
    * When the step first started executing. Set by the first step_started event
    * and not updated on subsequent retries.
    */
-  firstStartedAt: z.coerce.date().optional(),
+  startedAt: z.coerce.date().optional(),
   completedAt: z.coerce.date().optional(),
   createdAt: z.coerce.date(),
   updatedAt: z.coerce.date(),

From 736cecdb92aa1e2eac84666de5417c3bc33b214c Mon Sep 17 00:00:00 2001
From: Pranay Prakash <pranay.gp@gmail.com>
Date: Tue, 23 Dec 2025 19:57:34 -0800
Subject: [PATCH 18/27] Add step_retrying on terminal step tests
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Tests that step_retrying is rejected on:
- completed steps
- failed steps

Matches workflow-server's event-materialization tests.

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
---
 packages/world-local/src/storage.test.ts     | 54 ++++++++++++++++++++
 packages/world-postgres/test/storage.test.ts | 54 ++++++++++++++++++++
 2 files changed, 108 insertions(+)

diff --git a/packages/world-local/src/storage.test.ts b/packages/world-local/src/storage.test.ts
index eff9dce40..da8067af0 100644
--- a/packages/world-local/src/storage.test.ts
+++ b/packages/world-local/src/storage.test.ts
@@ -1731,6 +1731,60 @@ describe('Storage', () => {
           })
         ).rejects.toThrow(/terminal/i);
       });
+
+      it('should reject step_retrying on failed step', async () => {
+        await createStep(storage, testRunId, {
+          stepId: 'step_failed_retry',
+          stepName: 'test-step',
+          input: [],
+        });
+        await updateStep(
+          storage,
+          testRunId,
+          'step_failed_retry',
+          'step_failed',
+          {
+            error: 'Failed permanently',
+          }
+        );
+
+        await expect(
+          updateStep(storage, testRunId, 'step_failed_retry', 'step_retrying', {
+            error: 'Retry attempt',
+          })
+        ).rejects.toThrow(/terminal/i);
+      });
+    });
+
+    describe('step_retrying validation', () => {
+      it('should reject step_retrying on completed step', async () => {
+        await createStep(storage, testRunId, {
+          stepId: 'step_completed_retry',
+          stepName: 'test-step',
+          input: [],
+        });
+        await updateStep(
+          storage,
+          testRunId,
+          'step_completed_retry',
+          'step_completed',
+          {
+            result: 'done',
+          }
+        );
+
+        await expect(
+          updateStep(
+            storage,
+            testRunId,
+            'step_completed_retry',
+            'step_retrying',
+            {
+              error: 'Retry attempt',
+            }
+          )
+        ).rejects.toThrow(/terminal/i);
+      });
     });
   });
 
diff --git a/packages/world-postgres/test/storage.test.ts b/packages/world-postgres/test/storage.test.ts
index 3816212b8..7812205e1 100644
--- a/packages/world-postgres/test/storage.test.ts
+++ b/packages/world-postgres/test/storage.test.ts
@@ -1248,6 +1248,60 @@ describe('Storage (Postgres integration)', () => {
           })
         ).rejects.toThrow(/terminal/i);
       });
+
+      it('should reject step_retrying on failed step', async () => {
+        await createStep(events, testRunId, {
+          stepId: 'step_failed_retry',
+          stepName: 'test-step',
+          input: [],
+        });
+        await updateStep(
+          events,
+          testRunId,
+          'step_failed_retry',
+          'step_failed',
+          {
+            error: 'Failed permanently',
+          }
+        );
+
+        await expect(
+          updateStep(events, testRunId, 'step_failed_retry', 'step_retrying', {
+            error: 'Retry attempt',
+          })
+        ).rejects.toThrow(/terminal/i);
+      });
+    });
+
+    describe('step_retrying validation', () => {
+      it('should reject step_retrying on completed step', async () => {
+        await createStep(events, testRunId, {
+          stepId: 'step_completed_retry',
+          stepName: 'test-step',
+          input: [],
+        });
+        await updateStep(
+          events,
+          testRunId,
+          'step_completed_retry',
+          'step_completed',
+          {
+            result: 'done',
+          }
+        );
+
+        await expect(
+          updateStep(
+            events,
+            testRunId,
+            'step_completed_retry',
+            'step_retrying',
+            {
+              error: 'Retry attempt',
+            }
+          )
+        ).rejects.toThrow(/terminal/i);
+      });
     });
   });
 

From faecbea88c0ed2f50bead69d6ee0cc66a897f908 Mon Sep 17 00:00:00 2001
From: Pranay Prakash <pranay.gp@gmail.com>
Date: Tue, 23 Dec 2025 20:07:08 -0800
Subject: [PATCH 19/27] Fix performance regression: reuse validation reads
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

The validation logic was causing redundant file/DB reads:
- For run events: read run for validation, then read again for update
- For step events: read step for validation, then read again for update

This fix reuses the validation reads:
- world-local: reuse currentRun and validatedStep in event handlers
- world-postgres: fetch startedAt in validation read, reuse for step_started

Before: 2-3 reads per event
After: 1 read per event

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
---
 packages/world-local/src/storage.ts    | 192 ++++++++++++++-----------
 packages/world-postgres/src/storage.ts |  33 ++---
 2 files changed, 120 insertions(+), 105 deletions(-)

diff --git a/packages/world-local/src/storage.ts b/packages/world-local/src/storage.ts
index 1df7f1e0e..10ced6df9 100644
--- a/packages/world-local/src/storage.ts
+++ b/packages/world-local/src/storage.ts
@@ -397,6 +397,8 @@ export function createStorage(basedir: string): Storage {
         }
 
         // Step-related event validation (ordering and terminal state)
+        // Store existingStep so we can reuse it later (avoid double read)
+        let validatedStep: Step | null = null;
         const stepEvents = [
           'step_started',
           'step_completed',
@@ -410,10 +412,10 @@ export function createStorage(basedir: string): Storage {
             'steps',
             `${stepCompositeKey}.json`
           );
-          const existingStep = await readJSON(stepPath, StepSchema);
+          validatedStep = await readJSON(stepPath, StepSchema);
 
           // Event ordering: step must exist before these events
-          if (!existingStep) {
+          if (!validatedStep) {
             throw new WorkflowAPIError(
               `Step "${data.correlationId}" not found`,
               { status: 404 }
@@ -421,16 +423,16 @@ export function createStorage(basedir: string): Storage {
           }
 
           // Step terminal state validation
-          if (isStepTerminal(existingStep.status)) {
+          if (isStepTerminal(validatedStep.status)) {
             throw new WorkflowAPIError(
-              `Cannot modify step in terminal state "${existingStep.status}"`,
+              `Cannot modify step in terminal state "${validatedStep.status}"`,
               { status: 409 }
             );
           }
 
           // On terminal runs: only allow completing/failing in-progress steps
           if (currentRun && isRunTerminal(currentRun.status)) {
-            if (existingStep.status !== 'running') {
+            if (validatedStep.status !== 'running') {
               throw new WorkflowAPIError(
                 `Cannot modify non-running step on run in terminal state "${currentRun.status}"`,
                 { status: 409 }
@@ -498,40 +500,48 @@ export function createStorage(basedir: string): Storage {
           const runPath = path.join(basedir, 'runs', `${effectiveRunId}.json`);
           await writeJSON(runPath, run);
         } else if (data.eventType === 'run_started') {
-          const runPath = path.join(basedir, 'runs', `${effectiveRunId}.json`);
-          const existingRun = await readJSON(runPath, WorkflowRunSchema);
-          if (existingRun) {
+          // Reuse currentRun from validation (already read above)
+          if (currentRun) {
+            const runPath = path.join(
+              basedir,
+              'runs',
+              `${effectiveRunId}.json`
+            );
             run = {
-              runId: existingRun.runId,
-              deploymentId: existingRun.deploymentId,
-              workflowName: existingRun.workflowName,
-              executionContext: existingRun.executionContext,
-              input: existingRun.input,
-              createdAt: existingRun.createdAt,
-              expiredAt: existingRun.expiredAt,
+              runId: currentRun.runId,
+              deploymentId: currentRun.deploymentId,
+              workflowName: currentRun.workflowName,
+              executionContext: currentRun.executionContext,
+              input: currentRun.input,
+              createdAt: currentRun.createdAt,
+              expiredAt: currentRun.expiredAt,
               status: 'running',
               output: undefined,
               error: undefined,
               completedAt: undefined,
-              startedAt: existingRun.startedAt ?? now,
+              startedAt: currentRun.startedAt ?? now,
               updatedAt: now,
             };
             await writeJSON(runPath, run, { overwrite: true });
           }
         } else if (data.eventType === 'run_completed' && 'eventData' in data) {
           const completedData = data.eventData as { output?: any };
-          const runPath = path.join(basedir, 'runs', `${effectiveRunId}.json`);
-          const existingRun = await readJSON(runPath, WorkflowRunSchema);
-          if (existingRun) {
+          // Reuse currentRun from validation (already read above)
+          if (currentRun) {
+            const runPath = path.join(
+              basedir,
+              'runs',
+              `${effectiveRunId}.json`
+            );
             run = {
-              runId: existingRun.runId,
-              deploymentId: existingRun.deploymentId,
-              workflowName: existingRun.workflowName,
-              executionContext: existingRun.executionContext,
-              input: existingRun.input,
-              createdAt: existingRun.createdAt,
-              expiredAt: existingRun.expiredAt,
-              startedAt: existingRun.startedAt,
+              runId: currentRun.runId,
+              deploymentId: currentRun.deploymentId,
+              workflowName: currentRun.workflowName,
+              executionContext: currentRun.executionContext,
+              input: currentRun.input,
+              createdAt: currentRun.createdAt,
+              expiredAt: currentRun.expiredAt,
+              startedAt: currentRun.startedAt,
               status: 'completed',
               output: completedData.output,
               error: undefined,
@@ -546,18 +556,22 @@ export function createStorage(basedir: string): Storage {
             error: any;
             errorCode?: string;
           };
-          const runPath = path.join(basedir, 'runs', `${effectiveRunId}.json`);
-          const existingRun = await readJSON(runPath, WorkflowRunSchema);
-          if (existingRun) {
+          // Reuse currentRun from validation (already read above)
+          if (currentRun) {
+            const runPath = path.join(
+              basedir,
+              'runs',
+              `${effectiveRunId}.json`
+            );
             run = {
-              runId: existingRun.runId,
-              deploymentId: existingRun.deploymentId,
-              workflowName: existingRun.workflowName,
-              executionContext: existingRun.executionContext,
-              input: existingRun.input,
-              createdAt: existingRun.createdAt,
-              expiredAt: existingRun.expiredAt,
-              startedAt: existingRun.startedAt,
+              runId: currentRun.runId,
+              deploymentId: currentRun.deploymentId,
+              workflowName: currentRun.workflowName,
+              executionContext: currentRun.executionContext,
+              input: currentRun.input,
+              createdAt: currentRun.createdAt,
+              expiredAt: currentRun.expiredAt,
+              startedAt: currentRun.startedAt,
               status: 'failed',
               output: undefined,
               error: {
@@ -575,18 +589,22 @@ export function createStorage(basedir: string): Storage {
             await deleteAllHooksForRun(basedir, effectiveRunId);
           }
         } else if (data.eventType === 'run_cancelled') {
-          const runPath = path.join(basedir, 'runs', `${effectiveRunId}.json`);
-          const existingRun = await readJSON(runPath, WorkflowRunSchema);
-          if (existingRun) {
+          // Reuse currentRun from validation (already read above)
+          if (currentRun) {
+            const runPath = path.join(
+              basedir,
+              'runs',
+              `${effectiveRunId}.json`
+            );
             run = {
-              runId: existingRun.runId,
-              deploymentId: existingRun.deploymentId,
-              workflowName: existingRun.workflowName,
-              executionContext: existingRun.executionContext,
-              input: existingRun.input,
-              createdAt: existingRun.createdAt,
-              expiredAt: existingRun.expiredAt,
-              startedAt: existingRun.startedAt,
+              runId: currentRun.runId,
+              deploymentId: currentRun.deploymentId,
+              workflowName: currentRun.workflowName,
+              executionContext: currentRun.executionContext,
+              input: currentRun.input,
+              createdAt: currentRun.createdAt,
+              expiredAt: currentRun.expiredAt,
+              startedAt: currentRun.startedAt,
               status: 'cancelled',
               output: undefined,
               error: undefined,
@@ -630,38 +648,38 @@ export function createStorage(basedir: string): Storage {
         } else if (data.eventType === 'step_started') {
           // step_started: Increments attempt, sets status to 'running'
           // Sets startedAt only on the first start (not updated on retries)
-          const stepCompositeKey = `${effectiveRunId}-${data.correlationId}`;
-          const stepPath = path.join(
-            basedir,
-            'steps',
-            `${stepCompositeKey}.json`
-          );
-          const existingStep = await readJSON(stepPath, StepSchema);
-          if (existingStep) {
+          // Reuse validatedStep from validation (already read above)
+          if (validatedStep) {
+            const stepCompositeKey = `${effectiveRunId}-${data.correlationId}`;
+            const stepPath = path.join(
+              basedir,
+              'steps',
+              `${stepCompositeKey}.json`
+            );
             step = {
-              ...existingStep,
+              ...validatedStep,
               status: 'running',
               // Only set startedAt on the first start
-              startedAt: existingStep.startedAt ?? now,
+              startedAt: validatedStep.startedAt ?? now,
               // Increment attempt counter on every start
-              attempt: existingStep.attempt + 1,
+              attempt: validatedStep.attempt + 1,
               updatedAt: now,
             };
             await writeJSON(stepPath, step, { overwrite: true });
           }
         } else if (data.eventType === 'step_completed' && 'eventData' in data) {
           // step_completed: Terminal state with output
+          // Reuse validatedStep from validation (already read above)
           const completedData = data.eventData as { result: any };
-          const stepCompositeKey = `${effectiveRunId}-${data.correlationId}`;
-          const stepPath = path.join(
-            basedir,
-            'steps',
-            `${stepCompositeKey}.json`
-          );
-          const existingStep = await readJSON(stepPath, StepSchema);
-          if (existingStep) {
+          if (validatedStep) {
+            const stepCompositeKey = `${effectiveRunId}-${data.correlationId}`;
+            const stepPath = path.join(
+              basedir,
+              'steps',
+              `${stepCompositeKey}.json`
+            );
             step = {
-              ...existingStep,
+              ...validatedStep,
               status: 'completed',
               output: completedData.result,
               completedAt: now,
@@ -671,18 +689,18 @@ export function createStorage(basedir: string): Storage {
           }
         } else if (data.eventType === 'step_failed' && 'eventData' in data) {
           // step_failed: Terminal state with error
+          // Reuse validatedStep from validation (already read above)
           const failedData = data.eventData as {
             error: any;
             stack?: string;
           };
-          const stepCompositeKey = `${effectiveRunId}-${data.correlationId}`;
-          const stepPath = path.join(
-            basedir,
-            'steps',
-            `${stepCompositeKey}.json`
-          );
-          const existingStep = await readJSON(stepPath, StepSchema);
-          if (existingStep) {
+          if (validatedStep) {
+            const stepCompositeKey = `${effectiveRunId}-${data.correlationId}`;
+            const stepPath = path.join(
+              basedir,
+              'steps',
+              `${stepCompositeKey}.json`
+            );
             const error = {
               message:
                 typeof failedData.error === 'string'
@@ -691,7 +709,7 @@ export function createStorage(basedir: string): Storage {
               stack: failedData.stack,
             };
             step = {
-              ...existingStep,
+              ...validatedStep,
               status: 'failed',
               error,
               completedAt: now,
@@ -701,21 +719,21 @@ export function createStorage(basedir: string): Storage {
           }
         } else if (data.eventType === 'step_retrying' && 'eventData' in data) {
           // step_retrying: Sets status back to 'pending', records error
+          // Reuse validatedStep from validation (already read above)
           const retryData = data.eventData as {
             error: any;
             stack?: string;
             retryAfter?: Date;
           };
-          const stepCompositeKey = `${effectiveRunId}-${data.correlationId}`;
-          const stepPath = path.join(
-            basedir,
-            'steps',
-            `${stepCompositeKey}.json`
-          );
-          const existingStep = await readJSON(stepPath, StepSchema);
-          if (existingStep) {
+          if (validatedStep) {
+            const stepCompositeKey = `${effectiveRunId}-${data.correlationId}`;
+            const stepPath = path.join(
+              basedir,
+              'steps',
+              `${stepCompositeKey}.json`
+            );
             step = {
-              ...existingStep,
+              ...validatedStep,
               status: 'pending',
               error: {
                 message:
diff --git a/packages/world-postgres/src/storage.ts b/packages/world-postgres/src/storage.ts
index d6e526f1a..95198d7aa 100644
--- a/packages/world-postgres/src/storage.ts
+++ b/packages/world-postgres/src/storage.ts
@@ -279,6 +279,9 @@ export function createEventsStorage(drizzle: Drizzle): Storage['events'] {
       }
 
       // Step-related event validation (ordering and terminal state)
+      // Fetch status + startedAt so we can reuse for step_started (avoid double read)
+      let validatedStep: { status: string; startedAt: Date | null } | null =
+        null;
       const stepEvents = [
         'step_started',
         'step_completed',
@@ -287,7 +290,10 @@ export function createEventsStorage(drizzle: Drizzle): Storage['events'] {
       ];
       if (stepEvents.includes(data.eventType) && data.correlationId) {
         const [existingStep] = await drizzle
-          .select({ status: Schema.steps.status })
+          .select({
+            status: Schema.steps.status,
+            startedAt: Schema.steps.startedAt,
+          })
           .from(Schema.steps)
           .where(
             and(
@@ -297,24 +303,26 @@ export function createEventsStorage(drizzle: Drizzle): Storage['events'] {
           )
           .limit(1);
 
+        validatedStep = existingStep ?? null;
+
         // Event ordering: step must exist before these events
-        if (!existingStep) {
+        if (!validatedStep) {
           throw new WorkflowAPIError(`Step "${data.correlationId}" not found`, {
             status: 404,
           });
         }
 
         // Step terminal state validation
-        if (isStepTerminal(existingStep.status)) {
+        if (isStepTerminal(validatedStep.status)) {
           throw new WorkflowAPIError(
-            `Cannot modify step in terminal state "${existingStep.status}"`,
+            `Cannot modify step in terminal state "${validatedStep.status}"`,
             { status: 409 }
           );
         }
 
         // On terminal runs: only allow completing/failing in-progress steps
         if (currentRun && isRunTerminal(currentRun.status)) {
-          if (existingStep.status !== 'running') {
+          if (validatedStep.status !== 'running') {
             throw new WorkflowAPIError(
               `Cannot modify non-running step on run in terminal state "${currentRun.status}"`,
               { status: 409 }
@@ -491,20 +499,9 @@ export function createEventsStorage(drizzle: Drizzle): Storage['events'] {
 
       // Handle step_started event: increment attempt, set status to 'running'
       // Sets startedAt (maps to startedAt) only on first start
+      // Reuse validatedStep from validation (already read above)
       if (data.eventType === 'step_started') {
-        // First, get the current step to check attempt
-        const [existingStep] = await drizzle
-          .select()
-          .from(Schema.steps)
-          .where(
-            and(
-              eq(Schema.steps.runId, effectiveRunId),
-              eq(Schema.steps.stepId, data.correlationId!)
-            )
-          )
-          .limit(1);
-
-        const isFirstStart = !existingStep?.startedAt;
+        const isFirstStart = !validatedStep?.startedAt;
 
         const [stepValue] = await drizzle
           .update(Schema.steps)

From a4569e63f301c32147440f2cf49e2142ae823bee Mon Sep 17 00:00:00 2001
From: Pranay Prakash <pranay.gp@gmail.com>
Date: Tue, 23 Dec 2025 20:39:28 -0800
Subject: [PATCH 20/27] Optimize events.create: skip redundant run validation
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Skip run validation reads for step_completed and step_retrying events
since they only operate on running steps, and running steps are always
allowed to modify regardless of run state. This saves 1-2 I/O operations
per step event.

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
---
 packages/world-local/src/storage.ts    | 9 ++++++++-
 packages/world-postgres/src/storage.ts | 9 ++++++++-
 2 files changed, 16 insertions(+), 2 deletions(-)

diff --git a/packages/world-local/src/storage.ts b/packages/world-local/src/storage.ts
index 10ced6df9..1a2ead142 100644
--- a/packages/world-local/src/storage.ts
+++ b/packages/world-local/src/storage.ts
@@ -328,8 +328,15 @@ export function createStorage(basedir: string): Storage {
           ['completed', 'failed'].includes(status);
 
         // Get current run state for validation (if not creating a new run)
+        // Skip run validation for step_completed and step_retrying - they only operate
+        // on running steps, and running steps are always allowed to modify regardless
+        // of run state. This optimization saves filesystem reads per step event.
         let currentRun: WorkflowRun | null = null;
-        if (data.eventType !== 'run_created') {
+        const skipRunValidationEvents = ['step_completed', 'step_retrying'];
+        if (
+          data.eventType !== 'run_created' &&
+          !skipRunValidationEvents.includes(data.eventType)
+        ) {
           const runPath = path.join(basedir, 'runs', `${effectiveRunId}.json`);
           currentRun = await readJSON(runPath, WorkflowRunSchema);
         }
diff --git a/packages/world-postgres/src/storage.ts b/packages/world-postgres/src/storage.ts
index 95198d7aa..5f959f62d 100644
--- a/packages/world-postgres/src/storage.ts
+++ b/packages/world-postgres/src/storage.ts
@@ -204,8 +204,15 @@ export function createEventsStorage(drizzle: Drizzle): Storage['events'] {
       // ============================================================
 
       // Get current run state for validation (if not creating a new run)
+      // Skip run validation for step_completed and step_retrying - they only operate
+      // on running steps, and running steps are always allowed to modify regardless
+      // of run state. This optimization saves database queries per step event.
       let currentRun: { status: string } | null = null;
-      if (data.eventType !== 'run_created') {
+      const skipRunValidationEvents = ['step_completed', 'step_retrying'];
+      if (
+        data.eventType !== 'run_created' &&
+        !skipRunValidationEvents.includes(data.eventType)
+      ) {
         const [runValue] = await drizzle
           .select({ status: Schema.runs.status })
           .from(Schema.runs)

From c8b6af63862165d23879b766162a977e83e1ea73 Mon Sep 17 00:00:00 2001
From: Pranay Prakash <pranay.gp@gmail.com>
Date: Tue, 23 Dec 2025 21:15:46 -0800
Subject: [PATCH 21/27] Optimize postgres events.create with prepared
 statements and conditional updates
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Performance optimizations for world-postgres:
1. Add prepared statements for validation queries (run status, step validation, hook token)
2. Use conditional UPDATE for step_completed/step_failed (validation in WHERE clause)
3. Skip validation query on happy path - only fetch on error

This reduces queries per step from 10 to ~7 on the happy path:
- step_started: 4 queries (prepared run + step validation + update + event)
- step_completed: 2 queries (conditional update + event) vs 3 before
- step_failed: 2 queries (conditional update + event) vs 3 before

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
---
 packages/world-postgres/src/storage.ts | 131 ++++++++++++++++++-------
 1 file changed, 97 insertions(+), 34 deletions(-)

diff --git a/packages/world-postgres/src/storage.ts b/packages/world-postgres/src/storage.ts
index 5f959f62d..81b2e256e 100644
--- a/packages/world-postgres/src/storage.ts
+++ b/packages/world-postgres/src/storage.ts
@@ -17,7 +17,7 @@ import {
   StepSchema,
   WorkflowRunSchema,
 } from '@workflow/world';
-import { and, desc, eq, gt, lt, sql } from 'drizzle-orm';
+import { and, desc, eq, gt, lt, notInArray, sql } from 'drizzle-orm';
 import { monotonicFactory } from 'ulid';
 import { type Drizzle, Schema } from './drizzle/index.js';
 import type { SerializedContent } from './drizzle/schema.js';
@@ -171,6 +171,36 @@ export function createEventsStorage(drizzle: Drizzle): Storage['events'] {
   const ulid = monotonicFactory();
   const { events } = Schema;
 
+  // Prepared statements for validation queries (performance optimization)
+  const getRunStatus = drizzle
+    .select({ status: Schema.runs.status })
+    .from(Schema.runs)
+    .where(eq(Schema.runs.runId, sql.placeholder('runId')))
+    .limit(1)
+    .prepare('events_get_run_status');
+
+  const getStepForValidation = drizzle
+    .select({
+      status: Schema.steps.status,
+      startedAt: Schema.steps.startedAt,
+    })
+    .from(Schema.steps)
+    .where(
+      and(
+        eq(Schema.steps.runId, sql.placeholder('runId')),
+        eq(Schema.steps.stepId, sql.placeholder('stepId'))
+      )
+    )
+    .limit(1)
+    .prepare('events_get_step_for_validation');
+
+  const getHookByToken = drizzle
+    .select({ hookId: Schema.hooks.hookId })
+    .from(Schema.hooks)
+    .where(eq(Schema.hooks.token, sql.placeholder('token')))
+    .limit(1)
+    .prepare('events_get_hook_by_token');
+
   return {
     async create(runId, data, params): Promise<EventResult> {
       const eventId = `wevt_${ulid()}`;
@@ -213,11 +243,10 @@ export function createEventsStorage(drizzle: Drizzle): Storage['events'] {
         data.eventType !== 'run_created' &&
         !skipRunValidationEvents.includes(data.eventType)
       ) {
-        const [runValue] = await drizzle
-          .select({ status: Schema.runs.status })
-          .from(Schema.runs)
-          .where(eq(Schema.runs.runId, effectiveRunId))
-          .limit(1);
+        // Use prepared statement for better performance
+        const [runValue] = await getRunStatus.execute({
+          runId: effectiveRunId,
+        });
         currentRun = runValue ?? null;
       }
 
@@ -287,28 +316,23 @@ export function createEventsStorage(drizzle: Drizzle): Storage['events'] {
 
       // Step-related event validation (ordering and terminal state)
       // Fetch status + startedAt so we can reuse for step_started (avoid double read)
+      // Skip validation for step_completed/step_failed - use conditional UPDATE instead
       let validatedStep: { status: string; startedAt: Date | null } | null =
         null;
-      const stepEvents = [
-        'step_started',
+      const stepEventsNeedingValidation = ['step_started', 'step_retrying'];
+      const stepEventsUsingConditionalUpdate = [
         'step_completed',
         'step_failed',
-        'step_retrying',
       ];
-      if (stepEvents.includes(data.eventType) && data.correlationId) {
-        const [existingStep] = await drizzle
-          .select({
-            status: Schema.steps.status,
-            startedAt: Schema.steps.startedAt,
-          })
-          .from(Schema.steps)
-          .where(
-            and(
-              eq(Schema.steps.runId, effectiveRunId),
-              eq(Schema.steps.stepId, data.correlationId)
-            )
-          )
-          .limit(1);
+      if (
+        stepEventsNeedingValidation.includes(data.eventType) &&
+        data.correlationId
+      ) {
+        // Use prepared statement for better performance
+        const [existingStep] = await getStepForValidation.execute({
+          runId: effectiveRunId,
+          stepId: data.correlationId,
+        });
 
         validatedStep = existingStep ?? null;
 
@@ -532,6 +556,7 @@ export function createEventsStorage(drizzle: Drizzle): Storage['events'] {
       }
 
       // Handle step_completed event: update step status
+      // Uses conditional UPDATE to skip validation query (performance optimization)
       if (data.eventType === 'step_completed') {
         const eventData = (data as any).eventData as { result?: any };
         const [stepValue] = await drizzle
@@ -544,16 +569,37 @@ export function createEventsStorage(drizzle: Drizzle): Storage['events'] {
           .where(
             and(
               eq(Schema.steps.runId, effectiveRunId),
-              eq(Schema.steps.stepId, data.correlationId!)
+              eq(Schema.steps.stepId, data.correlationId!),
+              // Only update if not already in terminal state (validation in WHERE clause)
+              notInArray(Schema.steps.status, ['completed', 'failed'])
             )
           )
           .returning();
         if (stepValue) {
           step = deserializeStepError(compact(stepValue));
+        } else {
+          // Step not updated - check if it exists and why
+          const [existing] = await getStepForValidation.execute({
+            runId: effectiveRunId,
+            stepId: data.correlationId!,
+          });
+          if (!existing) {
+            throw new WorkflowAPIError(
+              `Step "${data.correlationId}" not found`,
+              { status: 404 }
+            );
+          }
+          if (['completed', 'failed'].includes(existing.status)) {
+            throw new WorkflowAPIError(
+              `Cannot modify step in terminal state "${existing.status}"`,
+              { status: 409 }
+            );
+          }
         }
       }
 
       // Handle step_failed event: terminal state with error
+      // Uses conditional UPDATE to skip validation query (performance optimization)
       if (data.eventType === 'step_failed') {
         const eventData = (data as any).eventData as {
           error?: any;
@@ -579,12 +625,32 @@ export function createEventsStorage(drizzle: Drizzle): Storage['events'] {
           .where(
             and(
               eq(Schema.steps.runId, effectiveRunId),
-              eq(Schema.steps.stepId, data.correlationId!)
+              eq(Schema.steps.stepId, data.correlationId!),
+              // Only update if not already in terminal state (validation in WHERE clause)
+              notInArray(Schema.steps.status, ['completed', 'failed'])
             )
           )
           .returning();
         if (stepValue) {
           step = deserializeStepError(compact(stepValue));
+        } else {
+          // Step not updated - check if it exists and why
+          const [existing] = await getStepForValidation.execute({
+            runId: effectiveRunId,
+            stepId: data.correlationId!,
+          });
+          if (!existing) {
+            throw new WorkflowAPIError(
+              `Step "${data.correlationId}" not found`,
+              { status: 404 }
+            );
+          }
+          if (['completed', 'failed'].includes(existing.status)) {
+            throw new WorkflowAPIError(
+              `Cannot modify step in terminal state "${existing.status}"`,
+              { status: 409 }
+            );
+          }
         }
       }
 
@@ -625,21 +691,18 @@ export function createEventsStorage(drizzle: Drizzle): Storage['events'] {
       }
 
       // Handle hook_created event: create hook entity
+      // Uses prepared statement for token uniqueness check (performance optimization)
       if (data.eventType === 'hook_created') {
         const eventData = (data as any).eventData as {
           token: string;
           metadata?: any;
         };
 
-        // Check for duplicate token before creating hook
-        // Token must be unique per tenant (ownerId, projectId, environment)
-        const existingHook = await drizzle
-          .select({ hookId: Schema.hooks.hookId })
-          .from(Schema.hooks)
-          .where(eq(Schema.hooks.token, eventData.token))
-          .limit(1);
-
-        if (existingHook.length > 0) {
+        // Check for duplicate token using prepared statement
+        const [existingHook] = await getHookByToken.execute({
+          token: eventData.token,
+        });
+        if (existingHook) {
           throw new WorkflowAPIError(
             `Hook with token ${eventData.token} already exists for this project`,
             { status: 409 }

From e4f7ca185f8d0b7f3cbb61d6b7a1c5c95134f922 Mon Sep 17 00:00:00 2001
From: Pranay Prakash <pranay.gp@gmail.com>
Date: Tue, 23 Dec 2025 22:01:23 -0800
Subject: [PATCH 22/27] Fix unused variable in postgres storage
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Remove stepEventsUsingConditionalUpdate variable that was declared
but never used (TypeScript strict mode error).

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
---
 packages/world-postgres/src/storage.ts | 4 ----
 1 file changed, 4 deletions(-)

diff --git a/packages/world-postgres/src/storage.ts b/packages/world-postgres/src/storage.ts
index 81b2e256e..026e9e29c 100644
--- a/packages/world-postgres/src/storage.ts
+++ b/packages/world-postgres/src/storage.ts
@@ -320,10 +320,6 @@ export function createEventsStorage(drizzle: Drizzle): Storage['events'] {
       let validatedStep: { status: string; startedAt: Date | null } | null =
         null;
       const stepEventsNeedingValidation = ['step_started', 'step_retrying'];
-      const stepEventsUsingConditionalUpdate = [
-        'step_completed',
-        'step_failed',
-      ];
       if (
         stepEventsNeedingValidation.includes(data.eventType) &&
         data.correlationId

From 5d9512c3c42377337bae34cbfb258668829a8ae4 Mon Sep 17 00:00:00 2001
From: Pranay Prakash <pranay.gp@gmail.com>
Date: Tue, 23 Dec 2025 22:27:01 -0800
Subject: [PATCH 23/27] Add Event Sourcing documentation page
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

- New docs page explaining the event sourcing architecture
- Entity lifecycle diagrams for runs, steps, hooks, and waits
- Event types reference tables
- Terminal states and atomicity guarantees documentation
- Added mermaid diagram style guide to docs README

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
---
 docs/README.md                                |  63 +++++
 .../docs/how-it-works/event-sourcing.mdx      | 219 ++++++++++++++++++
 docs/content/docs/how-it-works/meta.json      |   3 +-
 3 files changed, 284 insertions(+), 1 deletion(-)
 create mode 100644 docs/content/docs/how-it-works/event-sourcing.mdx

diff --git a/docs/README.md b/docs/README.md
index 8269d622b..d4520e10a 100644
--- a/docs/README.md
+++ b/docs/README.md
@@ -1,3 +1,66 @@
 # Workflow DevKit Docs
 
 Check out the docs [here](https://useworkflow.dev/)
+
+## Mermaid Diagram Style Guide
+
+When adding diagrams to documentation, follow these conventions for consistency.
+
+### Diagram Type
+
+Use `flowchart TD` (top-down) or `flowchart LR` (left-right) for flow diagrams:
+
+```mermaid
+flowchart TD
+    A["Source Code"] --> B["Transform"]
+    B --> C["Output"]
+```
+
+### Node Syntax
+
+Use square brackets with double quotes for rectangular nodes:
+
+```
+A["Label Text"]           # Correct - rectangular node
+A[Label Text]             # Avoid - can cause parsing issues
+A(Label Text)             # Avoid - rounded node, inconsistent style
+```
+
+### Edge Labels
+
+Use the pipe syntax with double quotes for edge labels:
+
+```
+A -->|"label"| B          # Correct
+A --> B                   # Correct (no label)
+```
+
+### Highlighting Important Nodes
+
+Use the purple color scheme to highlight terminal states or key components:
+
+```
+style NodeId fill:#a78bfa,stroke:#8b5cf6,color:#000
+```
+
+Place all `style` declarations at the end of the diagram.
+
+### Complete Example
+
+```mermaid
+flowchart TD
+    A["(start)"] --> B["pending"]
+    B -->|"started"| C["running"]
+    C -->|"completed"| D["completed"]
+    C -->|"failed"| E["failed"]
+
+    style D fill:#a78bfa,stroke:#8b5cf6,color:#000
+    style E fill:#a78bfa,stroke:#8b5cf6,color:#000
+```
+
+### Guidelines
+
+- Keep diagrams simple and readable
+- Use meaningful node labels
+- Limit complexity - split into multiple diagrams if needed
+- Add a legend or callout explaining highlighted nodes when appropriate
diff --git a/docs/content/docs/how-it-works/event-sourcing.mdx b/docs/content/docs/how-it-works/event-sourcing.mdx
new file mode 100644
index 000000000..14b99bbad
--- /dev/null
+++ b/docs/content/docs/how-it-works/event-sourcing.mdx
@@ -0,0 +1,219 @@
+---
+title: Event Sourcing
+---
+
+<Callout>
+This guide explores how the Workflow DevKit uses event sourcing internally. Understanding these concepts is helpful for debugging and building observability tools, but is not required to use workflows. For getting started with workflows, see the [getting started](/docs/getting-started) guides for your framework.
+</Callout>
+
+The Workflow DevKit uses event sourcing to track all state changes in workflow executions. Every mutation creates an event that is persisted to the event log, and entity state is derived by replaying these events.
+
+This page explains the event sourcing model, entity lifecycles, and the atomicity guarantees that make durable execution reliable.
+
+## Event Sourcing Overview
+
+Event sourcing is a persistence pattern where state changes are stored as a sequence of events rather than by updating records in place. The current state of any entity is reconstructed by replaying its events from the beginning.
+
+**Benefits for durable workflows:**
+
+- **Complete audit trail**: Every state change is recorded with its timestamp and context
+- **Debugging**: Replay the exact sequence of events that led to any state
+- **Consistency**: Events provide a single source of truth for all entity state
+- **Recoverability**: State can be reconstructed from the event log after failures
+
+In the Workflow DevKit, four types of entities are managed through events:
+
+- **Runs**: Workflow execution instances
+- **Steps**: Individual atomic operations within a workflow
+- **Hooks**: Webhook endpoints that can receive external data
+- **Waits**: Sleep or delay operations
+
+## Entity Lifecycles
+
+Each entity type follows a specific lifecycle defined by the events that can affect it. Events transition entities between states, and certain states are terminal—once reached, no further transitions are possible.
+
+<Callout type="info">
+In the diagrams below, <span style={{color: '#8b5cf6', fontWeight: 'bold'}}>purple nodes</span> indicate terminal states that cannot be transitioned out of.
+</Callout>
+
+### Run Lifecycle
+
+A run represents a single execution of a workflow function. Runs begin in `pending` state when created, transition to `running` when execution starts, and end in one of three terminal states.
+
+```mermaid
+flowchart TD
+    A["(start)"] -->|"run_created"| B["pending"]
+    B -->|"run_started"| C["running"]
+    C -->|"run_completed"| D["completed"]
+    C -->|"run_failed"| E["failed"]
+    C -->|"run_cancelled"| F["cancelled"]
+    B -->|"run_cancelled"| F
+
+    style D fill:#a78bfa,stroke:#8b5cf6,color:#000
+    style E fill:#a78bfa,stroke:#8b5cf6,color:#000
+    style F fill:#a78bfa,stroke:#8b5cf6,color:#000
+```
+
+**Run states:**
+
+- `pending`: Created but not yet executing
+- `running`: Actively executing workflow code
+- `completed`: Finished successfully with an output value
+- `failed`: Terminated due to an unrecoverable error
+- `cancelled`: Explicitly cancelled by the user or system
+
+### Step Lifecycle
+
+A step represents a single invocation of a step function. Steps can retry on failure, either transitioning back to `pending` via `step_retrying` or being re-executed directly with another `step_started` event.
+
+```mermaid
+flowchart TD
+    A["(start)"] -->|"step_created"| B["pending"]
+    B -->|"step_started"| C["running"]
+    C -->|"step_completed"| D["completed"]
+    C -->|"step_failed"| E["failed"]
+    C -.->|"step_retrying"| B
+
+    style D fill:#a78bfa,stroke:#8b5cf6,color:#000
+    style E fill:#a78bfa,stroke:#8b5cf6,color:#000
+```
+
+**Step states:**
+
+- `pending`: Created but not yet executing, or waiting to retry
+- `running`: Actively executing step code
+- `completed`: Finished successfully with a result value
+- `failed`: Terminated after exhausting all retry attempts
+
+<Callout type="info">
+The `step_retrying` event is optional. Steps can retry without it - the retry mechanism works regardless of whether this event is emitted. You may see back-to-back `step_started` events in logs when a step retries after a timeout or when the error is not explicitly captured.
+</Callout>
+
+When present, the `step_retrying` event moves a step back to `pending` state and records the error that caused the retry. This provides two benefits:
+
+- **Cleaner observability**: The event log explicitly shows retry transitions rather than consecutive `step_started` events
+- **Error history**: The error that triggered the retry is preserved for debugging
+
+### Hook Lifecycle
+
+A hook represents a webhook endpoint created by [`createWebhook()`](/docs/api-reference/workflow/create-webhook). Hooks can receive multiple payloads while active and are disposed when no longer needed.
+
+```mermaid
+flowchart TD
+    A["(start)"] -->|"hook_created"| B["active"]
+    B -->|"hook_received"| B
+    B -->|"hook_disposed"| C["disposed"]
+
+    style C fill:#a78bfa,stroke:#8b5cf6,color:#000
+```
+
+**Hook states:**
+
+- `active`: Ready to receive webhook payloads
+- `disposed`: No longer accepting payloads, token released for reuse
+
+<Callout type="info">
+Hooks are automatically disposed when a workflow reaches a terminal state (`completed`, `failed`, or `cancelled`). The `hook_disposed` event is only needed for explicit disposal before workflow completion.
+</Callout>
+
+### Wait Lifecycle
+
+A wait represents a sleep operation created by [`sleep()`](/docs/api-reference/workflow/sleep). Waits are simple two-state entities that track when a delay period has elapsed.
+
+```mermaid
+flowchart TD
+    A["(start)"] -->|"wait_created"| B["waiting"]
+    B -->|"wait_completed"| C["completed"]
+
+    style C fill:#a78bfa,stroke:#8b5cf6,color:#000
+```
+
+**Wait states:**
+
+- `waiting`: Delay period has not yet elapsed
+- `completed`: Delay period has elapsed, workflow can resume
+
+## Event Types Reference
+
+Events are categorized by the entity type they affect. Each event contains metadata including a timestamp and a `correlationId` that links the event to a specific entity:
+
+- Step events use the `stepId` as the correlation ID
+- Hook events use the `hookId` as the correlation ID
+- Wait events use the `waitId` as the correlation ID
+- Run events do not require a correlation ID since the `runId` itself identifies the entity
+
+### Run Events
+
+| Event | Description |
+|-------|-------------|
+| `run_created` | Creates a new workflow run in `pending` state. Contains the workflow name, input arguments, and deployment context. |
+| `run_started` | Transitions the run to `running` state when execution begins. |
+| `run_completed` | Transitions the run to `completed` state with the workflow's return value. |
+| `run_failed` | Transitions the run to `failed` state with error details and optional error code. |
+| `run_cancelled` | Transitions the run to `cancelled` state. Can be triggered from `pending` or `running` states. |
+
+### Step Events
+
+| Event | Description |
+|-------|-------------|
+| `step_created` | Creates a new step in `pending` state. Contains the step name and serialized input arguments. |
+| `step_started` | Transitions the step to `running` state. Includes the current attempt number for retries. |
+| `step_completed` | Transitions the step to `completed` state with the step's return value. |
+| `step_failed` | Transitions the step to `failed` state with error details. The step will not be retried. |
+| `step_retrying` | (Optional) Transitions the step back to `pending` state for retry. Contains the error that caused the retry and optional delay before the next attempt. When not emitted, retries appear as consecutive `step_started` events. |
+
+### Hook Events
+
+| Event | Description |
+|-------|-------------|
+| `hook_created` | Creates a new hook in `active` state. Contains the webhook token and optional metadata. |
+| `hook_received` | Records that a payload was delivered to the hook. The hook remains `active` and can receive more payloads. |
+| `hook_disposed` | Transitions the hook to `disposed` state. The webhook token is released for reuse by future workflows. |
+
+### Wait Events
+
+| Event | Description |
+|-------|-------------|
+| `wait_created` | Creates a new wait in `waiting` state. Contains the timestamp when the wait should complete. |
+| `wait_completed` | Transitions the wait to `completed` state when the delay period has elapsed. |
+
+## Terminal States
+
+Terminal states represent the end of an entity's lifecycle. Once an entity reaches a terminal state, no further events can transition it to another state.
+
+**Run terminal states:**
+
+- `completed`: Workflow finished successfully
+- `failed`: Workflow encountered an unrecoverable error
+- `cancelled`: Workflow was explicitly cancelled
+
+**Step terminal states:**
+
+- `completed`: Step finished successfully
+- `failed`: Step failed after all retry attempts
+
+**Hook terminal states:**
+
+- `disposed`: Hook is no longer active
+
+**Wait terminal states:**
+
+- `completed`: Delay period has elapsed
+
+Attempting to create an event that would transition an entity out of a terminal state will result in an error. This prevents inconsistent state and ensures the integrity of the event log.
+
+## Event Correlation
+
+Events use a `correlationId` to link related events together. For step, hook, and wait events, the correlation ID identifies the specific entity instance:
+
+- Step events share the same `correlationId` (the step ID) across all events for that step execution
+- Hook events share the same `correlationId` (the hook ID) across all events for that hook
+- Wait events share the same `correlationId` (the wait ID) across creation and completion
+
+Run events do not require a correlation ID since the `runId` itself provides the correlation.
+
+This correlation enables:
+
+- Querying all events for a specific step, hook, or wait
+- Building timelines of entity lifecycle transitions
+- Debugging by tracing the complete history of any entity
diff --git a/docs/content/docs/how-it-works/meta.json b/docs/content/docs/how-it-works/meta.json
index 09d452d82..a69c654e4 100644
--- a/docs/content/docs/how-it-works/meta.json
+++ b/docs/content/docs/how-it-works/meta.json
@@ -3,7 +3,8 @@
   "pages": [
     "understanding-directives",
     "code-transform",
-    "framework-integrations"
+    "framework-integrations",
+    "event-sourcing"
   ],
   "defaultOpen": false
 }

From 09e07b7b9f537195f0cc14c395ba4b52b531a35d Mon Sep 17 00:00:00 2001
From: Pranay Prakash <pranay.gp@gmail.com>
Date: Tue, 23 Dec 2025 22:49:17 -0800
Subject: [PATCH 24/27] Update world-vercel to use v2 API endpoints everywhere
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Migrate all remaining v1 endpoints to v2 for consistency:
- runs.ts: list, create, get, update, cancel
- events.ts: list by runId or correlationId
- steps.ts: list, create, update, get
- hooks.ts: list, get, create, getByToken, dispose
- streamer.ts: write, close, read, listByRunId

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
---
 packages/world-vercel/src/events.ts   |  4 ++--
 packages/world-vercel/src/hooks.ts    | 10 +++++-----
 packages/world-vercel/src/runs.ts     | 10 +++++-----
 packages/world-vercel/src/steps.ts    | 10 +++++-----
 packages/world-vercel/src/streamer.ts |  6 +++---
 5 files changed, 20 insertions(+), 20 deletions(-)

diff --git a/packages/world-vercel/src/events.ts b/packages/world-vercel/src/events.ts
index 341b4e175..55ee5ac31 100644
--- a/packages/world-vercel/src/events.ts
+++ b/packages/world-vercel/src/events.ts
@@ -145,8 +145,8 @@ export async function getWorkflowRunEvents(
   const queryString = searchParams.toString();
   const query = queryString ? `?${queryString}` : '';
   const endpoint = correlationId
-    ? `/v1/events${query}`
-    : `/v1/runs/${runId}/events${query}`;
+    ? `/v2/events${query}`
+    : `/v2/runs/${runId}/events${query}`;
 
   const response = (await makeRequest({
     endpoint,
diff --git a/packages/world-vercel/src/hooks.ts b/packages/world-vercel/src/hooks.ts
index dd5b8190a..87aa7281b 100644
--- a/packages/world-vercel/src/hooks.ts
+++ b/packages/world-vercel/src/hooks.ts
@@ -52,7 +52,7 @@ export async function listHooks(
   if (runId) searchParams.set('runId', runId);
 
   const queryString = searchParams.toString();
-  const endpoint = `/v1/hooks${queryString ? `?${queryString}` : ''}`;
+  const endpoint = `/v2/hooks${queryString ? `?${queryString}` : ''}`;
 
   const response = (await makeRequest({
     endpoint,
@@ -75,7 +75,7 @@ export async function getHook(
   config?: APIConfig
 ): Promise<Hook> {
   const resolveData = params?.resolveData || 'all';
-  const endpoint = `/v1/hooks/${hookId}`;
+  const endpoint = `/v2/hooks/${hookId}`;
 
   const hook = await makeRequest({
     endpoint,
@@ -93,7 +93,7 @@ export async function createHook(
   config?: APIConfig
 ): Promise<Hook> {
   return makeRequest({
-    endpoint: `/v1/hooks/create`,
+    endpoint: `/v2/hooks/create`,
     options: {
       method: 'POST',
       body: JSON.stringify(
@@ -114,7 +114,7 @@ export async function getHookByToken(
   config?: APIConfig
 ): Promise<Hook> {
   return makeRequest({
-    endpoint: `/v1/hooks/by-token?token=${encodeURIComponent(token)}`,
+    endpoint: `/v2/hooks/by-token?token=${encodeURIComponent(token)}`,
     options: {
       method: 'GET',
     },
@@ -128,7 +128,7 @@ export async function disposeHook(
   config?: APIConfig
 ): Promise<Hook> {
   return makeRequest({
-    endpoint: `/v1/hooks/${hookId}`,
+    endpoint: `/v2/hooks/${hookId}`,
     options: { method: 'DELETE' },
     config,
     schema: HookSchema,
diff --git a/packages/world-vercel/src/runs.ts b/packages/world-vercel/src/runs.ts
index 6b624d739..93e13f945 100644
--- a/packages/world-vercel/src/runs.ts
+++ b/packages/world-vercel/src/runs.ts
@@ -97,7 +97,7 @@ export async function listWorkflowRuns(
   searchParams.set('remoteRefBehavior', remoteRefBehavior);
 
   const queryString = searchParams.toString();
-  const endpoint = `/v1/runs${queryString ? `?${queryString}` : ''}`;
+  const endpoint = `/v2/runs${queryString ? `?${queryString}` : ''}`;
 
   const response = (await makeRequest({
     endpoint,
@@ -121,7 +121,7 @@ export async function createWorkflowRun(
   config?: APIConfig
 ): Promise<WorkflowRun> {
   const run = await makeRequest({
-    endpoint: '/v1/runs/create',
+    endpoint: '/v2/runs/create',
     options: {
       method: 'POST',
       body: JSON.stringify(data, dateToStringReplacer),
@@ -144,7 +144,7 @@ export async function getWorkflowRun(
   searchParams.set('remoteRefBehavior', remoteRefBehavior);
 
   const queryString = searchParams.toString();
-  const endpoint = `/v1/runs/${id}${queryString ? `?${queryString}` : ''}`;
+  const endpoint = `/v2/runs/${id}${queryString ? `?${queryString}` : ''}`;
 
   try {
     const run = await makeRequest({
@@ -173,7 +173,7 @@ export async function updateWorkflowRun(
   try {
     const serialized = serializeError(data);
     const run = await makeRequest({
-      endpoint: `/v1/runs/${id}`,
+      endpoint: `/v2/runs/${id}`,
       options: {
         method: 'PUT',
         body: JSON.stringify(serialized, dateToStringReplacer),
@@ -202,7 +202,7 @@ export async function cancelWorkflowRun(
   searchParams.set('remoteRefBehavior', remoteRefBehavior);
 
   const queryString = searchParams.toString();
-  const endpoint = `/v1/runs/${id}/cancel${queryString ? `?${queryString}` : ''}`;
+  const endpoint = `/v2/runs/${id}/cancel${queryString ? `?${queryString}` : ''}`;
 
   try {
     const run = await makeRequest({
diff --git a/packages/world-vercel/src/steps.ts b/packages/world-vercel/src/steps.ts
index de13e10f0..f97014567 100644
--- a/packages/world-vercel/src/steps.ts
+++ b/packages/world-vercel/src/steps.ts
@@ -137,7 +137,7 @@ export async function listWorkflowRunSteps(
   searchParams.set('remoteRefBehavior', remoteRefBehavior);
 
   const queryString = searchParams.toString();
-  const endpoint = `/v1/runs/${runId}/steps${queryString ? `?${queryString}` : ''}`;
+  const endpoint = `/v2/runs/${runId}/steps${queryString ? `?${queryString}` : ''}`;
 
   const response = (await makeRequest({
     endpoint,
@@ -160,7 +160,7 @@ export async function createStep(
   config?: APIConfig
 ): Promise<Step> {
   const step = await makeRequest({
-    endpoint: `/v1/runs/${runId}/steps`,
+    endpoint: `/v2/runs/${runId}/steps`,
     options: {
       method: 'POST',
       body: JSON.stringify(data, dateToStringReplacer),
@@ -184,7 +184,7 @@ export async function updateStep(
     wireData.error = JSON.stringify(stepError);
   }
   const step = await makeRequest({
-    endpoint: `/v1/runs/${runId}/steps/${stepId}`,
+    endpoint: `/v2/runs/${runId}/steps/${stepId}`,
     options: {
       method: 'PUT',
       body: JSON.stringify(wireData, dateToStringReplacer),
@@ -209,8 +209,8 @@ export async function getStep(
 
   const queryString = searchParams.toString();
   const endpoint = runId
-    ? `/v1/runs/${runId}/steps/${stepId}${queryString ? `?${queryString}` : ''}`
-    : `/v1/steps/${stepId}${queryString ? `?${queryString}` : ''}`;
+    ? `/v2/runs/${runId}/steps/${stepId}${queryString ? `?${queryString}` : ''}`
+    : `/v2/steps/${stepId}${queryString ? `?${queryString}` : ''}`;
 
   const step = await makeRequest({
     endpoint,
diff --git a/packages/world-vercel/src/streamer.ts b/packages/world-vercel/src/streamer.ts
index 24e1b00ac..017b3eaed 100644
--- a/packages/world-vercel/src/streamer.ts
+++ b/packages/world-vercel/src/streamer.ts
@@ -8,10 +8,10 @@ function getStreamUrl(
 ) {
   if (runId) {
     return new URL(
-      `${httpConfig.baseUrl}/v1/runs/${runId}/stream/${encodeURIComponent(name)}`
+      `${httpConfig.baseUrl}/v2/runs/${runId}/stream/${encodeURIComponent(name)}`
     );
   }
-  return new URL(`${httpConfig.baseUrl}/v1/stream/${encodeURIComponent(name)}`);
+  return new URL(`${httpConfig.baseUrl}/v2/stream/${encodeURIComponent(name)}`);
 }
 
 export function createStreamer(config?: APIConfig): Streamer {
@@ -58,7 +58,7 @@ export function createStreamer(config?: APIConfig): Streamer {
 
     async listStreamsByRunId(runId: string) {
       const httpConfig = await getHttpConfig(config);
-      const url = new URL(`${httpConfig.baseUrl}/v1/runs/${runId}/streams`);
+      const url = new URL(`${httpConfig.baseUrl}/v2/runs/${runId}/streams`);
       const res = await fetch(url, { headers: httpConfig.headers });
       if (!res.ok) throw new Error(`Failed to list streams: ${res.status}`);
       return (await res.json()) as string[];

From aead729e3c53d076a954bfc4220f59aa84974bbb Mon Sep 17 00:00:00 2001
From: Pranay Prakash <pranay.gp@gmail.com>
Date: Tue, 23 Dec 2025 23:49:26 -0800
Subject: [PATCH 25/27] Improve event sourcing documentation accuracy and
 cross-linking
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Technical accuracy improvements:
- Clarify that hook states are conceptual (hooks are deleted, not transitioned)
- Add note about step cancelled status being reserved for future use
- Clarify that waits are conceptual entities not materialized in storage
- Fix run_created event description (deployment ID, execution context)
- Remove atomicity mention from intro (no longer accurate)
- Add hook token reservation explanation and link to hooks docs

Cross-linking improvements:
- Link "event log" mentions to event sourcing page from:
  - workflows-and-steps.mdx (3 locations)
  - understanding-directives.mdx
  - code-transform.mdx (2 locations)
  - streaming.mdx (2 locations)
  - worlds/index.mdx
  - observability/index.mdx
- Add outbound link to errors-and-retries from step retrying section

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
---
 docs/content/docs/foundations/streaming.mdx   |  4 +-
 .../docs/foundations/workflows-and-steps.mdx  |  6 +--
 .../docs/how-it-works/code-transform.mdx      |  4 +-
 .../docs/how-it-works/event-sourcing.mdx      | 39 +++++++++++--------
 .../how-it-works/understanding-directives.mdx |  2 +-
 docs/content/docs/observability/index.mdx     |  2 +-
 docs/content/docs/worlds/index.mdx            |  2 +-
 7 files changed, 33 insertions(+), 26 deletions(-)

diff --git a/docs/content/docs/foundations/streaming.mdx b/docs/content/docs/foundations/streaming.mdx
index fdb684708..844f99779 100644
--- a/docs/content/docs/foundations/streaming.mdx
+++ b/docs/content/docs/foundations/streaming.mdx
@@ -83,7 +83,7 @@ This allows clients to reconnect and continue receiving data from where they lef
 
 [`ReadableStream`](https://developer.mozilla.org/en-US/docs/Web/API/ReadableStream) and [`WritableStream`](https://developer.mozilla.org/en-US/docs/Web/API/WritableStream) are standard Web Streams API types that Workflow DevKit makes serializable. These are not custom types - they follow the web standard - but Workflow DevKit adds the ability to pass them between functions while maintaining their streaming capabilities.
 
-Unlike regular values that are fully serialized to the event log, streams maintain their streaming capabilities when passed between functions.
+Unlike regular values that are fully serialized to the [event log](/docs/how-it-works/event-sourcing), streams maintain their streaming capabilities when passed between functions.
 
 **Key properties:**
 - Stream references can be passed between workflow and step functions
@@ -151,7 +151,7 @@ async function processInputStream(input: ReadableStream<Uint8Array>) {
 You cannot read from or write to streams directly within a workflow function. All stream operations must happen in step functions.
 </Callout>
 
-Workflow functions must be deterministic to support replay. Since streams bypass the event log for performance, reading stream data in a workflow would break determinism - each replay could see different data. By requiring all stream operations to happen in steps, the framework ensures consistent behavior.
+Workflow functions must be deterministic to support replay. Since streams bypass the [event log](/docs/how-it-works/event-sourcing) for performance, reading stream data in a workflow would break determinism - each replay could see different data. By requiring all stream operations to happen in steps, the framework ensures consistent behavior.
 
 For more on determinism and replay, see [Workflows and Steps](/docs/foundations/workflows-and-steps).
 
diff --git a/docs/content/docs/foundations/workflows-and-steps.mdx b/docs/content/docs/foundations/workflows-and-steps.mdx
index 15537d13e..3b2909bdd 100644
--- a/docs/content/docs/foundations/workflows-and-steps.mdx
+++ b/docs/content/docs/foundations/workflows-and-steps.mdx
@@ -36,10 +36,10 @@ export async function processOrderWorkflow(orderId: string) {
 **Key Characteristics:**
 
 - Runs in a sandboxed environment without full Node.js access
-- All step results are persisted to the event log
+- All step results are persisted to the [event log](/docs/how-it-works/event-sourcing)
 - Must be **deterministic** to allow resuming after failures
 
-Determinism in the workflow is required to resume the workflow from a suspension. Essentially, the workflow code gets re-run multiple times during its lifecycle, each time using an event log to resume the workflow to the correct spot.
+Determinism in the workflow is required to resume the workflow from a suspension. Essentially, the workflow code gets re-run multiple times during its lifecycle, each time using the [event log](/docs/how-it-works/event-sourcing) to resume the workflow to the correct spot.
 
 The sandboxed environment that workflows run in already ensures determinism. For instance, `Math.random` and `Date` constructors are fixed in workflow runs, so you are safe to use them, and the framework ensures that the values don't change across replays.
 
@@ -111,7 +111,7 @@ Keep in mind that calling a step function outside of a workflow function will no
 
 ### Suspension and Resumption
 
-Workflow functions have the ability to automatically suspend while they wait on asynchronous work. While suspended, the workflow's state is stored via the event log and no compute resources are used until the workflow resumes execution.
+Workflow functions have the ability to automatically suspend while they wait on asynchronous work. While suspended, the workflow's state is stored via the [event log](/docs/how-it-works/event-sourcing) and no compute resources are used until the workflow resumes execution.
 
 There are multiple ways a workflow can suspend:
 
diff --git a/docs/content/docs/how-it-works/code-transform.mdx b/docs/content/docs/how-it-works/code-transform.mdx
index 1b13797c5..396a2acab 100644
--- a/docs/content/docs/how-it-works/code-transform.mdx
+++ b/docs/content/docs/how-it-works/code-transform.mdx
@@ -140,7 +140,7 @@ handleUserSignup.workflowId = "workflow//workflows/user.js//handleUserSignup"; /
 - The workflow function gets a `workflowId` property for runtime identification
 - The `"use workflow"` directive is removed
 
-**Why this transformation?** When a workflow executes, it needs to replay past steps from the event log rather than re-executing them. The `WORKFLOW_USE_STEP` symbol is a special runtime hook that:
+**Why this transformation?** When a workflow executes, it needs to replay past steps from the [event log](/docs/how-it-works/event-sourcing) rather than re-executing them. The `WORKFLOW_USE_STEP` symbol is a special runtime hook that:
 
 1. Checks if the step has already been executed (in the event log)
 2. If yes: Returns the cached result
@@ -283,7 +283,7 @@ Because workflow functions are deterministic and have no side effects, they can
 
 - Can make API calls, database queries, etc.
 - Have full access to Node.js runtime and APIs
-- Results are cached in the event log after first execution
+- Results are cached in the [event log](/docs/how-it-works/event-sourcing) after first execution
 
 Learn more about [Workflows and Steps](/docs/foundations/workflows-and-steps).
 
diff --git a/docs/content/docs/how-it-works/event-sourcing.mdx b/docs/content/docs/how-it-works/event-sourcing.mdx
index 14b99bbad..820ba8df3 100644
--- a/docs/content/docs/how-it-works/event-sourcing.mdx
+++ b/docs/content/docs/how-it-works/event-sourcing.mdx
@@ -8,7 +8,7 @@ This guide explores how the Workflow DevKit uses event sourcing internally. Unde
 
 The Workflow DevKit uses event sourcing to track all state changes in workflow executions. Every mutation creates an event that is persisted to the event log, and entity state is derived by replaying these events.
 
-This page explains the event sourcing model, entity lifecycles, and the atomicity guarantees that make durable execution reliable.
+This page explains the event sourcing model and entity lifecycles.
 
 ## Event Sourcing Overview
 
@@ -21,12 +21,12 @@ Event sourcing is a persistence pattern where state changes are stored as a sequ
 - **Consistency**: Events provide a single source of truth for all entity state
 - **Recoverability**: State can be reconstructed from the event log after failures
 
-In the Workflow DevKit, four types of entities are managed through events:
+In the Workflow DevKit, the following entity types are managed through events:
 
-- **Runs**: Workflow execution instances
-- **Steps**: Individual atomic operations within a workflow
-- **Hooks**: Webhook endpoints that can receive external data
-- **Waits**: Sleep or delay operations
+- **Runs**: Workflow execution instances (materialized in storage)
+- **Steps**: Individual atomic operations within a workflow (materialized in storage)
+- **Hooks**: Webhook endpoints that can receive external data (materialized in storage)
+- **Waits**: Sleep or delay operations (tracked via events only, not materialized)
 
 ## Entity Lifecycles
 
@@ -84,9 +84,10 @@ flowchart TD
 - `running`: Actively executing step code
 - `completed`: Finished successfully with a result value
 - `failed`: Terminated after exhausting all retry attempts
+- `cancelled`: Reserved for future use (not currently emitted)
 
 <Callout type="info">
-The `step_retrying` event is optional. Steps can retry without it - the retry mechanism works regardless of whether this event is emitted. You may see back-to-back `step_started` events in logs when a step retries after a timeout or when the error is not explicitly captured.
+The `step_retrying` event is optional. Steps can retry without it - the retry mechanism works regardless of whether this event is emitted. You may see back-to-back `step_started` events in logs when a step retries after a timeout or when the error is not explicitly captured. See [Errors and Retries](/docs/foundations/errors-and-retries) for more on how retries work.
 </Callout>
 
 When present, the `step_retrying` event moves a step back to `pending` state and records the error that caused the retry. This provides two benefits:
@@ -109,16 +110,18 @@ flowchart TD
 
 **Hook states:**
 
-- `active`: Ready to receive webhook payloads
-- `disposed`: No longer accepting payloads, token released for reuse
+- `active`: Ready to receive webhook payloads (hook exists in storage)
+- `disposed`: No longer accepting payloads (hook is deleted from storage)
 
-<Callout type="info">
-Hooks are automatically disposed when a workflow reaches a terminal state (`completed`, `failed`, or `cancelled`). The `hook_disposed` event is only needed for explicit disposal before workflow completion.
-</Callout>
+Unlike other entities, hooks don't have a `status` field—the states above are conceptual. An "active" hook is one that exists in storage, while "disposed" means the hook has been deleted. When a `hook_disposed` event is created, the hook record is removed rather than updated.
+
+While a hook is active, its token is reserved and cannot be used by other workflows. This prevents token reuse conflicts across concurrent workflows. When a hook is disposed (either explicitly or when its workflow completes), the token is released and can be claimed by future workflows. Hooks are automatically disposed when a workflow reaches a terminal state (`completed`, `failed`, or `cancelled`). The `hook_disposed` event is only needed for explicit disposal before workflow completion.
+
+See [Hooks](/docs/foundations/hooks) for more on how webhooks work.
 
 ### Wait Lifecycle
 
-A wait represents a sleep operation created by [`sleep()`](/docs/api-reference/workflow/sleep). Waits are simple two-state entities that track when a delay period has elapsed.
+A wait represents a sleep operation created by [`sleep()`](/docs/api-reference/workflow/sleep). Waits track when a delay period has elapsed.
 
 ```mermaid
 flowchart TD
@@ -133,6 +136,10 @@ flowchart TD
 - `waiting`: Delay period has not yet elapsed
 - `completed`: Delay period has elapsed, workflow can resume
 
+<Callout type="info">
+Unlike Runs, Steps, and Hooks, waits are conceptual entities tracked only through events. There is no separate "Wait" record in storage that can be queried—the wait state is derived entirely from the `wait_created` and `wait_completed` events in the event log.
+</Callout>
+
 ## Event Types Reference
 
 Events are categorized by the entity type they affect. Each event contains metadata including a timestamp and a `correlationId` that links the event to a specific entity:
@@ -146,7 +153,7 @@ Events are categorized by the entity type they affect. Each event contains metad
 
 | Event | Description |
 |-------|-------------|
-| `run_created` | Creates a new workflow run in `pending` state. Contains the workflow name, input arguments, and deployment context. |
+| `run_created` | Creates a new workflow run in `pending` state. Contains the deployment ID, workflow name, input arguments, and optional execution context. |
 | `run_started` | Transitions the run to `running` state when execution begins. |
 | `run_completed` | Transitions the run to `completed` state with the workflow's return value. |
 | `run_failed` | Transitions the run to `failed` state with error details and optional error code. |
@@ -168,7 +175,7 @@ Events are categorized by the entity type they affect. Each event contains metad
 |-------|-------------|
 | `hook_created` | Creates a new hook in `active` state. Contains the webhook token and optional metadata. |
 | `hook_received` | Records that a payload was delivered to the hook. The hook remains `active` and can receive more payloads. |
-| `hook_disposed` | Transitions the hook to `disposed` state. The webhook token is released for reuse by future workflows. |
+| `hook_disposed` | Deletes the hook from storage (conceptually transitioning to `disposed` state). The webhook token is released for reuse by future workflows. |
 
 ### Wait Events
 
@@ -194,7 +201,7 @@ Terminal states represent the end of an entity's lifecycle. Once an entity reach
 
 **Hook terminal states:**
 
-- `disposed`: Hook is no longer active
+- `disposed`: Hook has been deleted from storage and is no longer active
 
 **Wait terminal states:**
 
diff --git a/docs/content/docs/how-it-works/understanding-directives.mdx b/docs/content/docs/how-it-works/understanding-directives.mdx
index 5f2787459..d543b793c 100644
--- a/docs/content/docs/how-it-works/understanding-directives.mdx
+++ b/docs/content/docs/how-it-works/understanding-directives.mdx
@@ -47,7 +47,7 @@ export async function onboardUser(userId: string) {
 }
 ```
 
-**The key insight:** Workflows resume from suspension by replaying their code using cached step results from the event log. When a step like `await fetchUserData(userId)` is called:
+**The key insight:** Workflows resume from suspension by replaying their code using cached step results from the [event log](/docs/how-it-works/event-sourcing). When a step like `await fetchUserData(userId)` is called:
 
 - **If already executed:** Returns the cached result immediately from the event log
 - **If not yet executed:** Suspends the workflow, enqueues the step for background execution, and resumes later with the result
diff --git a/docs/content/docs/observability/index.mdx b/docs/content/docs/observability/index.mdx
index 4daf9b867..841a8edef 100644
--- a/docs/content/docs/observability/index.mdx
+++ b/docs/content/docs/observability/index.mdx
@@ -2,7 +2,7 @@
 title: Observability
 ---
 
-Workflow DevKit provides powerful tools to inspect, monitor, and debug your workflows through the CLI and Web UI. These tools allow you to inspect workflow runs, steps, webhooks, events, and stream output.
+Workflow DevKit provides powerful tools to inspect, monitor, and debug your workflows through the CLI and Web UI. These tools allow you to inspect workflow runs, steps, webhooks, [events](/docs/how-it-works/event-sourcing), and stream output.
 
 ## Quick Start
 
diff --git a/docs/content/docs/worlds/index.mdx b/docs/content/docs/worlds/index.mdx
index 67c4d7c7e..5549ae93d 100644
--- a/docs/content/docs/worlds/index.mdx
+++ b/docs/content/docs/worlds/index.mdx
@@ -14,7 +14,7 @@ The Workflow `World` is an interface that abstracts how workflows and steps comm
 ## What is a World?
 
 A World implementation handles:
-- **Workflow Storage**: Persisting workflow state and event logs
+- **Workflow Storage**: Persisting workflow state and [event logs](/docs/how-it-works/event-sourcing)
 - **Step Execution**: Managing step function invocations
 - **Message Passing**: Communication between workflow orchestrator and step functions
 

From d1c485acaa151cea3aa4285ad791df16521128e3 Mon Sep 17 00:00:00 2001
From: Pranay Prakash <pranay.gp@gmail.com>
Date: Tue, 23 Dec 2025 23:50:44 -0800
Subject: [PATCH 26/27] Fix hook documentation to describe general hook
 primitive
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Hooks are the general primitive for pausing workflows and receiving
external data. Webhooks are a specific HTTP-based abstraction built
on top of hooks. Updated documentation to reflect this distinction.

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
---
 docs/content/docs/how-it-works/event-sourcing.mdx | 14 ++++++++------
 1 file changed, 8 insertions(+), 6 deletions(-)

diff --git a/docs/content/docs/how-it-works/event-sourcing.mdx b/docs/content/docs/how-it-works/event-sourcing.mdx
index 820ba8df3..a4a5d80af 100644
--- a/docs/content/docs/how-it-works/event-sourcing.mdx
+++ b/docs/content/docs/how-it-works/event-sourcing.mdx
@@ -25,7 +25,7 @@ In the Workflow DevKit, the following entity types are managed through events:
 
 - **Runs**: Workflow execution instances (materialized in storage)
 - **Steps**: Individual atomic operations within a workflow (materialized in storage)
-- **Hooks**: Webhook endpoints that can receive external data (materialized in storage)
+- **Hooks**: Suspension points that can receive external data (materialized in storage)
 - **Waits**: Sleep or delay operations (tracked via events only, not materialized)
 
 ## Entity Lifecycles
@@ -97,7 +97,9 @@ When present, the `step_retrying` event moves a step back to `pending` state and
 
 ### Hook Lifecycle
 
-A hook represents a webhook endpoint created by [`createWebhook()`](/docs/api-reference/workflow/create-webhook). Hooks can receive multiple payloads while active and are disposed when no longer needed.
+A hook represents a suspension point that can receive external data, created by [`createHook()`](/docs/api-reference/workflow/create-hook). Hooks enable workflows to pause and wait for external events, user interactions, or HTTP requests. Webhooks (created with [`createWebhook()`](/docs/api-reference/workflow/create-webhook)) are a higher-level abstraction built on hooks that adds automatic HTTP request/response handling.
+
+Hooks can receive multiple payloads while active and are disposed when no longer needed.
 
 ```mermaid
 flowchart TD
@@ -110,14 +112,14 @@ flowchart TD
 
 **Hook states:**
 
-- `active`: Ready to receive webhook payloads (hook exists in storage)
+- `active`: Ready to receive payloads (hook exists in storage)
 - `disposed`: No longer accepting payloads (hook is deleted from storage)
 
 Unlike other entities, hooks don't have a `status` field—the states above are conceptual. An "active" hook is one that exists in storage, while "disposed" means the hook has been deleted. When a `hook_disposed` event is created, the hook record is removed rather than updated.
 
 While a hook is active, its token is reserved and cannot be used by other workflows. This prevents token reuse conflicts across concurrent workflows. When a hook is disposed (either explicitly or when its workflow completes), the token is released and can be claimed by future workflows. Hooks are automatically disposed when a workflow reaches a terminal state (`completed`, `failed`, or `cancelled`). The `hook_disposed` event is only needed for explicit disposal before workflow completion.
 
-See [Hooks](/docs/foundations/hooks) for more on how webhooks work.
+See [Hooks & Webhooks](/docs/foundations/hooks) for more on how hooks and webhooks work.
 
 ### Wait Lifecycle
 
@@ -173,9 +175,9 @@ Events are categorized by the entity type they affect. Each event contains metad
 
 | Event | Description |
 |-------|-------------|
-| `hook_created` | Creates a new hook in `active` state. Contains the webhook token and optional metadata. |
+| `hook_created` | Creates a new hook in `active` state. Contains the hook token and optional metadata. |
 | `hook_received` | Records that a payload was delivered to the hook. The hook remains `active` and can receive more payloads. |
-| `hook_disposed` | Deletes the hook from storage (conceptually transitioning to `disposed` state). The webhook token is released for reuse by future workflows. |
+| `hook_disposed` | Deletes the hook from storage (conceptually transitioning to `disposed` state). The token is released for reuse by future workflows. |
 
 ### Wait Events
 

From 4c5fd4c06bf0ab0c6e4483338d92ebb5fa4cc3df Mon Sep 17 00:00:00 2001
From: Pranay Prakash <pranay.gp@gmail.com>
Date: Tue, 23 Dec 2025 23:54:43 -0800
Subject: [PATCH 27/27] Add Entity IDs section to event sourcing docs
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Documents the consistent ID format used across all entities:
- 4-character prefix + underscore + ULID
- Prefixes: wrun_, step_, hook_, wait_, evnt_, strm_
- Explains benefits: easy introspection and chronological ordering

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
---
 .../docs/how-it-works/event-sourcing.mdx      | 19 +++++++++++++++++++
 1 file changed, 19 insertions(+)

diff --git a/docs/content/docs/how-it-works/event-sourcing.mdx b/docs/content/docs/how-it-works/event-sourcing.mdx
index a4a5d80af..c2ca4e6b3 100644
--- a/docs/content/docs/how-it-works/event-sourcing.mdx
+++ b/docs/content/docs/how-it-works/event-sourcing.mdx
@@ -226,3 +226,22 @@ This correlation enables:
 - Querying all events for a specific step, hook, or wait
 - Building timelines of entity lifecycle transitions
 - Debugging by tracing the complete history of any entity
+
+## Entity IDs
+
+All entities in the Workflow DevKit use a consistent ID format: a 4-character prefix followed by an underscore and a [ULID](https://github.com/ulid/spec) (Universally Unique Lexicographically Sortable Identifier).
+
+| Entity | Prefix | Example |
+|--------|--------|---------|
+| Run | `wrun_` | `wrun_01HXYZ123ABC456DEF789GHJ` |
+| Step | `step_` | `step_01HXYZ123ABC456DEF789GHJ` |
+| Hook | `hook_` | `hook_01HXYZ123ABC456DEF789GHJ` |
+| Wait | `wait_` | `wait_01HXYZ123ABC456DEF789GHJ` |
+| Event | `evnt_` | `evnt_01HXYZ123ABC456DEF789GHJ` |
+| Stream | `strm_` | `strm_01HXYZ123ABC456DEF789GHJ` |
+
+**Why this format?**
+
+- **Prefixes enable introspection**: Given any ID, you can immediately identify what type of entity it refers to. This makes debugging, logging, and cross-referencing entities across the system straightforward.
+
+- **ULIDs enable chronological ordering**: Unlike UUIDs, ULIDs encode a timestamp in their first 48 bits, making them lexicographically sortable by creation time. This property is essential for the event log—events are always stored and retrieved in the correct chronological order simply by sorting their IDs.