Commit f9835c8

Add true streaming API with stream_start/3,4 and stream_cancel/1
New event-driven streaming functions that send {py_stream, Ref, Event}
messages as values are yielded from Python generators:

- py:stream_start/3,4 - Start streaming, returns immediately with ref
- py:stream_cancel/1 - Cancel an active stream

Events sent to owner process:

- {py_stream, Ref, {data, Value}} - Each yielded value
- {py_stream, Ref, done} - Stream completed
- {py_stream, Ref, {error, Reason}} - Stream error

Unlike py:stream/3,4 which collects all values at once, stream_start
sends events incrementally. Useful for LLM token streaming, real-time
data feeds, and processing large sequences without memory accumulation.

Also fixes inaccurate comment in py_channel.erl about Python API.
1 parent 039e864 commit f9835c8

File tree

6 files changed (+482, −53)


CHANGELOG.md

Lines changed: 8 additions & 0 deletions
```diff
@@ -2,6 +2,14 @@
 
 ## 2.2.0 (unreleased)
 
+### Added
+
+- **True streaming API** - New `py:stream_start/3,4` and `py:stream_cancel/1` functions
+  for event-driven streaming from Python generators. Unlike `py:stream/3,4` which
+  collects all values at once, `stream_start` sends `{py_stream, Ref, {data, Value}}`
+  messages as values are yielded. Supports both sync and async generators. Useful for
+  LLM token streaming, real-time data feeds, and processing large sequences incrementally.
+
 ### Fixed
 
 - **Channel notification for create_task** - Fixed async channel receive hanging when using
```

docs/streaming.md

Lines changed: 105 additions & 51 deletions
````diff
@@ -6,11 +6,83 @@ This guide covers working with Python generators from Erlang.
 
 Python generators allow processing large datasets or infinite sequences
 efficiently by yielding values one at a time. erlang_python supports
-streaming these values back to Erlang.
+two modes of streaming:
 
-## Generator Expressions
+1. **Batch streaming** (`py:stream/3,4`, `py:stream_eval/1,2`) - Collects all values into a list
+2. **True streaming** (`py:stream_start/3,4`) - Sends events as values are yielded
 
-The simplest way to stream is with generator expressions:
+## True Streaming (Event-driven)
+
+For real-time processing where you need values as they arrive (e.g., LLM tokens,
+live data feeds), use `py:stream_start/3,4`:
+
+```erlang
+%% Start streaming from a Python iterator
+{ok, Ref} = py:stream_start(builtins, iter, [[1,2,3,4,5]]),
+
+%% Receive events as values are yielded
+receive_loop(Ref).
+
+receive_loop(Ref) ->
+    receive
+        {py_stream, Ref, {data, Value}} ->
+            io:format("Got: ~p~n", [Value]),
+            receive_loop(Ref);
+        {py_stream, Ref, done} ->
+            io:format("Complete~n");
+        {py_stream, Ref, {error, Reason}} ->
+            io:format("Error: ~p~n", [Reason])
+    after 30000 ->
+        timeout
+    end.
+```
+
+### Events
+
+The stream sends these messages to the owner process:
+
+- `{py_stream, Ref, {data, Value}}` - Each yielded value
+- `{py_stream, Ref, done}` - Stream completed successfully
+- `{py_stream, Ref, {error, Reason}}` - Stream error
+
+### Options
+
+```erlang
+%% Send events to a different process
+{ok, Ref} = py:stream_start(Module, Func, Args, #{owner => OtherPid}).
+```
+
+### Cancellation
+
+Cancel an active stream:
+
+```erlang
+{ok, Ref} = py:stream_start(my_module, long_generator, []),
+%% ... receive some values ...
+ok = py:stream_cancel(Ref).
+%% Stream will stop on next iteration
+```
+
+### Async Generators
+
+`stream_start` supports both sync and async generators:
+
+```erlang
+%% Async generator (e.g., streaming from an async API)
+ok = py:exec(<<"
+async def async_gen():
+    for i in range(5):
+        await asyncio.sleep(0.1)
+        yield i
+">>),
+{ok, Ref} = py:stream_start('__main__', async_gen, []).
+```
+
+## Batch Streaming (Collecting All Values)
+
+For simpler use cases where you want all values at once:
+
+### Generator Expressions
 
 ```erlang
 %% Stream squares of numbers 0-9
@@ -26,7 +98,7 @@ The simplest way to stream is with generator expressions:
 %% Evens = [0,2,4,6,8,10,12,14,16,18]
 ```
 
-## Iterator Objects
+### Iterator Objects
 
 Any Python iterator can be streamed:
 
@@ -40,7 +112,7 @@ Any Python iterator can be streamed:
 %% Items = [{<<"a">>, 1}, {<<"b">>, 2}]
 ```
 
-## Generator Functions
+### Generator Functions
 
 Define generator functions with `yield`:
 
@@ -69,46 +141,44 @@ For reliable inline generators, use lambda with walrus operator (Python 3.8+):
 %% Fib = [0,1,1,2,3,5,8,13,21,34]
 ```
 
-## Streaming Protocol
+## When to Use Each Mode
 
-Internally, streaming uses these messages:
+| Use Case | Recommended API |
+|----------|-----------------|
+| LLM token streaming | `stream_start/3,4` |
+| Real-time data feeds | `stream_start/3,4` |
+| Live progress updates | `stream_start/3,4` |
+| Batch processing | `stream/3,4` or `stream_eval/1,2` |
+| Small datasets | `stream/3,4` or `stream_eval/1,2` |
+| One-time collection | `stream/3,4` or `stream_eval/1,2` |
 
-```erlang
-{py_chunk, Ref, Value}   %% Each yielded value
-{py_end, Ref}            %% Generator exhausted
-{py_error, Ref, Error}   %% Exception occurred
-```
+## Memory Considerations
 
-You can build custom streaming consumers:
+- `stream_start`: Low memory - values processed as they arrive
+- `stream/stream_eval`: Values collected into a list - memory grows with output size
+- Generators are garbage collected after exhaustion
+
+## Use Cases
+
+### LLM Token Streaming
 
 ```erlang
-start_stream(Code) ->
-    Ref = make_ref(),
-    py_pool:request({stream_eval, Ref, self(), Code, #{}}),
-    process_stream(Ref).
+%% Stream tokens from an LLM
+{ok, Ref} = py:stream_start(llm_client, generate_tokens, [Prompt]),
+stream_to_client(Ref, WebSocket).
 
-process_stream(Ref) ->
+stream_to_client(Ref, WS) ->
     receive
-        {py_chunk, Ref, Value} ->
-            io:format("Got: ~p~n", [Value]),
-            process_stream(Ref);
-        {py_end, Ref} ->
-            io:format("Done~n");
-        {py_error, Ref, Error} ->
-            io:format("Error: ~p~n", [Error])
-    after 30000 ->
-        io:format("Timeout~n")
+        {py_stream, Ref, {data, Token}} ->
+            websocket:send(WS, Token),
+            stream_to_client(Ref, WS);
+        {py_stream, Ref, done} ->
+            websocket:send(WS, <<"[DONE]">>);
+        {py_stream, Ref, {error, _}} ->
+            websocket:send(WS, <<"[ERROR]">>)
     end.
 ```
 
-## Memory Considerations
-
-- Values are collected into a list by `stream_eval/1,2`
-- For large datasets, consider processing chunks as they arrive
-- Generators are garbage collected after exhaustion
-
-## Use Cases
-
 ### Data Processing Pipelines
 
 ```erlang
@@ -119,22 +189,6 @@ process_stream(Ref) ->
 Results = [process_line(L) || L <- Lines].
 ```
 
-### Infinite Sequences
-
-```erlang
-%% Define infinite counter
-ok = py:exec(<<"
-def counter():
-    n = 0
-    while True:
-        yield n
-        n += 1
-">>).
-
-%% Take first 100 (use your own take function)
-%% Can't use stream/3 directly for infinite - need custom handling
-```
-
 ### Batch Processing
 
 ```erlang
````
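For orientation, the two generator shapes that `py:stream_start/3,4` consumes are easiest to see in plain Python. A minimal sketch, assuming illustrative names (`token_gen` is not part of the library; `async_gen` mirrors the docs example above):

```python
import asyncio

def token_gen(prompt):
    """Sync generator: yields one 'token' per word (illustrative)."""
    for word in prompt.split():
        yield word

async def async_gen():
    """Async generator, as in the docs example."""
    for i in range(5):
        await asyncio.sleep(0.01)
        yield i

# Batch streaming (py:stream/3,4 / stream_eval) is equivalent to
# exhausting the generator into a list on the Python side:
tokens = list(token_gen("hello streaming world"))

# True streaming delivers each value as it is yielded; here we just
# collect an async generator's values to show it terminates.
async def collect(agen):
    return [v async for v in agen]

values = asyncio.run(collect(async_gen()))
```

Either shape works: `stream_start` only requires that the named callable returns an iterable or an async generator.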

src/py.erl

Lines changed: 131 additions & 0 deletions
```diff
@@ -56,6 +56,9 @@
     stream/4,
     stream_eval/1,
     stream_eval/2,
+    stream_start/3,
+    stream_start/4,
+    stream_cancel/1,
     version/0,
     memory_stats/0,
     gc/0,
@@ -468,6 +471,134 @@ stream_eval(Code, Locals) ->
     WrappedCode = <<"list(", CodeBin/binary, ")">>,
     py_context:eval(Ctx, WrappedCode, Locals).
 
+%%% ============================================================================
+%%% True Streaming API (Event-driven)
+%%% ============================================================================
+
+%% @doc Start a true streaming iteration from a Python generator.
+%%
+%% Unlike stream/3,4 which collects all values at once, this function
+%% returns immediately with a reference and sends values as events
+%% to the calling process as they are yielded.
+%%
+%% Events sent to the owner process:
+%%   - `{py_stream, Ref, {data, Value}}' - Each yielded value
+%%   - `{py_stream, Ref, done}' - Stream completed
+%%   - `{py_stream, Ref, {error, Reason}}' - Stream error
+%%
+%% Supports both sync generators and async generators (coroutines).
+%%
+%% Example:
+%% ```
+%% {ok, Ref} = py:stream_start(builtins, iter, [[1,2,3,4,5]]),
+%% receive_loop(Ref).
+%%
+%% receive_loop(Ref) ->
+%%     receive
+%%         {py_stream, Ref, {data, Value}} ->
+%%             io:format("Got: ~p~n", [Value]),
+%%             receive_loop(Ref);
+%%         {py_stream, Ref, done} ->
+%%             io:format("Complete~n");
+%%         {py_stream, Ref, {error, Reason}} ->
+%%             io:format("Error: ~p~n", [Reason])
+%%     after 30000 ->
+%%         timeout
+%%     end.
+%% '''
+-spec stream_start(py_module(), py_func(), py_args()) -> {ok, reference()}.
+stream_start(Module, Func, Args) ->
+    stream_start(Module, Func, Args, #{}).
+
+%% @doc Start a true streaming iteration with options.
+%%
+%% Options:
+%%   - `owner => pid()' - Process to receive events (default: self())
+%%
+%% @param Module Python module name
+%% @param Func Python function name
+%% @param Args Function arguments
+%% @param Opts Options map
+%% @returns {ok, Ref} where Ref is used to identify stream events
+-spec stream_start(py_module(), py_func(), py_args(), map()) -> {ok, reference()}.
+stream_start(Module, Func, Args, Opts) ->
+    Owner = maps:get(owner, Opts, self()),
+    Ref = make_ref(),
+    ModuleBin = ensure_binary(Module),
+    FuncBin = ensure_binary(Func),
+    RefHash = erlang:phash2(Ref),
+    %% Store owner and ref for Python to retrieve
+    %% Use binary keys because Python strings become binaries
+    py_state:store({<<"stream_owner">>, RefHash}, Owner),
+    py_state:store({<<"stream_ref">>, RefHash}, Ref),
+    py_state:store({<<"stream_args">>, RefHash}, Args),
+    %% Spawn an Erlang process to run the streaming iteration
+    spawn(fun() ->
+        stream_run_python(ModuleBin, FuncBin, RefHash)
+    end),
+    {ok, Ref}.
+
+%% @private Run the streaming via Python code
+stream_run_python(ModuleBin, FuncBin, RefHash) ->
+    RefHashBin = integer_to_binary(RefHash),
+    %% Build Python code that streams values using callbacks
+    Code = iolist_to_binary([
+        <<"import erlang\n">>,
+        <<"_rh = ">>, RefHashBin, <<"\n">>,
+        <<"_args = erlang.call('state_get', ('stream_args', _rh))\n">>,
+        <<"if _args is None:\n">>,
+        <<"    _args = []\n">>,
+        <<"try:\n">>,
+        <<"    _mod = __import__('">>, ModuleBin, <<"')\n">>,
+        <<"    _fn = getattr(_mod, '">>, FuncBin, <<"')\n">>,
+        <<"    _gen = _fn(*_args) if _args else _fn()\n">>,
+        <<"    for _val in _gen:\n">>,
+        <<"        if erlang.call('_py_stream_cancelled', _rh):\n">>,
+        <<"            erlang.call('_py_stream_send', _rh, 'error', 'cancelled')\n">>,
+        <<"            break\n">>,
+        <<"        erlang.call('_py_stream_send', _rh, 'data', _val)\n">>,
+        <<"    else:\n">>,
+        <<"        erlang.call('_py_stream_send', _rh, 'done', None)\n">>,
+        <<"except Exception as _e:\n">>,
+        <<"    erlang.call('_py_stream_send', _rh, 'error', str(_e))\n">>,
+        <<"finally:\n">>,
+        <<"    erlang.call('_py_stream_cleanup', _rh)\n">>
+    ]),
+    %% Execute the streaming code
+    case exec(Code) of
+        ok -> ok;
+        {error, Reason} ->
+            %% Try to notify owner of error
+            case py_state:fetch({<<"stream_owner">>, RefHash}) of
+                {ok, Owner} ->
+                    case py_state:fetch({<<"stream_ref">>, RefHash}) of
+                        {ok, Ref} ->
+                            Owner ! {py_stream, Ref, {error, Reason}},
+                            py_state:remove({<<"stream_owner">>, RefHash}),
+                            py_state:remove({<<"stream_ref">>, RefHash}),
+                            py_state:remove({<<"stream_args">>, RefHash});
+                        _ -> ok
+                    end;
+                _ -> ok
+            end
+    end.
+
+%% @doc Cancel an active stream.
+%%
+%% Sends a cancellation signal to stop the stream iteration.
+%% Any pending values may still be delivered before the stream stops.
+%%
+%% @param Ref The stream reference from stream_start/3,4
+%% @returns ok
+-spec stream_cancel(reference()) -> ok.
+stream_cancel(Ref) when is_reference(Ref) ->
+    %% Store cancellation flag that the streaming task checks
+    %% Use hash because we can't pass Erlang refs to Python callbacks easily
+    %% Use binary key because Python strings become binaries
+    RefHash = erlang:phash2(Ref),
+    py_state:store({<<"stream_cancelled_hash">>, RefHash}, true),
+    ok.
+
 %%% ============================================================================
 %%% Info
 %%% ============================================================================
```
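The Python code that `stream_run_python/3` generates is easiest to follow in isolation. Below is a hedged, self-contained sketch of that control flow with `erlang.call` replaced by a local stub (`state` and `events` stand in for `py_state` and the owner's mailbox) — an illustration of the for/else plus cancellation-flag pattern, not the library code itself:

```python
state = {}    # stands in for py_state's key/value store
events = []   # stands in for messages sent to the owner process

def call(name, *args):
    # Stub for the embedded erlang.call dispatch used in the diff.
    if name == '_py_stream_cancelled':
        return state.get(('stream_cancelled_hash', args[0]), False)
    if name == '_py_stream_send':
        events.append((args[1], args[2]))

def run_stream(gen, rh):
    try:
        for val in gen:
            if call('_py_stream_cancelled', rh):
                call('_py_stream_send', rh, 'error', 'cancelled')
                break
            call('_py_stream_send', rh, 'data', val)
        else:
            # for/else: runs only when the loop finishes without break
            call('_py_stream_send', rh, 'done', None)
    except Exception as e:
        call('_py_stream_send', rh, 'error', str(e))

# Normal completion: data events followed by a single 'done'.
run_stream(iter([1, 2, 3]), 42)
done_events = list(events)

# Cancellation: the flag is set mid-stream; the next loop iteration
# notices it, emits an error event, and breaks (skipping the else).
events.clear()

def cancelling_gen(rh):
    yield 'a'
    state[('stream_cancelled_hash', rh)] = True
    yield 'b'

run_stream(cancelling_gen(7), 7)
cancel_events = list(events)
```

Note that one value ('b') is pulled from the generator but never delivered — consistent with the doc comment that pending values may or may not be delivered before the stream stops.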

src/py_channel.erl

Lines changed: 2 additions & 2 deletions
```diff
@@ -26,8 +26,8 @@
 %%% %% Send messages to Python
 %%% ok = py_channel:send(Ch, {request, self(), <<"data">>}),
 %%%
-%%% %% Python receives via channel.receive()
-%%% %% Python sends back via erlang.channel_reply(pid, term)
+%%% %% Python: ch = Channel(ref); msg = ch.receive()
+%%% %% Python: reply(pid, term)
 %%%
 %%% %% Close when done
 %%% py_channel:close(Ch).
```
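The corrected comment names the Python-side API (`Channel(ref)` / `receive()` and `reply(pid, term)`). A minimal sketch of that request/reply shape, with the runtime classes stubbed locally since the real ones live inside the erlang_python embedding:

```python
import queue

class Channel:
    """Local stand-in for the runtime's Channel class (illustrative)."""
    _queues = {}

    def __init__(self, ref):
        self.q = Channel._queues.setdefault(ref, queue.Queue())

    def receive(self, timeout=None):
        return self.q.get(timeout=timeout)

outbox = []

def reply(pid, term):
    # In the real runtime this sends `term` back to the Erlang pid;
    # here we just record it.
    outbox.append((pid, term))

# Erlang side: py_channel:send(Ch, {request, self(), <<"data">>})
Channel._queues.setdefault('ref1', queue.Queue()).put(
    ('request', 'pid1', b'data'))

# Python side, as in the corrected comment:
ch = Channel('ref1')
tag, pid, payload = ch.receive()
reply(pid, payload.upper())
```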
