luagent/test_luagent.lua at main · jeffmm/luagent · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959
960
--[[
  test_luagent.lua - Comprehensive tests for luagent library

  Run with: lua test_luagent.lua
--]]

local luagent = require("luagent")

-- Minimal test harness: file-level pass/fail tallies plus a runner
local tests_passed = 0
local tests_failed = 0
local current_test = ""

--- Run one named test case under pcall, print its outcome, and update the tallies.
---@param name string label printed next to the result
---@param func fun() test body; any raised error marks the case as failed
local function test(name, func)
	current_test = name
	io.write("Testing: " .. name .. " ... ")

	local succeeded, failure = pcall(func)
	if not succeeded then
		io.write("FAILED\n")
		io.write("  Error: " .. tostring(failure) .. "\n")
		tests_failed = tests_failed + 1
		return
	end

	io.write("PASSED\n")
	tests_passed = tests_passed + 1
end

--- Raise unless `actual` and `expected` compare equal with `==`.
---@param actual any value produced by the code under test
---@param expected any value it should equal
---@param msg? string prefix for the failure text (defaults to "Assertion failed")
local function assert_eq(actual, expected, msg)
	if actual == expected then
		return
	end
	local prefix = msg or "Assertion failed"
	error(prefix .. ": expected " .. tostring(expected) .. ", got " .. tostring(actual))
end

--- Raise unless `value` is truthy (anything other than nil or false).
---@param value any
---@param msg? string failure text used instead of the default
local function assert_true(value, msg)
	if value then
		return
	end
	error(msg or "Expected true, got false")
end

--- Raise unless `value` is falsy (nil or false).
---@param value any
---@param msg? string failure text used instead of the default
local function assert_false(value, msg)
	if not value then
		return
	end
	error(msg or "Expected false, got true")
end

--- Raise unless `value` is exactly nil (false is rejected too).
--- The offending value is always appended to the failure text, including
--- when a custom `msg` is given, so failures show what was actually returned.
---@param value any
---@param msg? string prefix for the failure text (defaults to "Expected nil")
local function assert_nil(value, msg)
	if value ~= nil then
		error((msg or "Expected nil") .. ", got " .. tostring(value))
	end
end

--- Raise when `value` is nil; false counts as a present value.
---@param value any
---@param msg? string failure text used instead of the default
local function assert_not_nil(value, msg)
	if value ~= nil then
		return
	end
	error(msg or "Expected non-nil value")
end

--- Raise unless `type(value)` equals `expected_type`.
---@param value any
---@param expected_type string a name as returned by `type()`, e.g. "string"
---@param msg? string prefix for the failure text (defaults to "Type mismatch")
local function assert_type(value, expected_type, msg)
	local found = type(value)
	if found == expected_type then
		return
	end
	error((msg or "Type mismatch") .. ": expected " .. expected_type .. ", got " .. found)
end

--- Raise unless `haystack` contains `needle`.
--- For a string haystack the needle is searched as a plain substring (no
--- pattern matching). For a table haystack the needle must equal (`==`) one
--- of the table's values. Any other haystack type, including nil, is
--- reported as a failure instead of passing silently.
---@param haystack string|table
---@param needle any
---@param msg? string failure text used instead of the default
local function assert_contains(haystack, needle, msg)
	local kind = type(haystack)
	if kind == "string" then
		-- Fourth argument `true` turns off pattern magic, so "." matches only a dot
		if not haystack:find(needle, 1, true) then
			error(msg or "String does not contain expected substring")
		end
	elseif kind == "table" then
		for _, v in pairs(haystack) do
			if v == needle then
				return
			end
		end
		error(msg or "Table does not contain expected value")
	else
		-- Without this branch a nil haystack would satisfy the assertion vacuously
		error((msg or "Cannot check containment") .. ": expected string or table haystack, got " .. kind)
	end
end

--- Raise unless calling `func` raises an error.
--- When `expected_msg` is given, the raised error (converted with `tostring`)
--- must also contain it as a plain substring.
---@param func fun()
---@param expected_msg? string
local function assert_error(func, expected_msg)
	local succeeded, raised = pcall(func)
	if succeeded then
		error("Expected function to throw error")
	end
	if not expected_msg then
		return
	end

	local text = tostring(raised)
	if not string.find(text, expected_msg, 1, true) then
		error("Error message mismatch: expected '" .. expected_msg .. "' in '" .. text .. "'")
	end
end

-- Tests

-- Test 1: an object that satisfies its properties and required keys validates
test("Schema validation: valid object", function()
	local person_schema = {
		type = "object",
		required = { "name" },
		properties = {
			name = { type = "string" },
			age = { type = "number" },
		},
	}

	local ok, err = luagent.validate_schema({ name = "Alice", age = 30 }, person_schema)

	assert_true(ok, "Validation should succeed")
	assert_nil(err, "Error should be nil")
end)

-- Test 2: leaving out a key listed in `required` is rejected and the key is named
test("Schema validation: missing required field", function()
	local person_schema = {
		type = "object",
		required = { "name" },
		properties = {
			age = { type = "number" },
			name = { type = "string" },
		},
	}

	-- Only the optional field is supplied
	local ok, err = luagent.validate_schema({ age = 30 }, person_schema)

	assert_false(ok, "Validation should fail")
	assert_not_nil(err, "Error should not be nil")
	assert_contains(err, "name", "Error should mention missing field")
end)

-- Test 3: Schema validation - a string where a number is declared is rejected
test("Schema validation: wrong type", function()
	local schema = {
		type = "object",
		properties = {
			age = { type = "number" },
		},
	}

	local value = { age = "thirty" }
	local ok, err = luagent.validate_schema(value, schema)

	assert_false(ok, "Validation should fail")
	-- Require an error message before searching it, so a missing message fails the test
	assert_not_nil(err, "Error should not be nil")
	assert_contains(err, "number", "Error should mention expected type")
end)

-- Test 4: an object schema nested under a property validates a nested value
test("Schema validation: nested objects", function()
	local user_schema = {
		type = "object",
		required = { "name" },
		properties = {
			name = { type = "string" },
		},
	}
	local envelope_schema = {
		type = "object",
		properties = { user = user_schema },
	}

	local ok, err = luagent.validate_schema({ user = { name = "Bob" } }, envelope_schema)

	assert_true(ok, "Validation should succeed")
	assert_nil(err, "Error should be nil")
end)

-- Test 5: an array whose elements all match the `items` schema validates
test("Schema validation: arrays", function()
	local numbers_schema = { type = "array", items = { type = "number" } }

	local ok, err = luagent.validate_schema({ 1, 2, 3, 4, 5 }, numbers_schema)

	assert_true(ok, "Validation should succeed")
	assert_nil(err, "Error should be nil")
end)

-- Test 6: Schema validation - an array holding a wrongly typed element is rejected
test("Schema validation: invalid array items", function()
	local schema = {
		type = "array",
		items = { type = "number" },
	}

	local value = { 1, 2, "three", 4 }
	local ok, err = luagent.validate_schema(value, schema)

	assert_false(ok, "Validation should fail")
	-- Require an error message before searching it, so a missing message fails the test
	assert_not_nil(err, "Error should not be nil")
	assert_contains(err, "Array item", "Error should mention array item")
end)

-- Test 7: model and system_prompt given to Agent.new are readable on the agent
test("Agent creation: basic configuration", function()
	local config = { model = "gpt-4", system_prompt = "You are helpful" }
	local agent = luagent.Agent.new(config)

	assert_not_nil(agent, "Agent should be created")
	assert_eq(agent.model, "gpt-4", "Model should be set")
	assert_eq(agent.system_prompt, "You are helpful", "System prompt should be set")
end)

-- Test 8: Agent.new without a model must raise an error mentioning the model
test("Agent creation: missing model throws error", function()
	local function create_without_model()
		luagent.Agent.new({ system_prompt = "Test" })
	end

	assert_error(create_without_model, "model is required")
end)

-- Test 9: a tool passed to Agent.new is reachable through agent._tool_map
test("Agent creation: with tools", function()
	local get_time_tool = {
		description = "Get current time",
		parameters = { type = "object", properties = {} },
		func = function(_ctx, _args)
			return { time = "12:00" }
		end,
	}

	local agent = luagent.Agent.new({
		model = "gpt-4",
		tools = { get_time = get_time_tool },
	})

	local registered = agent._tool_map.get_time
	assert_not_nil(registered, "Tool should be registered")
	assert_eq(registered.description, "Get current time")
end)

-- Test 10: an output_schema given to Agent.new is kept on the agent
test("Agent creation: with output schema", function()
	local answer_schema = {
		type = "object",
		properties = { answer = { type = "string" } },
	}

	local agent = luagent.Agent.new({ model = "gpt-4", output_schema = answer_schema })

	local stored = agent.output_schema
	assert_not_nil(stored, "Output schema should be set")
	assert_eq(stored.type, "object")
end)

-- Test 11: a function-valued system_prompt is evaluated against the run context
test("Agent: dynamic system prompt", function()
	local function role_prompt(ctx)
		return "You are a " .. ctx.deps.role .. " assistant"
	end

	local agent = luagent.Agent.new({ model = "gpt-4", system_prompt = role_prompt })
	local run_ctx = luagent.RunContext.new({ role = "helpful" })

	assert_eq(agent:_build_system_prompt(run_ctx), "You are a helpful assistant")
end)

-- Test 12: _build_tools wraps each tool as { type = "function", ["function"] = {...} }
test("Agent: building tools for OpenAI API", function()
	local add_tool = {
		description = "Add two numbers",
		parameters = {
			type = "object",
			properties = {
				a = { type = "number" },
				b = { type = "number" },
			},
		},
		func = function(_ctx, args)
			return { result = args.a + args.b }
		end,
	}
	local agent = luagent.Agent.new({ model = "gpt-4", tools = { add = add_tool } })

	local built = agent:_build_tools()
	assert_eq(#built, 1, "Should have one tool")

	local entry = built[1]
	assert_eq(entry.type, "function")

	-- "function" is a reserved word, hence the bracket lookup
	local spec = entry["function"]
	assert_eq(spec.name, "add")
	assert_eq(spec.description, "Add two numbers")
end)

-- Test 13: RunContext.new exposes the given deps and messages as fields
test("RunContext: creation and access", function()
	local ctx = luagent.RunContext.new(
		{ api_key = "test-key", user_id = 123 },
		{ { role = "user", content = "Hello" } }
	)

	assert_not_nil(ctx, "Context should be created")

	local held = ctx.deps
	assert_eq(held.api_key, "test-key")
	assert_eq(held.user_id, 123)
	assert_eq(#ctx.messages, 1)
end)

-- Test 14: _execute_tool_call decodes the JSON arguments, runs the tool, and
-- returns the tool's result as a JSON string
test("Agent: tool execution", function()
	local greet_tool = {
		description = "Greet a user",
		parameters = {
			type = "object",
			properties = { name = { type = "string" } },
		},
		func = function(_ctx, args)
			return { greeting = "Hello, " .. args.name .. "!" }
		end,
	}
	local agent = luagent.Agent.new({ model = "gpt-4", tools = { greet = greet_tool } })

	local run_ctx = luagent.RunContext.new({})
	local request = {
		id = "call_123",
		["function"] = { name = "greet", arguments = '{"name":"Alice"}' },
	}

	local raw = agent:_execute_tool_call(request, run_ctx)
	local reply = luagent._json.decode(raw)

	assert_eq(reply.greeting, "Hello, Alice!")
end)

-- Test 15: the tool function receives the run context and can read its deps
test("Agent: tool execution with context dependencies", function()
	local user_info_tool = {
		description = "Get user info",
		parameters = { type = "object", properties = {} },
		func = function(ctx, _args)
			return { user = ctx.deps.current_user }
		end,
	}
	local agent = luagent.Agent.new({
		model = "gpt-4",
		tools = { get_user_info = user_info_tool },
	})

	local run_ctx = luagent.RunContext.new({ current_user = "Alice" })
	local request = {
		id = "call_456",
		["function"] = { name = "get_user_info", arguments = "{}" },
	}

	local raw = agent:_execute_tool_call(request, run_ctx)
	local reply = luagent._json.decode(raw)

	assert_eq(reply.user, "Alice")
end)

-- Test 16: an error raised inside a tool comes back as an `error` field in the
-- JSON result rather than propagating to the caller
test("Agent: tool execution error handling", function()
	local failing_tool = {
		description = "This tool fails",
		parameters = { type = "object", properties = {} },
		func = function(_ctx, _args)
			error("Something went wrong")
		end,
	}
	local agent = luagent.Agent.new({
		model = "gpt-4",
		tools = { failing_tool = failing_tool },
	})

	local run_ctx = luagent.RunContext.new({})
	local request = {
		id = "call_789",
		["function"] = { name = "failing_tool", arguments = "{}" },
	}

	local raw = agent:_execute_tool_call(request, run_ctx)
	local reply = luagent._json.decode(raw)

	assert_not_nil(reply.error, "Should return error")
	assert_contains(reply.error, "Tool execution failed")
end)

-- Test 17: calling a tool name the agent does not know yields a "not found" error
test("Agent: unknown tool handling", function()
	local agent = luagent.Agent.new({ model = "gpt-4" })

	local run_ctx = luagent.RunContext.new({})
	local request = {
		id = "call_999",
		["function"] = { name = "nonexistent_tool", arguments = "{}" },
	}

	local raw = agent:_execute_tool_call(request, run_ctx)
	local reply = luagent._json.decode(raw)

	assert_not_nil(reply.error, "Should return error")
	assert_contains(reply.error, "not found")
end)

-- Test 18: luagent._json.encode turns a mixed table into a string
test("JSON: encode and decode", function()
	local sample = {
		name = "Alice",
		age = 30,
		active = true,
		tags = { "user", "premium" },
	}

	assert_type(luagent._json.encode(sample), "string")

	-- Decoding is deliberately not exercised here: it depends on a proper JSON
	-- library being installed, and the minimal fallback decoder may not handle
	-- complex objects.
end)

-- Test 19: each basic schema type accepts a representative value
test("Schema validation: primitive types", function()
	-- { value, schema type } pairs, checked in order
	local cases = {
		{ "hello", "string" },
		{ 42, "number" },
		{ true, "boolean" },
		{ {}, "object" },
		{ {}, "array" },
	}

	for _, case in ipairs(cases) do
		-- validate_schema's second result is forwarded as the failure message
		assert_true(luagent.validate_schema(case[1], { type = case[2] }))
	end
end)

-- Test 20: an agent built with only a model gets the default base_url and no tools
test("Agent: configuration defaults", function()
	local agent = luagent.Agent.new({ model = "gpt-4o-mini" })

	assert_eq(agent.base_url, "https://api.openai.com/v1")
	assert_type(agent.tools, "table")

	-- next() returns nil for a table with no entries
	local first_key = next(agent.tools)
	assert_eq(first_key, nil, "Tools should be empty by default")
end)

-- Test 21: when detect_provider returns a config, its four fields are strings
test("Provider detection: returns config structure", function()
	local detected = luagent.detect_provider()

	-- With no API key in the environment the result is nil, which is also valid
	if not detected then
		return
	end

	-- Presence checks first
	assert_not_nil(detected.base_url, "Config should have base_url")
	assert_not_nil(detected.model, "Config should have model")
	assert_not_nil(detected.api_key, "Config should have api_key")
	assert_not_nil(detected.provider, "Config should have provider name")

	-- Then type checks
	assert_type(detected.base_url, "string")
	assert_type(detected.model, "string")
	assert_type(detected.api_key, "string")
	assert_type(detected.provider, "string")
end)

-- Test 22: a detected provider config can be fed straight into Agent.new
test("Provider detection: integration with Agent.new", function()
	local detected = luagent.detect_provider()

	-- Nothing to check when no provider was detected
	if not detected then
		return
	end

	local agent = luagent.Agent.new({
		model = detected.model,
		base_url = detected.base_url,
		api_key = detected.api_key,
	})

	assert_not_nil(agent)
	assert_eq(agent.model, detected.model)
	assert_eq(agent.base_url, detected.base_url)
	assert_eq(agent.api_key, detected.api_key)
end)

-- Test 23: placeholder for direct SSE parser coverage
test("SSE parsing: basic chunks", function()
	-- Sample stream kept as a fixture for a future parser-level test; unused for now
	local sample_stream = [[data: {"id":"chatcmpl-123","object":"chat.completion.chunk","choices":[{"delta":{"content":"Hello"},"index":0}]}
data: {"id":"chatcmpl-123","object":"chat.completion.chunk","choices":[{"delta":{"content":" World"},"index":0}]}
data: [DONE]
]]

	-- The internal parse_sse function is not reachable from here; it would have
	-- to be exposed, or exercised indirectly through the streaming API.
	-- Until then this case always passes.
	assert_true(true)
end)

-- Test 24: streamed content deltas reach on_chunk and are accumulated in result.data
test("Streaming: basic content streaming", function()
	-- Canned SSE stream: two content deltas, a stop marker, then [DONE]
	local canned_stream = [[data: {"id":"chatcmpl-123","object":"chat.completion.chunk","created":1234567890,"model":"gpt-4","choices":[{"index":0,"delta":{"role":"assistant","content":"Hello"},"finish_reason":null}]}
data: {"id":"chatcmpl-123","object":"chat.completion.chunk","created":1234567890,"model":"gpt-4","choices":[{"index":0,"delta":{"content":" World"},"finish_reason":null}]}
data: {"id":"chatcmpl-123","object":"chat.completion.chunk","created":1234567890,"model":"gpt-4","choices":[{"index":0,"delta":{},"finish_reason":"stop"}]}
data: [DONE]
]]

	local mock_client = {
		post = function(_url, _headers, _body, on_chunk)
			-- Deliver the whole stream as one chunk when a sink is supplied
			if on_chunk then
				on_chunk(canned_stream)
			end
			return 200, canned_stream
		end,
	}

	local agent = luagent.Agent.new({ model = "gpt-4", http_client = mock_client })

	local received = {}
	local result = agent:run("Test", {
		stream = true,
		on_chunk = function(chunk_type, data)
			received[#received + 1] = { type = chunk_type, data = data }
		end,
	})

	assert_true(#received >= 2, "Should receive at least 2 content chunks")

	-- At least one of the callbacks must have been a content chunk
	local saw_content = false
	for i = 1, #received do
		if received[i].type == "content" then
			saw_content = true
			break
		end
	end
	assert_true(saw_content, "Should have content chunks")

	-- The final result carries the accumulated text
	assert_not_nil(result.data, "Result should have data")
	assert_contains(result.data, "Hello", "Result should contain streamed content")
end)

-- Test 25: a streamed tool call produces start/delta/end chunks, and the run
-- continues to a final answer on the follow-up request
test("Streaming: tool call streaming", function()
	-- First reply: a get_weather call whose JSON arguments arrive in two fragments
	local tool_call_stream = [[data: {"id":"chatcmpl-456","object":"chat.completion.chunk","created":1234567890,"model":"gpt-4","choices":[{"index":0,"delta":{"role":"assistant","content":null,"tool_calls":[{"index":0,"id":"call_abc123","type":"function","function":{"name":"get_weather","arguments":""}}]},"finish_reason":null}]}
data: {"id":"chatcmpl-456","object":"chat.completion.chunk","created":1234567890,"model":"gpt-4","choices":[{"index":0,"delta":{"tool_calls":[{"index":0,"function":{"arguments":"{\"city\""}}]},"finish_reason":null}]}
data: {"id":"chatcmpl-456","object":"chat.completion.chunk","created":1234567890,"model":"gpt-4","choices":[{"index":0,"delta":{"tool_calls":[{"index":0,"function":{"arguments":":\"Paris\"}"}}]},"finish_reason":null}]}
data: {"id":"chatcmpl-456","object":"chat.completion.chunk","created":1234567890,"model":"gpt-4","choices":[{"index":0,"delta":{},"finish_reason":"tool_calls"}]}
data: [DONE]
]]

	-- Every later reply: plain streamed text
	local final_stream = [[data: {"id":"chatcmpl-789","object":"chat.completion.chunk","created":1234567890,"model":"gpt-4","choices":[{"index":0,"delta":{"role":"assistant","content":"The"},"finish_reason":null}]}
data: {"id":"chatcmpl-789","object":"chat.completion.chunk","created":1234567890,"model":"gpt-4","choices":[{"index":0,"delta":{"content":" weather is 72"},"finish_reason":null}]}
data: {"id":"chatcmpl-789","object":"chat.completion.chunk","created":1234567890,"model":"gpt-4","choices":[{"index":0,"delta":{},"finish_reason":"stop"}]}
data: [DONE]
]]

	-- Push a canned stream through the sink (if any) and return it as the body
	local function respond(payload, on_chunk)
		if on_chunk then
			on_chunk(payload)
		end
		return 200, payload
	end

	local call_count = 0
	local weather_tool = {
		description = "Get weather",
		parameters = {
			type = "object",
			properties = { city = { type = "string" } },
		},
		func = function(_ctx, args)
			return { temperature = 72, city = args.city }
		end,
	}

	local agent = luagent.Agent.new({
		model = "gpt-4",
		tools = { get_weather = weather_tool },
		http_client = {
			post = function(_url, _headers, _body, on_chunk)
				call_count = call_count + 1
				if call_count == 1 then
					return respond(tool_call_stream, on_chunk)
				end
				return respond(final_stream, on_chunk)
			end,
		},
	})

	local received = {}
	local result = agent:run("What's the weather?", {
		stream = true,
		on_chunk = function(chunk_type, data)
			received[#received + 1] = { type = chunk_type, data = data }
		end,
	})

	-- Record which chunk types were observed
	local seen = {}
	for _, chunk in ipairs(received) do
		if chunk.type ~= nil then
			seen[chunk.type] = true
		end
	end

	assert_true(seen.tool_call_start, "Should have tool_call_start chunk")
	assert_true(seen.tool_call_delta, "Should have tool_call_delta chunk")
	assert_true(seen.tool_call_end, "Should have tool_call_end chunk")

	assert_not_nil(result.data, "Should have final result")
end)

-- Test 26: giving an output_schema registers an output tool whose parameters
-- are that same schema table
test("Tool-based output: output tool auto-registered", function()
	local answer_schema = {
		type = "object",
		properties = { answer = { type = "string" } },
	}
	local agent = luagent.Agent.new({ model = "gpt-4", output_schema = answer_schema })

	local tool_name = agent._output_tool_name
	assert_not_nil(tool_name, "Output tool name should be set")

	local registered = agent._tool_map[tool_name]
	assert_not_nil(registered, "Output tool should be registered")

	-- Table comparison is by reference: the tool must hold the agent's own schema
	assert_eq(registered.parameters, agent.output_schema, "Output tool parameters should match schema")
end)

-- Test 27: without stream options, run() consumes an ordinary JSON completion
test("Streaming: backwards compatibility with stream disabled", function()
	local mock_client = {
		post = function(_url, _headers, _body)
			-- Plain, non-streamed chat completion body
			return 200, '{"id":"chatcmpl-789","choices":[{"message":{"role":"assistant","content":"Hello"}}]}'
		end,
	}
	local agent = luagent.Agent.new({ model = "gpt-4", http_client = mock_client })

	-- No options table: the default, non-streaming path
	local result = agent:run("Test")

	assert_not_nil(result.data, "Should have result data")
	assert_eq(result.data, "Hello", "Should have non-streamed content")
end)

-- Test 28: Tool-based output - the built system prompt keeps the base prompt
-- and adds an instruction to call the output tool
test("Tool-based output: system prompt includes output tool instruction", function()
	local agent = luagent.Agent.new({
		model = "gpt-4",
		system_prompt = "You are helpful",
		output_schema = {
			type = "object",
			properties = {
				answer = { type = "string" },
			},
		},
	})

	local ctx = luagent.RunContext.new({})
	local prompt = agent:_build_system_prompt(ctx)

	-- Make sure a prompt string was actually produced before searching it, so a
	-- missing prompt fails the test instead of slipping through the substring checks
	assert_type(prompt, "string", "System prompt should be a string")
	assert_contains(prompt, "You are helpful", "Should include base system prompt")
	assert_contains(prompt, "final_answer", "Should mention output tool name")
	assert_contains(prompt, "MUST call", "Should instruct to call the tool")
end)

-- Test 29: a final_answer tool call in a plain completion becomes result.data
test("Tool-based output: non-streaming structured output", function()
	local answer_schema = {
		type = "object",
		required = { "answer" },
		properties = {
			answer = { type = "string" },
			confidence = { type = "number" },
		},
	}

	local agent = luagent.Agent.new({
		model = "gpt-4",
		output_schema = answer_schema,
		http_client = {
			post = function(_url, _headers, _body)
				-- Canned completion whose only content is the output tool call
				return 200, [[{
					"id": "chatcmpl-123",
					"choices": [{
						"message": {
							"role": "assistant",
							"content": null,
							"tool_calls": [{
								"id": "call_abc",
								"type": "function",
								"function": {
									"name": "final_answer",
									"arguments": "{\"answer\":\"42\",\"confidence\":0.95}"
								}
							}]
						}
					}]
				}]]
			end,
		},
	})

	local outcome = agent:run("What is the answer?")

	assert_not_nil(outcome.data, "Should have structured data")
	assert_eq(outcome.data.answer, "42", "Should have correct answer")
	assert_eq(outcome.data.confidence, 0.95, "Should have correct confidence")
end)

-- Test 30: a streamed final_answer tool call emits tool-call chunks and its
-- arguments end up as result.data
test("Tool-based output: streaming structured output", function()
	-- Canned SSE stream: a final_answer call whose arguments arrive in two fragments
	local canned_stream = [[data: {"id":"chatcmpl-456","object":"chat.completion.chunk","created":1234567890,"model":"gpt-4","choices":[{"index":0,"delta":{"role":"assistant","content":null,"tool_calls":[{"index":0,"id":"call_xyz","type":"function","function":{"name":"final_answer","arguments":""}}]},"finish_reason":null}]}
data: {"id":"chatcmpl-456","object":"chat.completion.chunk","created":1234567890,"model":"gpt-4","choices":[{"index":0,"delta":{"tool_calls":[{"index":0,"function":{"arguments":"{\"result\""}}]},"finish_reason":null}]}
data: {"id":"chatcmpl-456","object":"chat.completion.chunk","created":1234567890,"model":"gpt-4","choices":[{"index":0,"delta":{"tool_calls":[{"index":0,"function":{"arguments":":\"Success\"}"}}]},"finish_reason":null}]}
data: {"id":"chatcmpl-456","object":"chat.completion.chunk","created":1234567890,"model":"gpt-4","choices":[{"index":0,"delta":{},"finish_reason":"tool_calls"}]}
data: [DONE]
]]

	local mock_client = {
		post = function(_url, _headers, _body, on_chunk)
			if on_chunk then
				on_chunk(canned_stream)
			end
			return 200, canned_stream
		end,
	}

	local agent = luagent.Agent.new({
		model = "gpt-4",
		output_schema = {
			type = "object",
			properties = { result = { type = "string" } },
		},
		http_client = mock_client,
	})

	local received = {}
	local outcome = agent:run("Test query", {
		stream = true,
		on_chunk = function(chunk_type, data)
			received[#received + 1] = { type = chunk_type, data = data }
		end,
	})

	-- Any one of the three tool-call chunk kinds is enough
	local saw_tool_chunk = false
	for i = 1, #received do
		local kind = received[i].type
		if kind == "tool_call_start" or kind == "tool_call_delta" or kind == "tool_call_end" then
			saw_tool_chunk = true
			break
		end
	end
	assert_true(saw_tool_chunk, "Should receive tool call chunks during streaming")

	assert_not_nil(outcome.data, "Should have structured data")
	assert_eq(outcome.data.result, "Success", "Should have correct structured result")
end)

-- Test 31: final_answer arguments that violate the output schema make run() raise
test("Tool-based output: schema validation failure", function()
	local count_schema = {
		type = "object",
		required = { "count" },
		properties = {
			count = { type = "number" },
		},
	}

	local agent = luagent.Agent.new({
		model = "gpt-4",
		output_schema = count_schema,
		http_client = {
			post = function(_url, _headers, _body)
				-- The arguments omit the required `count` field
				return 200, [[{
					"id": "chatcmpl-789",
					"choices": [{
						"message": {
							"role": "assistant",
							"content": null,
							"tool_calls": [{
								"id": "call_def",
								"type": "function",
								"function": {
									"name": "final_answer",
									"arguments": "{\"wrong_field\":\"value\"}"
								}
							}]
						}
					}]
				}]]
			end,
		},
	})

	local function run_agent()
		agent:run("Test")
	end

	assert_error(run_agent, "validation failed")
end)

-- Test 32: a regular tool can run first, with the structured answer delivered
-- by the output tool on the following request
test("Tool-based output: can use regular tools before final answer", function()
	-- Set by the weather tool; the mock uses it to decide which reply to send
	local get_weather_called = false

	local weather_tool = {
		description = "Get weather",
		parameters = {
			type = "object",
			properties = { city = { type = "string" } },
		},
		func = function(_ctx, args)
			get_weather_called = true
			return { temp = 75, city = args.city }
		end,
	}

	local agent = luagent.Agent.new({
		model = "gpt-4",
		output_schema = {
			type = "object",
			properties = { summary = { type = "string" } },
		},
		tools = { get_weather = weather_tool },
		http_client = {
			post = function(_url, _headers, _body)
				if get_weather_called then
					-- Tool already ran: answer through the output tool
					return 200, [[{
						"id": "chatcmpl-2",
						"choices": [{
							"message": {
								"role": "assistant",
								"content": null,
								"tool_calls": [{
									"id": "call_2",
									"type": "function",
									"function": {
										"name": "final_answer",
										"arguments": "{\"summary\":\"Weather is 75 in NYC\"}"
									}
								}]
							}
						}]
					}]]
				else
					-- Tool has not run yet: ask for the regular tool
					return 200, [[{
						"id": "chatcmpl-1",
						"choices": [{
							"message": {
								"role": "assistant",
								"content": null,
								"tool_calls": [{
									"id": "call_1",
									"type": "function",
									"function": {
										"name": "get_weather",
										"arguments": "{\"city\":\"NYC\"}"
									}
								}]
							}
						}]
					}]]
				end
			end,
		},
	})

	local outcome = agent:run("What's the weather?")

	assert_true(get_weather_called, "Regular tool should be called")
	assert_not_nil(outcome.data, "Should have structured output")
	assert_eq(outcome.data.summary, "Weather is 75 in NYC", "Should have final structured answer")
end)

-- Report the tallies, then exit with status 1 if any test failed and 0 otherwise
local divider = string.rep("=", 50)

print("\n" .. divider)
print("Test Results:")
print("  Passed: " .. tests_passed)
print("  Failed: " .. tests_failed)
print("  Total:  " .. (tests_passed + tests_failed))
print(divider)

if tests_failed <= 0 then
	print("\nAll tests passed!")
	os.exit(0)
end
os.exit(1)