Skip to content

Commit 81bb9d4

Browse files
authored
Merge pull request #4 from Recouse/feature/responses
Responses improvements
2 parents 66f3cfd + 8355bdd commit 81bb9d4

5 files changed

Lines changed: 241 additions & 9 deletions

File tree

Lines changed: 118 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,118 @@
1+
//
2+
// Content.swift
3+
// OpenAI
4+
//
5+
// Created by Firdavs Khaydarov on 08/08/2025.
6+
//
7+
8+
/// A single piece of multimodal input sent to the model: text, an image, or a file.
///
/// Encodes transparently as the wrapped payload (single-value container), so the
/// wire format is entirely determined by the payload type, including its own
/// `type` discriminator field.
public enum Content: Encodable, Sendable {
    case inputText(TextInput)
    case inputImage(ImageInput)
    case inputFile(FileInput)

    // NOTE(review): not referenced inside this type; presumably reserved for
    // discriminator-based decoding — confirm before removing.
    enum TypeCodingKeys: String, CodingKey {
        case type
    }

    public func encode(to encoder: any Encoder) throws {
        var container = encoder.singleValueContainer()

        // Each case forwards its payload unchanged; the payload carries the
        // `type` field that identifies it on the wire.
        switch self {
        case .inputText(let payload): try container.encode(payload)
        case .inputImage(let payload): try container.encode(payload)
        case .inputFile(let payload): try container.encode(payload)
        }
    }
}
31+
32+
/// A text input to the model.
public struct TextInput: Codable, Sendable {
    /// The text content sent to the model.
    public let text: String

    /// Discriminator for this input item; always `.inputText`.
    public let type: ContentType

    enum CodingKeys: CodingKey {
        case text, type
    }

    /// Creates a text input; `type` is fixed to `.inputText`.
    public init(text: String) {
        self.text = text
        self.type = .inputText
    }
}
50+
51+
/// An image input to the model.
///
/// Provide either a previously uploaded file's ID (`fileId`) or an image URL
/// (`imageUrl`); both are optional in the type, mirroring the API schema.
public struct ImageInput: Codable, Sendable {
    /// Detail level of the image sent to the model: `.high`, `.low`, or `.auto`.
    /// Defaults to `.auto`.
    public let detail: ImageDetail

    /// Discriminator for this input item; always `.inputImage`.
    public let type: ContentType

    /// Identifier of an uploaded file to send as the image.
    public let fileId: String?

    /// A fully qualified URL, or a base64-encoded image in a data URL.
    public let imageUrl: String?

    /// Creates an image input; `type` is fixed to `.inputImage`.
    public init(detail: ImageDetail = .auto, fileId: String? = nil, imageUrl: String? = nil) {
        self.detail = detail
        self.type = .inputImage
        self.fileId = fileId
        self.imageUrl = imageUrl
    }
}
76+
77+
/// A file input to the model.
///
/// Supply exactly one source — inline data, an uploaded file ID, or a URL —
/// per the API schema; all are optional in the type.
public struct FileInput: Codable, Sendable {
    /// Discriminator for this input item; always `.inputFile`.
    public let type: ContentType

    /// Inline content of the file sent to the model.
    public let fileData: String?

    /// Identifier of an uploaded file to send to the model.
    public let fileId: String?

    /// URL of the file to send to the model.
    public let fileUrl: String?

    /// Name of the file sent to the model.
    public let filename: String?

    /// Creates a file input; `type` is fixed to `.inputFile`.
    public init(
        fileData: String? = nil,
        fileId: String? = nil,
        fileUrl: String? = nil,
        filename: String? = nil
    ) {
        self.type = .inputFile
        self.fileData = fileData
        self.fileId = fileId
        self.fileUrl = fileUrl
        self.filename = filename
    }
}
107+
108+
/// Wire-format discriminator for content items (the JSON `type` field).
public enum ContentType: String, Codable, Sendable {
    case inputText = "input_text"
    case outputText = "output_text"
    case inputFile = "input_file"
    case inputImage = "input_image"
}
114+
115+
116+
/// Detail level for image inputs; raw values match the API strings.
public enum ImageDetail: String, Codable, Sendable {
    case auto
    case low
    case high
}

Sources/OpenAI/Common/Prompt.swift

Lines changed: 27 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,27 @@
1+
//
2+
// Prompt.swift
3+
// OpenAI
4+
//
5+
// Created by Firdavs Khaydarov on 08/08/2025.
6+
//
7+
8+
// TODO: Implement file input https://platform.openai.com/docs/guides/text#reusable-prompts
9+
10+
/// Reference to a reusable prompt template and its substitution values.
public struct Prompt: Encodable, Sendable {
    /// Unique identifier of the prompt template to use.
    public let id: String

    /// Optional map of values substituted for variables in the prompt.
    ///
    /// The API also accepts non-string values (images, files); this type
    /// currently supports string substitutions only (see file-level TODO).
    public let variables: [String: String]?

    /// Optional version of the prompt template.
    public let version: String?

    public init(id: String, variables: [String: String]? = nil, version: String? = nil) {
        self.id = id
        self.variables = variables
        self.version = version
    }
}

Sources/OpenAI/Model.swift

Lines changed: 78 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -5,8 +5,86 @@
55
// Created by Firdavs Khaydarov on 01/08/2025.
66
//
77

8+
/// Model type to define OpenAI models.
///
/// For more information about models and their capabilities visit https://platform.openai.com/docs/models
public typealias Model = String

// MARK: - o-series

// NOTE(review): identifier style (o1_pro vs. camelCase) is kept as-is — these
// are public API names and renaming would break clients.
extension Model {
    /// o1 models think before they answer, producing a long internal chain of
    /// thought before responding to the user.
    ///
    /// * Context window: 200,000
    /// * Max output tokens: 100,000
    public static let o1: Model = "o1"

    /// o1-pro uses more compute to think harder and provide consistently better answers.
    ///
    /// Available in the Responses API only, to enable multi-turn model
    /// interactions before responding and other advanced API features.
    ///
    /// * Context window: 200,000
    /// * Max output tokens: 100,000
    public static let o1_pro: Model = "o1-pro"

    /// o3 is a well-rounded and powerful model across domains.
    ///
    /// Use it to think through multi-step problems that involve analysis across
    /// text, code, and images.
    ///
    /// * Context window: 200,000
    /// * Max output tokens: 100,000
    public static let o3: Model = "o3"

    /// o3-pro uses more compute to think harder and provide consistently better answers.
    ///
    /// Available in the Responses API only. Since o3-pro is designed to tackle
    /// tough problems, some requests may take several minutes to finish; to
    /// avoid timeouts, try using background mode.
    ///
    /// * Context window: 200,000
    /// * Max output tokens: 100,000
    public static let o3_pro: Model = "o3-pro"

    /// o3-mini is a small reasoning model, providing high intelligence at the
    /// same cost and latency targets as o1-mini.
    ///
    /// Supports key developer features like Structured Outputs, function
    /// calling, and the Batch API.
    ///
    /// * Context window: 200,000
    /// * Max output tokens: 100,000
    public static let o3_mini: Model = "o3-mini"

    /// o3-deep-research is the most advanced model for deep research, designed
    /// to tackle complex, multi-step research tasks.
    ///
    /// It can search and synthesize information from across the internet as
    /// well as from your own data, brought in through MCP connectors.
    ///
    /// * Context window: 200,000
    /// * Max output tokens: 100,000
    public static let o3_deep_research: Model = "o3-deep-research"

    /// o4-mini is the latest small o-series model.
    ///
    /// Optimized for fast, effective reasoning with exceptionally efficient
    /// performance in coding and visual tasks.
    ///
    /// * Context window: 200,000
    /// * Max output tokens: 100,000
    public static let o4_mini: Model = "o4-mini"

    /// o4-mini-deep-research is a faster, more affordable deep research model,
    /// ideal for complex, multi-step research tasks.
    ///
    /// It can search and synthesize information from across the internet as
    /// well as from your own data, brought in through MCP connectors.
    ///
    /// * Context window: 200,000
    /// * Max output tokens: 100,000
    public static let o4_mini_deep_research: Model = "o4-mini-deep-research"
}
87+
1088
// MARK: - GPT-5
1189

1290
extension Model {

Sources/OpenAI/Responses/ResponsesBody.swift

Lines changed: 14 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -8,13 +8,13 @@
88
import Foundation
99

1010
public extension Responses {
11-
struct Body: Codable {
11+
struct Body: Encodable {
1212
/// Whether to run the model response in the background.
1313
public var background: Bool?
1414
/// Specify additional output data to include in the model response.
1515
public var include: [AdditionalOutput]?
16-
///
17-
public var input: String?
16+
/// Text, image, or file inputs to the model, used to generate a response.
17+
public var input: [Input]?
1818
/// A system (or developer) message inserted into the model's context.
1919
///
2020
/// When using along with `previous_response_id`, the instructions from a previous response
@@ -45,8 +45,8 @@ public extension Responses {
4545
public var parallelToolCalls: Bool?
4646
/// The unique ID of the previous response to the model. Use this to create multi-turn conversations.
4747
public var previousResponseId: String?
48-
///
49-
public var prompt: String?
48+
/// Reference to a prompt template and its variables.
49+
public var prompt: Prompt?
5050
/// Used by OpenAI to cache responses for similar requests to optimize your cache hit rates.
5151
public var promptCacheKey: String?
5252
///
@@ -122,5 +122,14 @@ public extension Responses {
122122
/// an organization is enrolled in the zero data retention program).
123123
case reasoningEncryptedContent = "reasoning.encrypted_content"
124124
}
125+
126+
/// A single message in the `input` array of a Responses request.
public struct Input: Encodable, Sendable {
    /// The role of the message input. One of `user`, `assistant`, `system`, or `developer`.
    public let role: Role

    /// Text, image, or audio input to the model, used to generate a response. Can also contain
    /// previous assistant responses.
    public let content: [Content]

    /// Creates a message input.
    ///
    /// Fix: the compiler-synthesized memberwise initializer of a public struct
    /// is `internal`, so clients outside the module could not construct an
    /// `Input` even though the public `create(input:)`/`createStream(input:)`
    /// APIs require one. An explicit `public` initializer restores usability
    /// without changing the encoded representation.
    public init(role: Role, content: [Content]) {
        self.role = role
        self.content = content
    }
}
125134
}
126135
}

Sources/OpenAI/Responses/ResponsesWrapper.swift

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -12,15 +12,15 @@ public struct ResponsesWrapper {
1212
public func create(
1313
background: Bool? = nil,
1414
include: [Responses.Body.AdditionalOutput]? = nil,
15-
input: String? = nil,
15+
input: [Responses.Body.Input]? = nil,
1616
instructions: String? = nil,
1717
maxOutputTokens: Int? = nil,
1818
maxToolCalls: Int? = nil,
1919
metadata: [String : String]? = nil,
2020
model: Model? = nil,
2121
parallelToolCalls: Bool? = nil,
2222
previousResponseId: String? = nil,
23-
prompt: String? = nil,
23+
prompt: Prompt? = nil,
2424
promptCacheKey: String? = nil,
2525
reasoning: String? = nil,
2626
safetyIdentifier: String? = nil,
@@ -65,15 +65,15 @@ public struct ResponsesWrapper {
6565
public func createStream(
6666
background: Bool? = nil,
6767
include: [Responses.Body.AdditionalOutput]? = nil,
68-
input: String? = nil,
68+
input: [Responses.Body.Input]? = nil,
6969
instructions: String? = nil,
7070
maxOutputTokens: Int? = nil,
7171
maxToolCalls: Int? = nil,
7272
metadata: [String : String]? = nil,
7373
model: Model? = nil,
7474
parallelToolCalls: Bool? = nil,
7575
previousResponseId: String? = nil,
76-
prompt: String? = nil,
76+
prompt: Prompt? = nil,
7777
promptCacheKey: String? = nil,
7878
reasoning: String? = nil,
7979
safetyIdentifier: String? = nil,

0 commit comments

Comments
 (0)