Skip to content

Commit 061514a

Browse files
authored
Add support for OpenAI embeddings (#106)
1 parent 6c1f567 commit 061514a

7 files changed

+287
-2
lines changed

README.md

+61-1
Original file line numberDiff line numberDiff line change
@@ -817,18 +817,78 @@ This example is taken from OpenAI's [function calling guide](https://platform.op
817817
}
818818
```
819819

820+
### How to get embeddings using OpenAI
821+
822+
```swift
823+
import AIProxy
824+
825+
/* Uncomment for BYOK use cases */
826+
// let openAIService = AIProxy.openAIDirectService(
827+
// unprotectedAPIKey: "your-openai-key"
828+
// )
829+
830+
/* Uncomment for all other production use cases */
831+
// let openAIService = AIProxy.openAIService(
832+
// partialKey: "partial-key-from-your-developer-dashboard",
833+
// serviceURL: "service-url-from-your-developer-dashboard"
834+
// )
835+
836+
let requestBody = OpenAIEmbeddingRequestBody(
837+
input: .text("hello world"),
838+
model: "text-embedding-3-small"
839+
)
840+
841+
// Or, for multiple embeddings from strings:
842+
843+
/*
844+
let requestBody = OpenAIEmbeddingRequestBody(
845+
input: .textArray([
846+
"hello world",
847+
"hola mundo"
848+
]),
849+
model: "text-embedding-3-small"
850+
)
851+
*/
852+
853+
// Or, for multiple embeddings from tokens:
854+
855+
/*
856+
let requestBody = OpenAIEmbeddingRequestBody(
857+
input: .intArray([0,1,2]),
858+
model: "text-embedding-3-small"
859+
)
860+
*/
861+
862+
do {
863+
let response = try await openAIService.embeddingRequest(body: requestBody)
864+
print(
865+
"""
866+
The response contains \(response.embeddings.count) embeddings.
867+
868+
The first vector starts with \(response.embeddings.first?.vector.prefix(10) ?? [])
869+
"""
870+
)
871+
} catch AIProxyError.unsuccessfulRequest(let statusCode, let responseBody) {
872+
print("Received \(statusCode) status code with response body: \(responseBody)")
873+
} catch {
874+
print("Could not perform embedding request to OpenAI: \(error.localizedDescription)")
875+
}
876+
```
877+
878+
820879
### How to use OpenAI through an Azure deployment
821880

822881
You can use all of the OpenAI snippets above with one change. Initialize the OpenAI service with:
823882

883+
```swift
824884
import AIProxy
825885

826886
let openAIService = AIProxy.openAIService(
827887
partialKey: "partial-key-from-your-developer-dashboard",
828888
serviceURL: "service-url-from-your-developer-dashboard",
829889
requestFormat: .azureDeployment(apiVersion: "2024-06-01")
830890
)
831-
891+
```
832892

833893
***
834894

Sources/AIProxy/AIProxy.swift

+1-1
Original file line numberDiff line numberDiff line change
@@ -13,7 +13,7 @@ let aiproxyLogger = Logger(
1313
public struct AIProxy {
1414

1515
/// The current sdk version
16-
public static let sdkVersion = "0.70.0"
16+
public static let sdkVersion = "0.71.0"
1717

1818
/// - Parameters:
1919
/// - partialKey: Your partial key is displayed in the AIProxy dashboard when you submit your provider's key.

Sources/AIProxy/OpenAI/OpenAIDirectService.swift

+23
Original file line numberDiff line numberDiff line change
@@ -187,6 +187,29 @@ open class OpenAIDirectService: OpenAIService, DirectService {
187187
return try await self.makeRequestAndDeserializeResponse(request)
188188
}
189189

190+
/// Get a vector representation of a given input that can be easily consumed by machine
/// learning models and algorithms. Related guide:
/// https://platform.openai.com/docs/guides/embeddings
/// - Parameters:
///   - body: The request body to send to aiproxy and openai. See this reference:
///     https://platform.openai.com/docs/api-reference/embeddings/create
/// - Returns: An embedding response. See this reference:
///     https://platform.openai.com/docs/api-reference/embeddings/object
public func embeddingRequest(
    body: OpenAIEmbeddingRequestBody
) async throws -> OpenAIEmbeddingResponseBody {
    // BYOK path: the request goes straight to OpenAI, so the caller's own
    // API key is attached as a bearer token here.
    let urlRequest = try AIProxyURLRequest.createDirect(
        baseURL: "https://api.openai.com",
        path: self.resolvedPath("embeddings"),
        body: try body.serialize(),
        verb: .post,
        contentType: "application/json",
        additionalHeaders: [
            "Authorization": "Bearer \(self.unprotectedAPIKey)"
        ]
    )
    return try await self.makeRequestAndDeserializeResponse(urlRequest)
}
212+
190213
private func resolvedPath(_ common: String) -> String {
191214
assert(common[common.startIndex] != "/")
192215
switch self.requestFormat {
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,112 @@
1+
//
//  OpenAIEmbeddingRequestBody.swift
//  AIProxy
//
//  Created by Lou Zell on 2/16/25.
//

/// Request body for OpenAI's embedding endpoint.
///
/// From OpenAI's docs:
///
/// > Embeddings are a numerical representation of text that can be used to measure the
/// relatedness between two pieces of text. Embeddings are useful for search, clustering,
/// recommendations, anomaly detection, and classification tasks. You can read more about our
/// latest embedding models in the announcement blog post."
///
/// References:
/// - https://openai.com/blog/new-embedding-models-and-api-updates
/// - https://platform.openai.com/docs/api-reference/embeddings/create
public struct OpenAIEmbeddingRequestBody: Encodable {

    // MARK: Required fields

    /// Input text to embed, encoded as a string or array of tokens. To embed multiple inputs
    /// in a single request, pass an array of strings or an array of token arrays. The input
    /// must not exceed the max input tokens for the model (8192 tokens for
    /// text-embedding-ada-002), cannot be an empty string, and any array must be 2048
    /// dimensions or less. Some models may also impose a limit on the total number of tokens
    /// summed across inputs.
    public let input: EmbeddingInput

    /// ID of the model to use.
    /// See the model list here: https://platform.openai.com/docs/models#embeddings
    ///
    /// text-embedding-3-large
    /// Most capable embedding model for both english and non-english tasks.
    /// Output dimension: 3,072
    ///
    /// text-embedding-3-small
    /// Increased performance over 2nd generation ada embedding model.
    /// Output dimension: 1,536
    ///
    /// text-embedding-ada-002
    /// Most capable 2nd generation embedding model, replacing 16 first generation models.
    /// Output dimension: 1,536
    public let model: String

    // MARK: Optional fields

    /// The format to return the embeddings in.
    /// When omitted, OpenAI defaults to `float`.
    public let encodingFormat: EncodingFormat?

    /// The number of dimensions the resulting output embeddings should have. Only supported
    /// in `text-embedding-3` and later models.
    public let dimensions: Int?

    /// A unique identifier representing your end-user, which can help OpenAI to monitor and
    /// detect abuse.
    public let user: String?

    private enum CodingKeys: String, CodingKey {
        case input
        case model

        case encodingFormat = "encoding_format"
        case dimensions
        case user
    }

    /// Creates a request body for OpenAI's embedding endpoint.
    /// Only `input` and `model` are required; the remaining fields fall back to
    /// OpenAI's server-side defaults when nil.
    public init(
        input: OpenAIEmbeddingRequestBody.EmbeddingInput,
        model: String,
        encodingFormat: OpenAIEmbeddingRequestBody.EncodingFormat? = nil,
        dimensions: Int? = nil,
        user: String? = nil
    ) {
        self.input = input
        self.model = model
        self.encodingFormat = encodingFormat
        self.dimensions = dimensions
        self.user = user
    }

    /// The accepted shapes of the `input` field: a single string, a batch of strings, or a
    /// single array of pre-computed tokens.
    public enum EmbeddingInput: Encodable {
        case text(String)
        case textArray([String])
        case intArray([Int])

        public func encode(to encoder: any Encoder) throws {
            // Every shape serializes as a bare JSON value (string or array),
            // not as a keyed object.
            var container = encoder.singleValueContainer()
            switch self {
            case .text(let string):
                try container.encode(string)
            case .textArray(let strings):
                try container.encode(strings)
            case .intArray(let tokens):
                try container.encode(tokens)
            }
        }
    }

    /// Wire format of the returned vectors.
    /// OpenAI defaults to `float` when this is not supplied.
    public enum EncodingFormat: String, Encodable {
        case float
        case base64
    }
}
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,56 @@
1+
//
//  OpenAIEmbeddingResponseBody.swift
//  AIProxy
//
//  Created by Lou Zell on 2/16/25.
//

/// Response body for OpenAI's embedding endpoint.
/// https://platform.openai.com/docs/api-reference/embeddings/object
public struct OpenAIEmbeddingResponseBody: Decodable {
    /// One embedding per input in the request, decoded from the wire field `data`.
    public let embeddings: [Embedding]

    /// The model that produced the embeddings.
    public let model: String?

    /// Token accounting for the request.
    public let usage: Usage?

    private enum CodingKeys: CodingKey {
        case data
        case model
        case usage
    }

    public init(from decoder: any Decoder) throws {
        let values = try decoder.container(keyedBy: CodingKeys.self)
        // `data` is required; `model` and `usage` are tolerated as absent.
        self.model = try values.decodeIfPresent(String.self, forKey: .model)
        self.usage = try values.decodeIfPresent(Usage.self, forKey: .usage)
        self.embeddings = try values.decode([Embedding].self, forKey: .data)
    }
}

extension OpenAIEmbeddingResponseBody {
    /// A single embedding vector and its position in the request batch.
    public struct Embedding: Decodable {
        /// The embedding vector itself, decoded from the wire field `embedding`.
        // NOTE(review): decoded as [Double], which assumes the `float` encoding format.
        // A `base64` response would fail to decode here — confirm against the request side.
        public let vector: [Double]

        /// The index of this embedding in the request's list of inputs.
        public let index: Int?

        private enum CodingKeys: CodingKey {
            case embedding
            case index
        }

        public init(from decoder: any Decoder) throws {
            let values = try decoder.container(keyedBy: CodingKeys.self)
            self.index = try values.decodeIfPresent(Int.self, forKey: .index)
            self.vector = try values.decode([Double].self, forKey: .embedding)
        }
    }
}

extension OpenAIEmbeddingResponseBody {
    /// Token usage reported by OpenAI for the embedding request.
    public struct Usage: Decodable {
        public let promptTokens: Int
        public let totalTokens: Int

        private enum CodingKeys: String, CodingKey {
            case promptTokens = "prompt_tokens"
            case totalTokens = "total_tokens"
        }
    }
}

Sources/AIProxy/OpenAI/OpenAIProxiedService.swift

+23
Original file line numberDiff line numberDiff line change
@@ -188,6 +188,29 @@ open class OpenAIProxiedService: OpenAIService, ProxiedService {
188188
return try await self.makeRequestAndDeserializeResponse(request)
189189
}
190190

191+
/// Get a vector representation of a given input that can be easily consumed by machine
/// learning models and algorithms. Related guide:
/// https://platform.openai.com/docs/guides/embeddings
/// - Parameters:
///   - body: The request body to send to aiproxy and openai. See this reference:
///     https://platform.openai.com/docs/api-reference/embeddings/create
/// - Returns: An embedding response. See this reference:
///     https://platform.openai.com/docs/api-reference/embeddings/object
public func embeddingRequest(
    body: OpenAIEmbeddingRequestBody
) async throws -> OpenAIEmbeddingResponseBody {
    // Proxied path: the request is routed through aiproxy, which holds the
    // provider key; no API key is attached on-device.
    let proxiedRequest = try await AIProxyURLRequest.create(
        partialKey: self.partialKey,
        serviceURL: self.serviceURL ?? legacyURL,
        clientID: self.clientID,
        proxyPath: self.resolvedPath("embeddings"),
        body: try body.serialize(),
        verb: .post,
        contentType: "application/json"
    )
    return try await self.makeRequestAndDeserializeResponse(proxiedRequest)
}
212+
213+
191214
private func resolvedPath(_ common: String) -> String {
192215
assert(common[common.startIndex] != "/")
193216
switch self.requestFormat {

Sources/AIProxy/OpenAI/OpenAIService.swift

+11
Original file line numberDiff line numberDiff line change
@@ -78,6 +78,17 @@ public protocol OpenAIService {
7878
func moderationRequest(
7979
body: OpenAIModerationRequestBody
8080
) async throws -> OpenAIModerationResponseBody
81+
82+
/// Get a vector representation of a given input that can be easily consumed by machine learning models and algorithms. Related guide:
/// https://platform.openai.com/docs/guides/embeddings
/// - Parameters:
///   - body: The request body to send to aiproxy and openai. See this reference:
///     https://platform.openai.com/docs/api-reference/embeddings/create
/// - Returns: An embedding response. See this reference:
///     https://platform.openai.com/docs/api-reference/embeddings/object
func embeddingRequest(
    body: OpenAIEmbeddingRequestBody
) async throws -> OpenAIEmbeddingResponseBody
8192
}
8293

8394
extension OpenAIService {

0 commit comments

Comments
 (0)