Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Add embeddings #11

Merged
merged 1 commit into from
Apr 8, 2023
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
Original file line number Diff line number Diff line change
@@ -0,0 +1,19 @@
import Foundation

/// Top-level payload of an embeddings response.
///
/// `EmbeddingsRequest.execute` parses the API result into this type.
public struct EmbeddingResponseDataModel: Decodable {
    /// Kind of object the response describes.
    public let object: String

    /// Embedding entries carried by the response.
    public let data: [EmbeddingDataModel]

    /// Name of the model reported by the response.
    public let model: String

    /// Token usage reported by the response.
    public let usage: EmbeddingUsageDataModel
}

/// A single embedding entry inside an embeddings response.
public struct EmbeddingDataModel: Decodable {
    /// Kind of object this entry describes.
    public let object: String

    /// The embedding vector itself, decoded as single-precision floats.
    public let embedding: [Float]

    /// Index reported for this entry.
    public let index: Int
}

/// Token usage figures attached to an embeddings response.
///
/// There are no explicit coding keys: `EmbeddingsRequest` decodes with
/// `.convertFromSnakeCase`, so snake-case JSON keys map onto these camel-case names.
public struct EmbeddingUsageDataModel: Decodable {
    /// Number of tokens attributed to the prompt.
    public let promptTokens: Int

    /// Total number of tokens reported.
    public let totalTokens: Int
}
7 changes: 7 additions & 0 deletions Sources/SwiftOpenAI/OpenAI/DataModels/OpenAIModelType.swift
Original file line number Diff line number Diff line change
Expand Up @@ -4,6 +4,7 @@ public enum OpenAIModelType {
case gpt4(GPT4)
case gpt3_5(GPT3_5)
case edit(EditModel)
case embedding(EmbeddingModel)

var name: String {
switch self {
Expand All @@ -13,6 +14,8 @@ public enum OpenAIModelType {
return gpt3_5Model.rawValue
case .edit(let editModel):
return editModel.rawValue
case .embedding(let embeddingModel):
return embeddingModel.rawValue
}
}
}
Expand All @@ -36,3 +39,7 @@ public enum EditModel: String {
case text_davinci_edit_001 = "text-davinci-edit-001"
case code_davinci_edit_001 = "code-davinci-edit-001"
}

/// Embedding models selectable through `OpenAIModelType.embedding`.
///
/// The raw value is the model identifier string sent to the API.
public enum EmbeddingModel: String {
    /// Identifier `"text-embedding-ada-002"`.
    case text_embedding_ada_002 = "text-embedding-ada-002"
}
Original file line number Diff line number Diff line change
@@ -0,0 +1,24 @@
import Foundation

/// Endpoint description for the embeddings call: a `POST` to `embeddings`
/// carrying the model name and the input text as parameters.
struct CreateEmbeddingsEndpoint: Endpoint {
    private let model: OpenAIModelType
    private let input: String

    /// HTTP verb used by this endpoint.
    var method: HTTPMethod { .POST }

    // NOTE(review): kept as a mutable stored property; presumably `API.routeEndpoint`
    // rewrites it through its `inout` endpoint argument — confirm against `Endpoint`.
    var path: String = "embeddings"

    /// - Parameters:
    ///   - model: Model whose `name` is sent under the `"model"` key.
    ///   - input: Text sent under the `"input"` key.
    init(model: OpenAIModelType, input: String) {
        self.model = model
        self.input = input
    }

    /// Request parameters: always exactly the `"model"` and `"input"` entries.
    var parameters: [String: Any]? {
        let body: [String: Any] = [
            "model": model.name,
            "input": input
        ]
        return body
    }
}
Original file line number Diff line number Diff line change
Expand Up @@ -18,6 +18,8 @@ enum OpenAIEndpoints {
numberOfImages: Int,
size: ImageSize)

case embeddings(model: OpenAIModelType, input: String)

public var endpoint: Endpoint {
switch self {
case .listModels:
Expand All @@ -37,6 +39,9 @@ enum OpenAIEndpoints {
return CreateImageEndpoint(prompt: prompt,
numberOfImages: numberOfImages,
size: size)
case .embeddings(model: let model, input: let input):
return CreateEmbeddingsEndpoint(model: model,
input: input)
}
}
}
Original file line number Diff line number Diff line change
@@ -0,0 +1,40 @@
import Foundation

/// Contract for performing an embeddings request, so callers and tests can
/// depend on the protocol rather than on `EmbeddingsRequest` directly.
protocol EmbeddingsRequestProtocol {
    /// Performs the embeddings request.
    ///
    /// - Parameters:
    ///   - api: API helper used to build, send and parse the request.
    ///   - apiKey: Key placed in the request's authorization header.
    ///   - model: Model to request embeddings from.
    ///   - input: Text to embed.
    /// - Returns: The decoded response, or `nil` when parsing produces no value.
    /// - Throws: Whatever error parsing the result raises.
    func execute(
        api: API,
        apiKey: String,
        model: OpenAIModelType,
        input: String
    ) async throws -> EmbeddingResponseDataModel?
}

/// Default implementation of `EmbeddingsRequestProtocol`: builds the embeddings
/// endpoint, sends it through `API`, and decodes the result.
final public class EmbeddingsRequest: EmbeddingsRequestProtocol {
    /// Function shape of `execute`, so it can be stored and injected as a closure.
    public typealias Init = (
        _ api: API,
        _ apiKey: String,
        _ model: OpenAIModelType,
        _ input: String
    ) async throws -> EmbeddingResponseDataModel?

    public init() { }

    /// Sends an embeddings request and decodes the response.
    ///
    /// - Parameters:
    ///   - api: API helper used to route, build, send and parse the request.
    ///   - apiKey: Key sent as `Bearer <apiKey>` in the `Authorization` header.
    ///   - model: Model to request embeddings from.
    ///   - input: Text to embed.
    /// - Returns: The decoded response, or `nil` when `api.parse` yields no value.
    /// - Throws: Whatever `api.parse` throws.
    public func execute(
        api: API,
        apiKey: String,
        model: OpenAIModelType,
        input: String
    ) async throws -> EmbeddingResponseDataModel? {
        // Response keys are snake_case while the data models use camelCase.
        let decoder = JSONDecoder()
        decoder.keyDecodingStrategy = .convertFromSnakeCase

        var routedEndpoint = OpenAIEndpoints.embeddings(model: model, input: input).endpoint
        api.routeEndpoint(&routedEndpoint, environment: OpenAIEnvironmentV1())

        let headers = [
            "Content-Type": "application/json",
            "Authorization": "Bearer \(apiKey)"
        ]
        var request = api.buildURLRequest(endpoint: routedEndpoint)
        api.addHeaders(urlRequest: &request, headers: headers)

        let outcome = await api.execute(with: request)

        return try api.parse(
            outcome,
            type: EmbeddingResponseDataModel.self,
            jsonDecoder: decoder,
            errorType: OpenAIAPIError.self
        )
    }
}
12 changes: 11 additions & 1 deletion Sources/SwiftOpenAI/OpenAI/SwiftOpenAI.swift
Original file line number Diff line number Diff line change
Expand Up @@ -19,6 +19,9 @@ protocol OpenAIProtocol {
instruction: String) async throws -> EditsDataModel?

func createImages(prompt: String, numberOfImages: Int, size: ImageSize) async throws -> CreateImageDataModel?

func embeddings(model: OpenAIModelType,
input: String) async throws -> EmbeddingResponseDataModel?
}

public class SwiftOpenAI: OpenAIProtocol {
Expand All @@ -31,6 +34,7 @@ public class SwiftOpenAI: OpenAIProtocol {
private let createChatCompletionsStreamRequest: CreateChatCompletionsStreamRequest.Init
private let editsRequest: EditsRequest.Init
private let createImagesRequest: CreateImagesRequest.Init
private let embeddingRequest: EmbeddingsRequest.Init

public init(api: API = API(),
apiKey: String,
Expand All @@ -39,7 +43,8 @@ public class SwiftOpenAI: OpenAIProtocol {
createChatCompletionsRequest: @escaping CreateChatCompletionsRequest.Init = CreateChatCompletionsRequest().execute,
createChatCompletionsStreamRequest: @escaping CreateChatCompletionsStreamRequest.Init = CreateChatCompletionsStreamRequest().execute,
editsRequest: @escaping EditsRequest.Init = EditsRequest().execute,
createImagesRequest: @escaping CreateImagesRequest.Init = CreateImagesRequest().execute) {
createImagesRequest: @escaping CreateImagesRequest.Init = CreateImagesRequest().execute,
embeddingRequest: @escaping EmbeddingsRequest.Init = EmbeddingsRequest().execute) {
self.api = api
self.apiKey = apiKey
self.listModelsRequest = listModelsRequest
Expand All @@ -48,6 +53,7 @@ public class SwiftOpenAI: OpenAIProtocol {
self.createChatCompletionsStreamRequest = createChatCompletionsStreamRequest
self.editsRequest = editsRequest
self.createImagesRequest = createImagesRequest
self.embeddingRequest = embeddingRequest
}

public func listModels() async throws -> ModelListDataModel? {
Expand Down Expand Up @@ -79,4 +85,8 @@ public class SwiftOpenAI: OpenAIProtocol {
public func createImages(prompt: String, numberOfImages: Int, size: ImageSize) async throws -> CreateImageDataModel? {
try await createImagesRequest(api, apiKey, prompt, numberOfImages, size)
}

/// Requests embeddings for `input` using `model`, forwarding to the injected
/// embeddings request closure together with this client's `api` and `apiKey`.
///
/// - Returns: The decoded response, or `nil` when the request closure returns none.
/// - Throws: Any error thrown by the request closure.
public func embeddings(
    model: OpenAIModelType,
    input: String
) async throws -> EmbeddingResponseDataModel? {
    let response = try await embeddingRequest(api, apiKey, model, input)
    return response
}
}
Original file line number Diff line number Diff line change
@@ -0,0 +1,52 @@
import XCTest
@testable import SwiftOpenAI

/// Runs `EmbeddingsRequest.execute` against a stubbed HTTP response and checks
/// that the `embeddings` JSON fixture is decoded into the expected values.
final class EmbeddingAPIClientSpec: XCTestCase {
    private let model: OpenAIModelType = .embedding(.text_embedding_ada_002)
    private let apiKey = "1234567890"
    private let input = "What day of the wek is it?"

    // NOTE(review): the method name mentions "ChatCompletionsDataModel" although it
    // exercises embeddings; the name is kept so existing test filters keep matching.
    func testAsyncAPIRequest_ParsesValidJSONToChatCompletionsDataModel() async throws {
        let json = loadJSON(name: "embeddings")

        let api = API(requester: RequesterMock())
        let endpoint = OpenAIEndpoints.embeddings(model: model, input: input).endpoint
        let sut: EmbeddingsRequestProtocol = EmbeddingsRequest()

        try stubHTTP(endpoint: endpoint, json: json, statusCode: 200)

        // Let a thrown error propagate: XCTest then reports the actual error
        // instead of an uninformative bare `XCTFail()`.
        let response = try await sut.execute(api: api, apiKey: apiKey, model: model, input: input)

        // Unwrap once so a missing model or an empty `data` array fails the test
        // cleanly rather than trapping on an out-of-range subscript.
        let dataModel = try XCTUnwrap(response)
        let firstEntry = try XCTUnwrap(dataModel.data.first)

        XCTAssertEqual(dataModel.object, "list")
        XCTAssertEqual(dataModel.model, "text-embedding-ada-002")
        XCTAssertEqual(firstEntry.embedding.count, 1536)
        XCTAssertEqual(firstEntry.object, "embedding")
        // `prefix` never traps, even if the vector is shorter than expected.
        XCTAssertEqual(Array(firstEntry.embedding.prefix(2)), [0.0023064255, -0.009327292])
        XCTAssertEqual(dataModel.usage.promptTokens, 8)
        XCTAssertEqual(dataModel.usage.totalTokens, 8)
    }

    /// Installs a `URLProtocolMock` handler that answers every request with
    /// `json` and the given status code.
    ///
    /// - Throws: If the endpoint path is not a valid URL string or the HTTP
    ///   response cannot be constructed.
    private func stubHTTP(endpoint: Endpoint,
                          json: Data,
                          statusCode: Int) throws {
        let url = try XCTUnwrap(URL(string: endpoint.path))
        let response = try XCTUnwrap(HTTPURLResponse(url: url,
                                                     statusCode: statusCode,
                                                     httpVersion: nil,
                                                     headerFields: [:]))

        URLProtocolMock.completionHandler = { _ in
            return (response, json)
        }
    }
}
Original file line number Diff line number Diff line change
@@ -0,0 +1,21 @@
import XCTest
@testable import SwiftOpenAI

/// Checks the path, method and parameters produced by `OpenAIEndpoints.embeddings`.
final class EmbeddingEndpointSpec: XCTestCase {
    // NOTE(review): the name mentions "Completions" and "DavinciModel" although the
    // test covers the embeddings endpoint; kept so existing test filters keep matching.
    func testEndpointCompletions_WithDavinciModelInput_CreatesCorrectEndpointParameters() throws {
        let model: OpenAIModelType = .embedding(.text_embedding_ada_002)
        let input = "What day of the wek is it?"

        let sut = OpenAIEndpoints.embeddings(model: model, input: input).endpoint

        // XCTUnwrap turns a missing or mistyped parameter into a test failure
        // instead of a crash of the whole test process.
        let parameters = try XCTUnwrap(sut.parameters)
        let modelParameter = try XCTUnwrap(parameters["model"] as? String)
        let inputParameter = try XCTUnwrap(parameters["input"] as? String)

        XCTAssertEqual(sut.path, "embeddings")
        XCTAssertEqual(sut.method, .POST)
        XCTAssertEqual(parameters.count, 2)
        XCTAssertEqual(modelParameter, model.name)
        XCTAssertEqual(inputParameter, input)
    }
}

Original file line number Diff line number Diff line change
@@ -0,0 +1,25 @@
import XCTest
@testable import SwiftOpenAI

/// Checks that `API.parse` decodes the `embeddings` JSON fixture into
/// `EmbeddingResponseDataModel`.
final class EmbeddingParserSpec: XCTestCase {
    private let api = API()

    // NOTE(review): the name mentions "EditsDataModel" although the test parses the
    // embeddings model; kept so existing test filters keep matching.
    func testAsyncAPIRequest_ParsesValidJSONToEditsDataModel() async throws {
        let jsonData = loadJSON(name: "embeddings")

        let jsonDecoder = JSONDecoder()
        jsonDecoder.keyDecodingStrategy = .convertFromSnakeCase

        // Plain `try`: a parse error is reported as a test failure with the
        // underlying error, instead of `try!` aborting the test process.
        let parsed = try api.parse(.success(jsonData),
                                   type: EmbeddingResponseDataModel.self,
                                   jsonDecoder: jsonDecoder,
                                   errorType: OpenAIAPIError.self)

        // Unwrap once so a missing model or an empty `data` array fails the test
        // cleanly rather than trapping on an out-of-range subscript.
        let dataModel = try XCTUnwrap(parsed)
        let firstEntry = try XCTUnwrap(dataModel.data.first)

        XCTAssertEqual(dataModel.object, "list")
        XCTAssertEqual(dataModel.model, "text-embedding-ada-002")
        XCTAssertEqual(firstEntry.embedding.count, 1536)
        XCTAssertEqual(firstEntry.object, "embedding")
        // `prefix` never traps, even if the vector is shorter than expected.
        XCTAssertEqual(Array(firstEntry.embedding.prefix(2)), [0.0023064255, -0.009327292])
        XCTAssertEqual(dataModel.usage.promptTokens, 8)
        XCTAssertEqual(dataModel.usage.totalTokens, 8)
    }
}
Original file line number Diff line number Diff line change
@@ -0,0 +1,25 @@
import XCTest
@testable import SwiftOpenAI

/// Checks the headers attached to the URL request built for the embeddings endpoint.
final class EmbeddingRequestSpec: XCTestCase {
    private let api = API()

    func testRequest_CreatedWithCorrectHeaders() throws {
        let apiKey = "1234567890"
        let model: OpenAIModelType = .embedding(.text_embedding_ada_002)
        let input = "What day of the wek is it?"

        var routedEndpoint = OpenAIEndpoints.embeddings(model: model, input: input).endpoint
        api.routeEndpoint(&routedEndpoint, environment: OpenAIEnvironmentV1())

        var sut = api.buildURLRequest(endpoint: routedEndpoint)
        api.addHeaders(
            urlRequest: &sut,
            headers: [
                "Content-Type": "application/json",
                "Authorization": "Bearer \(apiKey)"
            ]
        )

        // Read the header dictionary once and assert against that snapshot.
        let headerFields = sut.allHTTPHeaderFields
        XCTAssertEqual(headerFields?.count, 2)
        XCTAssertEqual(headerFields?["Content-Type"], "application/json")
        XCTAssertEqual(headerFields?["Authorization"], "Bearer 1234567890")
    }
}
17 changes: 17 additions & 0 deletions Tests/SwiftOpenAITests/OpenAITests/Unit Tests/JSON/embeddings.json

Large diffs are not rendered by default.