Add OllamaEmbeddingService

intitni · intitni · commit 9f137eec048c · 2024-03-02T01:07:01.000+08:00
diff --git a/Pro b/Pro
@@ -1 +1 @@
-Subproject commit de3b6ef6303f29264d347a52dc5c38dfb4dfde6a
+Subproject commit 13a9fde5ea17fda4bd39927428bc7267add18244
diff --git a/Tool/Sources/OpenAIService/APIs/EmbeddingAPIDefinitions.swift b/Tool/Sources/OpenAIService/APIs/EmbeddingAPIDefinitions.swift
@@ -26,5 +26,3 @@ public struct EmbeddingResponse: Decodable {
     public var usage: Usage
 }
 
-
-
diff --git a/Tool/Sources/OpenAIService/APIs/OllamaEmbeddingService.swift b/Tool/Sources/OpenAIService/APIs/OllamaEmbeddingService.swift
@@ -0,0 +1,132 @@
+import AIModel
+import Foundation
+import Logger
+
+/// An `EmbeddingAPI` implementation that POSTs a prompt and a model name as JSON
+/// to `endpoint` and decodes a single embedding vector from the response.
+struct OllamaEmbeddingService: EmbeddingAPI {
+    /// JSON payload sent for one text.
+    struct EmbeddingRequestBody: Encodable {
+        var prompt: String
+        var model: String
+    }
+
+    /// JSON payload expected back on HTTP 200.
+    struct ResponseBody: Decodable {
+        var embedding: [Float]
+    }
+
+    let model: EmbeddingModel
+    let endpoint: String
+
+    /// Embeds a single string.
+    ///
+    /// The decoded response carries no token counts, so `prompt_tokens` is 0 and
+    /// `total_tokens` is the length of the returned vector.
+    ///
+    /// - Throws: `ChatGPTServiceError.endpointIncorrect` when `endpoint` is not a valid URL,
+    ///   `ChatGPTServiceError.responseInvalid` for a non-HTTP response, the decoded
+    ///   `CompletionAPIError` or `ChatGPTServiceError.otherError` for a non-200 status,
+    ///   and any encoding, transport or decoding error.
+    public func embed(text: String) async throws -> EmbeddingResponse {
+        let vector = try await requestEmbedding(for: text)
+        return .init(
+            data: [.init(embedding: vector, index: 0, object: model.info.modelName)],
+            model: model.info.modelName,
+            usage: .init(prompt_tokens: 0, total_tokens: vector.count)
+        )
+    }
+
+    /// Embeds several strings concurrently, one request per string.
+    ///
+    /// Entries in `data` follow the order of `texts`, and each entry's `index` is the
+    /// position of its text in `texts`. (Requests finish in arbitrary order, so the
+    /// results are re-sorted before being returned.)
+    ///
+    /// - Throws: `CancellationError` when the surrounding task is cancelled before every
+    ///   request could be scheduled, otherwise the first error thrown by any request.
+    public func embed(texts: [String]) async throws -> EmbeddingResponse {
+        try await withThrowingTaskGroup(of: (Int, [Float]).self) { group in
+            for (offset, text) in texts.enumerated() {
+                let scheduled = group.addTaskUnlessCancelled {
+                    let vector = try await self.requestEmbedding(for: text)
+                    return (offset, vector)
+                }
+                // Returning fewer embeddings than inputs would silently misalign
+                // callers, so surface the cancellation instead.
+                guard scheduled else { throw CancellationError() }
+            }
+
+            var vectors: [(Int, [Float])] = []
+            vectors.reserveCapacity(texts.count)
+            for try await entry in group {
+                vectors.append(entry)
+            }
+            // Children complete in arbitrary order; restore input order.
+            vectors.sort { $0.0 < $1.0 }
+
+            var result = EmbeddingResponse(
+                data: [],
+                model: model.info.modelName,
+                usage: .init(prompt_tokens: 0, total_tokens: 0)
+            )
+            for (offset, vector) in vectors {
+                result.data.append(.init(
+                    embedding: vector,
+                    index: offset,
+                    object: model.info.modelName
+                ))
+                result.usage.total_tokens += vector.count
+            }
+            return result
+        }
+    }
+
+    /// Token-array input is not implemented for this service.
+    ///
+    /// NOTE(review): this always throws `CancellationError`, which callers may treat
+    /// as a silent cancellation; consider a dedicated "unsupported" error.
+    public func embed(tokens: [[Int]]) async throws -> EmbeddingResponse {
+        throw CancellationError()
+    }
+
+    /// Sends one embedding request for `text` and returns the decoded vector.
+    private func requestEmbedding(for text: String) async throws -> [Float] {
+        guard let url = URL(string: endpoint) else { throw ChatGPTServiceError.endpointIncorrect }
+        var request = URLRequest(url: url)
+        request.httpMethod = "POST"
+        request.httpBody = try JSONEncoder().encode(EmbeddingRequestBody(
+            prompt: text,
+            model: model.info.modelName
+        ))
+        request.setValue("application/json", forHTTPHeaderField: "Content-Type")
+
+        let (result, response) = try await URLSession.shared.data(for: request)
+        guard let response = response as? HTTPURLResponse else {
+            throw ChatGPTServiceError.responseInvalid
+        }
+
+        guard response.statusCode == 200 else {
+            // Prefer a structured API error; fall back to the raw body text.
+            let error = try? JSONDecoder().decode(
+                OpenAIChatCompletionsService.CompletionAPIError.self,
+                from: result
+            )
+            throw error ?? ChatGPTServiceError
+                .otherError(String(data: result, encoding: .utf8) ?? "Unknown Error")
+        }
+
+        let embedding = try JSONDecoder().decode(ResponseBody.self, from: result).embedding
+        #if DEBUG
+        Logger.service.info("""
+        Embedding usage
+        - number of strings: 1
+        - prompt tokens: N/A
+        - total tokens: \(embedding.count)
+
+        """)
+        #endif
+        return embedding
+    }
+}
+
diff --git a/Tool/Sources/OpenAIService/EmbeddingService.swift b/Tool/Sources/OpenAIService/EmbeddingService.swift
@@ -21,8 +21,10 @@ public struct EmbeddingService {
                 endpoint: configuration.endpoint
             ).embed(text: text)
         case .ollama:
-            #warning("MUSTDO:")
-            fatalError()
+            embeddingResponse = try await OllamaEmbeddingService(
+                model: model,
+                endpoint: configuration.endpoint
+            ).embed(text: text)
         }
 
         #if DEBUG
@@ -50,8 +52,10 @@ public struct EmbeddingService {
                 endpoint: configuration.endpoint
             ).embed(texts: text)
         case .ollama:
-            #warning("MUSTDO:")
-            fatalError()
+            embeddingResponse = try await OllamaEmbeddingService(
+                model: model,
+                endpoint: configuration.endpoint
+            ).embed(texts: text)
         }
 
         #if DEBUG
@@ -79,8 +83,10 @@ public struct EmbeddingService {
                 endpoint: configuration.endpoint
             ).embed(tokens: tokens)
         case .ollama:
-            #warning("MUSTDO:")
-            fatalError()
+            embeddingResponse = try await OllamaEmbeddingService(
+                model: model,
+                endpoint: configuration.endpoint
+            ).embed(tokens: tokens)
         }
 
         #if DEBUG

Original file line number	Diff line number	Diff line change
`@@ -26,5 +26,3 @@ public struct EmbeddingResponse: Decodable {`
`26`	`26`	`public var usage: Usage`
`27`	`27`	`}`
`28`	`28`
`29`		`-`
`30`		`-`