Merge branch 'feature/fix-deep-seek' into hotfix/0.35.4

intitni · intitni · commit 266e7ca9bdf7 · 2025-01-06T15:22:41.000+08:00
diff --git a/Core/Sources/HostApp/AccountSettings/ChatModelManagement/ChatModelEdit.swift b/Core/Sources/HostApp/AccountSettings/ChatModelManagement/ChatModelEdit.swift
@@ -32,6 +32,7 @@ struct ChatModelEdit {
         var openAIOrganizationID: String = ""
         var openAIProjectID: String = ""
         var customHeaders: [ChatModel.Info.CustomHeaderInfo.HeaderField] = []
+        var openAICompatibleSupportsMultipartMessageContent = true
     }
 
     enum Action: Equatable, BindableAction {
@@ -88,20 +89,40 @@ struct ChatModelEdit {
                 let model = ChatModel(state: state)
                 return .run { send in
                     do {
-                        let service = LegacyChatGPTService(
-                            configuration: UserPreferenceChatGPTConfiguration()
-                                .overriding {
-                                    $0.model = model
-                                }
-                        )
-                        let reply = try await service
-                            .sendAndWait(content: "Respond with \"Test succeeded\"")
-                        await send(.testSucceeded(reply ?? "No Message"))
-                        let stream = try await service
-                            .send(content: "Respond with \"Stream response is working\"")
+                        let configuration = UserPreferenceChatGPTConfiguration().overriding {
+                            $0.model = model
+                        }
+                        let service = ChatGPTService(configuration: configuration)
+                        let reply = try await service.send(TemplateChatGPTMemory(
+                            memoryTemplate: .init(messages: [
+                                .init(chatMessage: .init(
+                                    role: .user,
+                                    content: "Respond with \"Test succeeded\""
+                                )),
+                            ]),
+                            configuration: configuration,
+                            functionProvider: NoChatGPTFunctionProvider()
+                        )).asText()
+
+                        await send(.testSucceeded(reply))
+                        let stream = service.send(TemplateChatGPTMemory(
+                            memoryTemplate: .init(messages: [
+                                .init(chatMessage: .init(
+                                    role: .user,
+                                    content: "Respond with \"Stream response is working\""
+                                )),
+                            ]),
+                            configuration: configuration,
+                            functionProvider: NoChatGPTFunctionProvider()
+                        ))
                         var streamReply = ""
                         for try await chunk in stream {
-                            streamReply += chunk
+                            switch chunk {
+                            case let .partialText(text):
+                                streamReply += text
+                            default:
+                                continue
+                            }
                         }
                         await send(.testSucceeded(streamReply))
                     } catch {
@@ -206,7 +227,11 @@ extension ChatModel {
                 ),
                 ollamaInfo: .init(keepAlive: state.ollamaKeepAlive),
                 googleGenerativeAIInfo: .init(apiVersion: state.apiVersion),
-                openAICompatibleInfo: .init(enforceMessageOrder: state.enforceMessageOrder),
+                openAICompatibleInfo: .init(
+                    enforceMessageOrder: state.enforceMessageOrder,
+                    supportsMultipartMessageContent: state
+                        .openAICompatibleSupportsMultipartMessageContent
+                ),
                 customHeaderInfo: .init(headers: state.customHeaders)
             )
         )
@@ -230,7 +255,9 @@ extension ChatModel {
             enforceMessageOrder: info.openAICompatibleInfo.enforceMessageOrder,
             openAIOrganizationID: info.openAIInfo.organizationID,
             openAIProjectID: info.openAIInfo.projectID,
-            customHeaders: info.customHeaderInfo.headers
+            customHeaders: info.customHeaderInfo.headers,
+            openAICompatibleSupportsMultipartMessageContent: info.openAICompatibleInfo
+                .supportsMultipartMessageContent
         )
     }
 }
diff --git a/Core/Sources/HostApp/AccountSettings/ChatModelManagement/ChatModelEditView.swift b/Core/Sources/HostApp/AccountSettings/ChatModelManagement/ChatModelEditView.swift
@@ -322,6 +322,10 @@ struct ChatModelEditView: View {
                     Text("Enforce message order to be user/assistant alternated")
                 }
                 
+                Toggle(isOn: $store.openAICompatibleSupportsMultipartMessageContent) {
+                    Text("Support multi-part message content")
+                }
+                
                 Button("Custom Headers") {
                     isEditingCustomHeader.toggle()
                 }
diff --git a/Tool/Sources/AIModel/ChatModel.swift b/Tool/Sources/AIModel/ChatModel.swift
@@ -46,16 +46,22 @@ public struct ChatModel: Codable, Equatable, Identifiable {
                 self.projectID = projectID
             }
         }
-        
+
         public struct OpenAICompatibleInfo: Codable, Equatable {
             @FallbackDecoding<EmptyBool>
             public var enforceMessageOrder: Bool
+            @FallbackDecoding<EmptyTrue>
+            public var supportsMultipartMessageContent: Bool
 
-            public init(enforceMessageOrder: Bool = false) {
+            public init(
+                enforceMessageOrder: Bool = false,
+                supportsMultipartMessageContent: Bool = true
+            ) {
                 self.enforceMessageOrder = enforceMessageOrder
+                self.supportsMultipartMessageContent = supportsMultipartMessageContent
             }
         }
-        
+
         public struct GoogleGenerativeAIInfo: Codable, Equatable {
             @FallbackDecoding<EmptyString>
             public var apiVersion: String
@@ -64,21 +70,21 @@ public struct ChatModel: Codable, Equatable, Identifiable {
                 self.apiVersion = apiVersion
             }
         }
-        
+
         public struct CustomHeaderInfo: Codable, Equatable {
             public struct HeaderField: Codable, Equatable {
                 public var key: String
                 public var value: String
-                
+
                 public init(key: String, value: String) {
                     self.key = key
                     self.value = value
                 }
             }
-            
+
             @FallbackDecoding<EmptyArray>
             public var headers: [HeaderField]
-            
+
             public init(headers: [HeaderField] = []) {
                 self.headers = headers
             }
@@ -203,3 +209,7 @@ public struct EmptyChatModelOpenAICompatibleInfo: FallbackValueProvider {
 public struct EmptyChatModelCustomHeaderInfo: FallbackValueProvider {
     public static var defaultValue: ChatModel.Info.CustomHeaderInfo { .init() }
 }
+
+public struct EmptyTrue: FallbackValueProvider {
+    public static var defaultValue: Bool { true }
+}
diff --git a/Tool/Sources/OpenAIService/APIs/OpenAIChatCompletionsService.swift b/Tool/Sources/OpenAIService/APIs/OpenAIChatCompletionsService.swift
@@ -299,6 +299,8 @@ actor OpenAIChatCompletionsService: ChatCompletionsStreamAPI, ChatCompletionsAPI
             requestBody,
             endpoint: endpoint,
             enforceMessageOrder: model.info.openAICompatibleInfo.enforceMessageOrder,
+            supportsMultipartMessageContent: model.info.openAICompatibleInfo
+                .supportsMultipartMessageContent,
             canUseTool: model.info.supportsFunctionCalling,
             supportsImage: model.info.supportsImage,
             supportsAudio: model.info.supportsAudio
@@ -651,25 +653,43 @@ extension OpenAIChatCompletionsService.RequestBody {
         _ message: inout Message,
         content: String,
         images: [ChatCompletionsRequestBody.Message.Image],
-        audios: [ChatCompletionsRequestBody.Message.Audio]
+        audios: [ChatCompletionsRequestBody.Message.Audio],
+        supportsMultipartMessageContent: Bool
     ) {
-        switch message.role {
-        case .system, .assistant, .user:
-            let newParts = Self.convertContentPart(
-                content: content,
-                images: images,
-                audios: audios
-            )
-            if case let .contentParts(existingParts) = message.content {
-                message.content = .contentParts(existingParts + newParts)
-            } else {
-                message.content = .contentParts(newParts)
+        if supportsMultipartMessageContent {
+            switch message.role {
+            case .system, .assistant, .user:
+                let newParts = Self.convertContentPart(
+                    content: content,
+                    images: images,
+                    audios: audios
+                )
+                if case let .contentParts(existingParts) = message.content {
+                    message.content = .contentParts(existingParts + newParts)
+                } else {
+                    message.content = .contentParts(newParts)
+                }
+            case .tool, .function:
+                if case let .text(existingText) = message.content {
+                    message.content = .text(existingText + "\n\n" + content)
+                } else {
+                    message.content = .text(content)
+                }
             }
-        case .tool, .function:
-            if case let .text(existingText) = message.content {
-                message.content = .text(existingText + "\n\n" + content)
-            } else {
-                message.content = .text(content)
+        } else {
+            switch message.role {
+            case .system, .assistant, .user:
+                if case let .text(existingText) = message.content {
+                    message.content = .text(existingText + "\n\n" + content)
+                } else {
+                    message.content = .text(content)
+                }
+            case .tool, .function:
+                if case let .text(existingText) = message.content {
+                    message.content = .text(existingText + "\n\n" + content)
+                } else {
+                    message.content = .text(content)
+                }
             }
         }
     }
@@ -678,6 +698,7 @@ extension OpenAIChatCompletionsService.RequestBody {
         _ body: ChatCompletionsRequestBody,
         endpoint: URL,
         enforceMessageOrder: Bool,
+        supportsMultipartMessageContent: Bool,
         canUseTool: Bool,
         supportsImage: Bool,
         supportsAudio: Bool
@@ -702,7 +723,7 @@ extension OpenAIChatCompletionsService.RequestBody {
         model = body.model
 
         // Special case for Claude through OpenRouter
-        
+
         if endpoint.absoluteString.contains("openrouter.ai"), model.hasPrefix("anthropic/") {
             var body = body
             body.model = model.replacingOccurrences(of: "anthropic/", with: "")
@@ -731,7 +752,7 @@ extension OpenAIChatCompletionsService.RequestBody {
             }
             return
         }
-        
+
         // Enforce message order
 
         if enforceMessageOrder {
@@ -752,16 +773,22 @@ extension OpenAIChatCompletionsService.RequestBody {
                             &nonSystemMessages[nonSystemMessages.endIndex - 1],
                             content: message.content,
                             images: supportsImage ? message.images : [],
-                            audios: supportsAudio ? message.audios : []
+                            audios: supportsAudio ? message.audios : [],
+                            supportsMultipartMessageContent: supportsMultipartMessageContent
                         )
                     } else {
                         nonSystemMessages.append(.init(
                             role: .tool,
-                            content: .contentParts(Self.convertContentPart(
-                                content: message.content,
-                                images: supportsImage ? message.images : [],
-                                audios: supportsAudio ? message.audios : []
-                            )),
+                            content: {
+                                if supportsMultipartMessageContent {
+                                    return .contentParts(Self.convertContentPart(
+                                        content: message.content,
+                                        images: supportsImage ? message.images : [],
+                                        audios: supportsAudio ? message.audios : []
+                                    ))
+                                }
+                                return .text(message.content)
+                            }(),
                             tool_calls: message.toolCalls?.map { tool in
                                 MessageToolCall(
                                     id: tool.id,
@@ -780,16 +807,22 @@ extension OpenAIChatCompletionsService.RequestBody {
                             &nonSystemMessages[nonSystemMessages.endIndex - 1],
                             content: message.content,
                             images: supportsImage ? message.images : [],
-                            audios: supportsAudio ? message.audios : []
+                            audios: supportsAudio ? message.audios : [],
+                            supportsMultipartMessageContent: supportsMultipartMessageContent
                         )
                     } else {
                         nonSystemMessages.append(.init(
                             role: .assistant,
-                            content: .contentParts(Self.convertContentPart(
-                                content: message.content,
-                                images: supportsImage ? message.images : [],
-                                audios: supportsAudio ? message.audios : []
-                            ))
+                            content: {
+                                if supportsMultipartMessageContent {
+                                    return .contentParts(Self.convertContentPart(
+                                        content: message.content,
+                                        images: supportsImage ? message.images : [],
+                                        audios: supportsAudio ? message.audios : []
+                                    ))
+                                }
+                                return .text(message.content)
+                            }()
                         ))
                     }
                 case (.user, _):
@@ -798,16 +831,22 @@ extension OpenAIChatCompletionsService.RequestBody {
                             &nonSystemMessages[nonSystemMessages.endIndex - 1],
                             content: message.content,
                             images: supportsImage ? message.images : [],
-                            audios: supportsAudio ? message.audios : []
+                            audios: supportsAudio ? message.audios : [],
+                            supportsMultipartMessageContent: supportsMultipartMessageContent
                         )
                     } else {
                         nonSystemMessages.append(.init(
                             role: .user,
-                            content: .contentParts(Self.convertContentPart(
-                                content: message.content,
-                                images: supportsImage ? message.images : [],
-                                audios: supportsAudio ? message.audios : []
-                            )),
+                            content: {
+                                if supportsMultipartMessageContent {
+                                    return .contentParts(Self.convertContentPart(
+                                        content: message.content,
+                                        images: supportsImage ? message.images : [],
+                                        audios: supportsAudio ? message.audios : []
+                                    ))
+                                }
+                                return .text(message.content)
+                            }(),
                             name: message.name,
                             tool_call_id: message.toolCallId
                         ))
@@ -817,15 +856,25 @@ extension OpenAIChatCompletionsService.RequestBody {
             messages = [
                 .init(
                     role: .system,
-                    content: .contentParts(systemPrompts)
+                    content: {
+                        if supportsMultipartMessageContent {
+                            return .contentParts(systemPrompts)
+                        }
+                        let textParts = systemPrompts.compactMap {
+                            if case let .text(text) = $0 { return text.text }
+                            return nil
+                        }
+
+                        return .text(textParts.joined(separator: "\n\n"))
+                    }()
                 ),
             ] + nonSystemMessages
 
             return
         }
-        
+
         // Default
-        
+
         messages = body.messages.map { message in
             .init(
                 role: {
@@ -840,11 +889,16 @@ extension OpenAIChatCompletionsService.RequestBody {
                         return .tool
                     }
                 }(),
-                content: .contentParts(Self.convertContentPart(
-                    content: message.content,
-                    images: supportsImage ? message.images : [],
-                    audios: supportsAudio ? message.audios : []
-                )),
+                content: {
+                    if supportsMultipartMessageContent {
+                        return .contentParts(Self.convertContentPart(
+                            content: message.content,
+                            images: supportsImage ? message.images : [],
+                            audios: supportsAudio ? message.audios : []
+                        ))
+                    }
+                    return .text(message.content)
+                }(),
                 name: message.name,
                 tool_calls: message.toolCalls?.map { tool in
                     MessageToolCall(

Original file line number	Diff line number	Diff line change
`@@ -322,6 +322,10 @@ struct ChatModelEditView: View {`
`322`	`322`	`Text("Enforce message order to be user/assistant alternated")`
`323`	`323`	`}`
`324`	`324`
	`325`	`+ Toggle(isOn: $store.openAICompatibleSupportsMultipartMessageContent) {`
	`326`	`+ Text("Support multi-part message content")`
	`327`	`+ }`
	`328`	`+`
`325`	`329`	`Button("Custom Headers") {`
`326`	`330`	`isEditingCustomHeader.toggle()`
`327`	`331`	`}`