feat: Add vitest tests and zod validation for streaming responses

ericc-ch · ericc-ch · commit 19ba330ab7d2 · 2025-03-02T15:38:45.000+07:00
diff --git a/bun.lock b/bun.lock
diff --git a/package.json b/package.json
@@ -7,8 +7,8 @@
     "github-copilot",
     "openai-compatible"
   ],
-  "homepage": "https://github.com/ericc-ch/copilot-api",
   "bugs": "https://github.com/ericc-ch/copilot-api/issues",
+  "homepage": "https://github.com/ericc-ch/copilot-api",
   "repository": {
     "type": "git",
     "url": "git+https://github.com/ericc-ch/copilot-api.git"
@@ -29,7 +29,8 @@
     "prepack": "bun run build",
     "prepare": "simple-git-hooks",
     "release": "bumpp && bun publish --access public",
-    "start": "NODE_ENV=production bun run ./src/main.ts"
+    "start": "NODE_ENV=production bun run ./src/main.ts",
+    "test": "vitest"
   },
   "simple-git-hooks": {
     "pre-commit": "bunx lint-staged"
@@ -45,17 +46,20 @@
     "hono": "^4.7.2",
     "ofetch": "^1.4.1",
     "pathe": "^2.0.3",
-    "srvx": "^0.1.4"
+    "srvx": "^0.1.4",
+    "zod": "^3.24.2"
   },
   "devDependencies": {
     "@echristian/eslint-config": "^0.0.23",
-    "@types/bun": "^1.2.3",
+    "@types/bun": "^1.2.4",
     "bumpp": "^10.0.3",
     "eslint": "^9.21.0",
     "knip": "^5.45.0",
     "lint-staged": "^15.4.3",
     "simple-git-hooks": "^2.11.1",
+    "tinyexec": "^0.3.2",
     "tsup": "^8.4.0",
-    "typescript": "^5.7.3"
+    "typescript": "^5.8.2",
+    "vitest": "^3.0.7"
   }
 }
diff --git a/src/main.ts b/src/main.ts
@@ -9,11 +9,11 @@ import { logger } from "./lib/logger"
 import { initializePort } from "./lib/port"
 import { server } from "./server"
 
-async function runServer(options: {
+export async function runServer(options: {
   port: number
   verbose: boolean
   logFile?: string
-}) {
+}): Promise<void> {
   if (options.verbose) {
     consola.level = 5
     consola.info("Verbose logging enabled")
diff --git a/src/routes/chat-completions/handler.ts b/src/routes/chat-completions/handler.ts
@@ -37,74 +37,54 @@ function createCondensedStreamingResponse(
   }
 }
 
-export async function handlerStreaming(c: Context) {
-  const models = modelsCache.getModels()
-  let payload = await c.req.json<ChatCompletionsPayload>()
-
-  if (isNullish(payload.max_tokens)) {
-    const selectedModel = models?.data.find(
-      (model) => model.id === payload.model,
-    )
-
-    payload = {
-      ...payload,
-      max_tokens: selectedModel?.capabilities.limits.max_output_tokens,
-    }
-  }
-
-  // Convert request headers to a regular object from Headers
-  const requestHeaders = c.req.header()
-
-  // Log the request at the beginning for both streaming and non-streaming cases
-  await logger.logRequest("/chat/completions", "POST", payload, requestHeaders)
-
-  if (payload.stream) {
+function handleStreaming(c: Context, payload: ChatCompletionsPayload) {
+  return streamSSE(c, async (stream) => {
     const response = await chatCompletionsStream(payload)
 
     // For collecting the complete streaming response
     let collectedContent = ""
     let finalChunk: ChatCompletionChunk | null = null
 
-    return streamSSE(c, async (stream) => {
-      for await (const chunk of response) {
-        await stream.writeSSE(chunk as SSEMessage)
+    for await (const chunk of response) {
+      await stream.writeSSE(chunk as SSEMessage)
 
-        if (!logger.options.enabled) continue
+      if (!logger.options.enabled) continue
 
-        // Check if chunk data is "DONE" or not a valid JSON string
-        if (!chunk.data || chunk.data === "[DONE]") {
-          continue // Skip processing this chunk for logging
-        }
+      // Skip empty chunks and the "[DONE]" sentinel; neither holds JSON to log
+      if (!chunk.data || chunk.data === "[DONE]") {
+        continue // Skip processing this chunk for logging
+      }
 
-        try {
-          const data = JSON.parse(chunk.data) as ChatCompletionChunk
+      try {
+        const data = JSON.parse(chunk.data) as ChatCompletionChunk
 
-          // Keep track of the latest chunk for metadata
-          finalChunk = data
+        // Keep track of the latest chunk for metadata
+        finalChunk = data
 
-          // Accumulate content from each delta
-          if (typeof data.choices[0].delta.content === "string") {
-            collectedContent += data.choices[0].delta.content
-          }
-        } catch (error) {
-          // Handle JSON parsing errors gracefully
-          consola.error(`Error parsing SSE chunk data`, error)
-          // Continue processing other chunks
+        // Accumulate content from each delta
+        if (typeof data.choices[0].delta.content === "string") {
+          collectedContent += data.choices[0].delta.content
         }
+      } catch (error) {
+        // Log malformed chunks (invalid JSON or an unexpected shape) gracefully
+        consola.error(`Error parsing SSE chunk data`, error)
+        // Continue processing other chunks
       }
+    }
 
-      // After streaming completes, log the condensed response
-      if (finalChunk) {
-        const condensedResponse = createCondensedStreamingResponse(
-          finalChunk,
-          collectedContent,
-        )
+    // After streaming completes, log the condensed response
+    if (finalChunk) {
+      const condensedResponse = createCondensedStreamingResponse(
+        finalChunk,
+        collectedContent,
+      )
 
-        await logger.logResponse("/chat/completions", condensedResponse, {})
-      }
-    })
-  }
+      await logger.logResponse("/chat/completions", condensedResponse, {})
+    }
+  })
+}
 
+async function handleNonStreaming(c: Context, payload: ChatCompletionsPayload) {
   const response = await chatCompletions(payload)
 
   // Get response headers if any
@@ -115,3 +95,31 @@ export async function handlerStreaming(c: Context) {
 
   return c.json(response)
 }
+
+export async function handleCompletion(c: Context) {
+  const models = modelsCache.getModels()
+  let payload = await c.req.json<ChatCompletionsPayload>()
+
+  if (isNullish(payload.max_tokens)) {
+    const selectedModel = models?.data.find(
+      (model) => model.id === payload.model,
+    )
+
+    payload = {
+      ...payload,
+      max_tokens: selectedModel?.capabilities.limits.max_output_tokens,
+    }
+  }
+
+  // Read all request headers as a plain object rather than a Headers instance
+  const requestHeaders = c.req.header()
+
+  // Log the request at the beginning for both streaming and non-streaming cases
+  await logger.logRequest("/chat/completions", "POST", payload, requestHeaders)
+
+  if (payload.stream) {
+    return handleStreaming(c, payload)
+  }
+
+  return handleNonStreaming(c, payload)
+}
diff --git a/src/routes/chat-completions/route.ts b/src/routes/chat-completions/route.ts
@@ -6,13 +6,13 @@ import { Hono, type Context } from "hono"
 import { FetchError } from "ofetch"
 
 import { logger } from "../../lib/logger"
-import { handlerStreaming } from "./handler"
+import { handleCompletion } from "./handler"
 
 export const completionRoutes = new Hono()
 
 completionRoutes.post("/", async (c) => {
   try {
-    return await handlerStreaming(c)
+    return await handleCompletion(c)
   } catch (error) {
     consola.error("Error occurred:", error)
     return handleError(c, error)
diff --git a/src/services/copilot/chat-completions/types-streaming.ts b/src/services/copilot/chat-completions/types-streaming.ts
@@ -1,63 +1,73 @@
-interface ContentFilterResults {
-  error: {
-    code: string
-    message: string
-  }
-  hate: {
-    filtered: boolean
-    severity: string
-  }
-  self_harm: {
-    filtered: boolean
-    severity: string
-  }
-  sexual: {
-    filtered: boolean
-    severity: string
-  }
-  violence: {
-    filtered: boolean
-    severity: string
-  }
-}
-
-interface ContentFilterOffsets {
-  check_offset: number
-  start_offset: number
-  end_offset: number
-}
-
-interface Delta {
-  content?: string
-  role?: string
-}
-
-interface Choice {
-  index: number
-  content_filter_offsets?: ContentFilterOffsets
-  content_filter_results?: ContentFilterResults
-  delta: Delta
-  finish_reason?: string | null
-}
-
-interface PromptFilterResult {
-  content_filter_results: ContentFilterResults
-  prompt_index: number
-}
-
-interface Usage {
-  completion_tokens: number
-  prompt_tokens: number
-  total_tokens: number
-}
-
-export interface ChatCompletionChunk {
-  choices: [Choice]
-  created: number
-  object: "chat.completion.chunk"
-  id: string
-  model: string
-  system_fingerprint?: string
-  prompt_filter_results?: Array<PromptFilterResult>
-  usage?: Usage | null
-}
+import * as z from "zod"
+
+const ContentFilterResultsSchema = z.object({
+  error: z.object({
+    code: z.string(),
+    message: z.string(),
+  }),
+  hate: z.object({
+    filtered: z.boolean(),
+    severity: z.string(),
+  }),
+  self_harm: z.object({
+    filtered: z.boolean(),
+    severity: z.string(),
+  }),
+  sexual: z.object({
+    filtered: z.boolean(),
+    severity: z.string(),
+  }),
+  violence: z.object({
+    filtered: z.boolean(),
+    severity: z.string(),
+  }),
+})
+
+const ContentFilterOffsetsSchema = z.object({
+  check_offset: z.number(),
+  start_offset: z.number(),
+  end_offset: z.number(),
+})
+
+const DeltaSchema = z.object({
+  content: z.string().optional(),
+  role: z.string().optional(),
+})
+
+const ChoiceSchema = z.object({
+  index: z.number(),
+  content_filter_offsets: ContentFilterOffsetsSchema.optional(),
+  content_filter_results: ContentFilterResultsSchema.optional(),
+  delta: DeltaSchema,
+  finish_reason: z.string().nullable().optional(),
+})
+
+const PromptFilterResultSchema = z.object({
+  content_filter_results: ContentFilterResultsSchema,
+  prompt_index: z.number(),
+})
+
+const UsageSchema = z.object({
+  completion_tokens: z.number(),
+  prompt_tokens: z.number(),
+  total_tokens: z.number(),
+})
+
+export const ChatCompletionChunkSchema = z.object({
+  choices: z.array(ChoiceSchema),
+  created: z.number(),
+  object: z.literal("chat.completion.chunk"),
+  id: z.string(),
+  model: z.string(),
+  system_fingerprint: z.string().optional(),
+  prompt_filter_results: z.array(PromptFilterResultSchema).optional(),
+  usage: UsageSchema.nullable().optional(),
+})
+
+export type ContentFilterResults = z.infer<typeof ContentFilterResultsSchema>
+export type ContentFilterOffsets = z.infer<typeof ContentFilterOffsetsSchema>
+export type Delta = z.infer<typeof DeltaSchema>
+export type Choice = z.infer<typeof ChoiceSchema>
+export type PromptFilterResult = z.infer<typeof PromptFilterResultSchema>
+export type Usage = z.infer<typeof UsageSchema>
+export type ChatCompletionChunk = z.infer<typeof ChatCompletionChunkSchema>
diff --git a/test/main.test.ts b/test/main.test.ts