**Refactor:** Restructure server package to streamline imports and improve file organization

- Moved `providers`, `services`, `models`, `lib`, and related files into the `src` directory within the `server` package.
- Adjusted imports across the codebase to reflect the new paths.
- Renamed several `.ts` files for consistency.
- Introduced an `index.ts` in the `ai/providers` package to export all providers.

This improves maintainability and aligns with the project's updated directory structure.
2025-09-08 22:56:46 +00:00 · 2025-06-24 20:46:15 -04:00
parent 0b8d67fc69
commit c6e09644e2
62 changed files with 486 additions and 231 deletions
--- a/packages/ai/providers/cloudflareAi.ts
+++ b/packages/ai/providers/cloudflareAi.ts
@@ -0,0 +1,142 @@
+import { OpenAI } from 'openai';
+
+import { ProviderRepository } from './_ProviderRepository.ts';
+import { BaseChatProvider, type CommonProviderParams } from './chat-stream-provider.ts';
+
+/**
+ * Chat provider that talks to Cloudflare through an OpenAI client.
+ *
+ * The model prefix (`@cf/...` or `@hf/...`) and the `max_tokens` value are both
+ * derived from case-insensitive substrings of the model name. Every rule is
+ * evaluated and the LAST match wins, so the order of the rule tables matters.
+ */
+export class CloudflareAiChatProvider extends BaseChatProvider {
+  /**
+   * Creates an OpenAI client for the Cloudflare endpoint template exposed by
+   * `ProviderRepository`, with `{CLOUDFLARE_ACCOUNT_ID}` filled in from `param.env`.
+   */
+  getOpenAIClient(param: CommonProviderParams): OpenAI {
+    const { CLOUDFLARE_API_KEY, CLOUDFLARE_ACCOUNT_ID } = param.env;
+    const endpoint = ProviderRepository.OPENAI_COMPAT_ENDPOINTS.cloudflare;
+    return new OpenAI({
+      apiKey: CLOUDFLARE_API_KEY,
+      baseURL: endpoint.replace('{CLOUDFLARE_ACCOUNT_ID}', CLOUDFLARE_ACCOUNT_ID),
+    });
+  }
+
+  /**
+   * Builds the streaming request payload for `param.model`.
+   *
+   * @param param - Request parameters; only `param.model` is read here.
+   * @param safeMessages - Messages placed in the payload as given.
+   * @returns `model`, `messages` and `stream: true`, plus `max_tokens` when a rule matches.
+   */
+  getStreamParams(param: CommonProviderParams, safeMessages: any[]): any {
+    const payload: Record<string, any> = {
+      model: this.getModelWithPrefix(param.model),
+      messages: safeMessages,
+      stream: true,
+    };
+
+    // Prefix-wide default first; the model-specific limits below override it.
+    const prefix = this.getModelPrefix(param.model);
+    let limit: number | undefined;
+    if (prefix === '@cf/meta' || prefix === '@hf/mistral') {
+      limit = 4096;
+    }
+
+    const modelLimits: Array<[string, number]> = [
+      ['hermes-2-pro-mistral-7b', 1000],
+      ['openhermes-2.5-mistral-7b-awq', 1000],
+      ['deepseek-coder-6.7b-instruct-awq', 590],
+      ['deepseek-math-7b-instruct', 512],
+      ['neural-chat-7b-v3-1-awq', 590],
+      ['openchat-3.5-0106', 2000],
+    ];
+    const lowered = param.model.toLowerCase();
+    for (const [fragment, maxTokens] of modelLimits) {
+      if (lowered.includes(fragment)) {
+        limit = maxTokens;
+      }
+    }
+
+    if (limit !== undefined) {
+      payload['max_tokens'] = limit;
+    }
+    return payload;
+  }
+
+  /**
+   * Picks the model prefix for a model name.
+   *
+   * @returns The prefix of the last matching rule, or `@cf/meta` when none match.
+   */
+  private getModelPrefix(model: string): string {
+    const prefixRules: Array<[string, string]> = [
+      ['llama', '@cf/meta'],
+      ['hermes-2-pro-mistral-7b', '@hf/nousresearch'],
+      ['mistral-7b-instruct', '@hf/mistral'],
+      ['gemma', '@cf/google'],
+      ['deepseek', '@cf/deepseek-ai'],
+      ['openchat-3.5-0106', '@cf/openchat'],
+      ['neural-chat-7b-v3-1-awq', '@hf/thebloke'],
+      ['openhermes-2.5-mistral-7b-awq', '@hf/thebloke'],
+      ['zephyr-7b-beta-awq', '@hf/thebloke'],
+      ['deepseek-coder-6.7b-instruct-awq', '@hf/thebloke'],
+    ];
+
+    const lowered = model.toLowerCase();
+    let chosen = '@cf/meta';
+    for (const [fragment, prefix] of prefixRules) {
+      if (lowered.includes(fragment)) {
+        chosen = prefix;
+      }
+    }
+    return chosen;
+  }
+
+  /** Returns the model name qualified as `<prefix>/<model>`. */
+  private getModelWithPrefix(model: string): string {
+    return this.getModelPrefix(model) + '/' + model;
+  }
+
+  /**
+   * Forwards a stream chunk to `dataCallback` as a `chat` event.
+   *
+   * @returns `true` when the first choice reports `finish_reason === 'stop'`, else `false`.
+   */
+  async processChunk(chunk: any, dataCallback: (data: any) => void): Promise<boolean> {
+    const finished = Boolean(chunk.choices) && chunk.choices[0]?.finish_reason === 'stop';
+    dataCallback({ type: 'chat', data: chunk });
+    return finished;
+  }
+}
+
+/** Static facade that routes stream requests to one shared `CloudflareAiChatProvider`. */
+export class CloudflareAISdk {
+  private static provider = new CloudflareAiChatProvider();
+
+  /**
+   * Delegates to the shared provider's `handleStream` and returns its result.
+   *
+   * @param param - Request fields; every field except `openai` is forwarded.
+   * @param dataCallback - Passed through to `handleStream` unchanged.
+   */
+  static async handleCloudflareAIStream(
+    param: {
+      openai: OpenAI;
+      systemPrompt: any;
+      preprocessedContext: any;
+      maxTokens: unknown | number | undefined;
+      messages: any;
+      model: string;
+      env: Env;
+    },
+    dataCallback: (data: any) => void,
+  ) {
+    const { systemPrompt, preprocessedContext, maxTokens, messages, model, env } = param;
+    const request = { systemPrompt, preprocessedContext, maxTokens, messages, model, env };
+
+    return this.provider.handleStream(request, dataCallback);
+  }
+}