Commit

Merge branch 'main' into feat-frontend-mainPage
pengyu committed Feb 4, 2025
2 parents d0702f5 + c887b7c commit 334c101
Showing 9 changed files with 15,026 additions and 1,438 deletions.
13,142 changes: 13,142 additions & 0 deletions backend/package-lock.json

Large diffs are not rendered by default.

2 changes: 1 addition & 1 deletion frontend/README.md
@@ -3,7 +3,7 @@
// remember to follow this command to configure the backend endpoint:

```sh
- cp .env.example .env
+ cp example.env .env
```

struct for now
1 change: 1 addition & 0 deletions frontend/example.env
@@ -0,0 +1 @@
NEXT_PUBLIC_GRAPHQL_URL=http://localhost:8080/graphql
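
For context, Next.js inlines `NEXT_PUBLIC_`-prefixed variables into the client bundle at build time, so the value from the copied `.env` is what the browser ends up with. A minimal sketch of how the frontend could read it; the helper module and the localhost fallback are illustrative assumptions, not part of this commit:

```ts
// Hypothetical helper, not part of this commit.
// Next.js replaces process.env.NEXT_PUBLIC_* references at build time.
export const GRAPHQL_URL =
  process.env.NEXT_PUBLIC_GRAPHQL_URL ?? 'http://localhost:8080/graphql';
```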
6 changes: 3 additions & 3 deletions frontend/package.json
@@ -41,11 +41,11 @@
"graphql": "^16.9.0",
"graphql-ws": "^5.16.0",
"lucide-react": "^0.445.0",
"next": "^14.2.13",
"next": "^15.1.4",
"next-themes": "^0.3.0",
"react": "^18.3.1",
"react": "^19.0.0",
"react-code-blocks": "^0.1.6",
"react-dom": "^18.3.1",
"react-dom": "^19.0.0",
"react-dropzone": "^14.2.9",
"react-hook-form": "^7.53.0",
"react-markdown": "^9.0.1",
2 changes: 1 addition & 1 deletion frontend/src/app/(main)/chat/page.tsx
@@ -21,7 +21,7 @@ export default function Home() {

const { models } = useModels();
const [selectedModel, setSelectedModel] = useState<string>(
- models[0] || 'gpt-4o'
+ 'gpt-4o'
);

const { refetchChats } = useChatList();
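
The hunk above hard-codes `'gpt-4o'` as the initial selection instead of deriving it from `models[0]`. If the list returned by `useModels()` loads asynchronously, one way to keep the selection in sync is a small effect. This is an illustrative sketch under that assumption, not code from the commit:

```ts
import { useEffect, useState } from 'react';

// Illustrative hook; `models` is assumed to start empty and fill in
// once the backend responds.
function useSelectedModel(models: string[], fallback = 'gpt-4o') {
  const [selectedModel, setSelectedModel] = useState<string>(fallback);

  useEffect(() => {
    // Once models arrive, prefer one the backend actually offers.
    if (models.length > 0 && !models.includes(selectedModel)) {
      setSelectedModel(models[0]);
    }
  }, [models, selectedModel]);

  return [selectedModel, setSelectedModel] as const;
}
```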
2 changes: 1 addition & 1 deletion frontend/src/components/global-loading.tsx
@@ -1,4 +1,4 @@
- 'use client';
+ "use client";
import { Loader2 } from 'lucide-react';
import { useTheme } from 'next-themes';

40 changes: 19 additions & 21 deletions frontend/src/lib/client.ts
@@ -15,22 +15,22 @@ import { getMainDefinition } from '@apollo/client/utilities';

// HTTP Link
const httpLink = new HttpLink({

uri: process.env.NEXT_PUBLIC_GRAPHQL_URL,
headers: {
'Access-Control-Allow-Credentials': 'true',
'Access-Control-Allow-Origin': '*',
},
});

// WebSocket Link (only in browser environment)
- let wsLink = null;
+ let wsLink;
if (typeof window !== 'undefined') {
// WebSocket Link
wsLink = new GraphQLWsLink(
createClient({
url: process.env.NEXT_PUBLIC_GRAPHQL_URL,
connectionParams: () => {
- const token = localStorage.getItem(LocalStore.accessToken);
- return token ? { Authorization: `Bearer ${token}` } : {};
+ return {};
},
})
);
@@ -80,26 +80,24 @@ const errorLink = onError(({ graphQLErrors, networkError, operation }) => {
});

// Split traffic based on operation type
- const splitLink = wsLink
- ? split(
- ({ query }) => {
- if (!query) {
- throw new Error('Query is undefined');
- }
- const definition = getMainDefinition(query);
- return (
- definition.kind === 'OperationDefinition' &&
- definition.operation === 'subscription'
- );
- },
- wsLink,
- from([errorLink, requestLoggingMiddleware, authMiddleware, httpLink])
- )
- : from([errorLink, requestLoggingMiddleware, authMiddleware, httpLink]);
+ const splitLink = split(
+ ({ query }) => {
+ if (!query) {
+ throw new Error("Query is undefined");
+ }
+ const definition = getMainDefinition(query);
+ return (
+ definition.kind === 'OperationDefinition' &&
+ definition.operation === 'subscription'
+ );
+ },
+ wsLink,
+ from([errorLink, requestLoggingMiddleware, authMiddleware, httpLink])
+ );

// Create Apollo Client
const client = new ApolloClient({
- link: splitLink, // Use splitLink here
+ link: wsLink ? from([httpLink, wsLink]) : httpLink,
cache: new InMemoryCache(),
defaultOptions: {
watchQuery: {
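
For reference, components consume this client through `ApolloProvider`; with a `split` link, subscription operations are routed to `wsLink` while queries and mutations travel over HTTP. The sketch below is illustrative only: the component names, the `messageAdded` subscription field, and the default export of `client.ts` are assumptions, not part of this commit.

```tsx
'use client';
import { ApolloProvider, gql, useSubscription } from '@apollo/client';
import client from '@/lib/client'; // assumes client.ts default-exports the ApolloClient instance

// Hypothetical subscription document; the schema field is illustrative.
const MESSAGE_ADDED = gql`
  subscription OnMessageAdded($chatId: ID!) {
    messageAdded(chatId: $chatId) {
      id
      content
    }
  }
`;

function Messages({ chatId }: { chatId: string }) {
  const { data, loading } = useSubscription(MESSAGE_ADDED, { variables: { chatId } });
  if (loading) return <p>Waiting for messages…</p>;
  return <pre>{JSON.stringify(data, null, 2)}</pre>;
}

export default function ChatStream({ chatId }: { chatId: string }) {
  return (
    <ApolloProvider client={client}>
      <Messages chatId={chatId} />
    </ApolloProvider>
  );
}
```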
251 changes: 251 additions & 0 deletions llm-server/src/model/openai-model-provider.ts
@@ -0,0 +1,251 @@
import { Response } from 'express';
import OpenAI from 'openai';
import { Logger } from '@nestjs/common';
import { systemPrompts } from '../prompt/systemPrompt';
import { ChatCompletionMessageParam } from 'openai/resources/chat/completions';
import PQueue from 'p-queue';
import { GenerateMessageParams } from '../types';

export interface OpenAIProviderOptions {
maxConcurrentRequests?: number;
maxRetries?: number;
retryDelay?: number;
queueInterval?: number;
intervalCap?: number;
apiKey?: string;
systemPromptKey?: string;
}

interface QueuedRequest {
params: GenerateMessageParams;
res: Response;
retries: number;
}

export class OpenAIModelProvider {
private readonly logger = new Logger(OpenAIModelProvider.name);
private openai: OpenAI;
private requestQueue: PQueue;
private readonly options: Required<OpenAIProviderOptions>;

constructor(options: OpenAIProviderOptions = {}) {
this.options = {
maxConcurrentRequests: 5,
maxRetries: 3,
retryDelay: 1000,
queueInterval: 1000,
intervalCap: 10,
apiKey: process.env.OPENAI_API_KEY,
systemPromptKey: 'codefox-basic',
...options,
};
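// Throttle outbound OpenAI calls: the queue runs at most `maxConcurrentRequests`
// at once and admits at most `intervalCap` requests per `queueInterval` ms window.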

this.requestQueue = new PQueue({
concurrency: this.options.maxConcurrentRequests,
interval: this.options.queueInterval,
intervalCap: this.options.intervalCap,
});

this.requestQueue.on('active', () => {
this.logger.debug(
`Queue size: ${this.requestQueue.size}, Pending: ${this.requestQueue.pending}`,
);
});
}

async initialize(): Promise<void> {
this.logger.log('Initializing OpenAI model...');
this.logger.log('Options:', this.options);
if (!this.options.apiKey) {
throw new Error('OpenAI API key is required');
}

this.openai = new OpenAI({
apiKey: this.options.apiKey,
});

this.logger.log(
`OpenAI model initialized with options:
- Max Concurrent Requests: ${this.options.maxConcurrentRequests}
- Max Retries: ${this.options.maxRetries}
- Queue Interval: ${this.options.queueInterval}ms
- Interval Cap: ${this.options.intervalCap}
- System Prompt Key: ${this.options.systemPromptKey}`,
);
}

async generateStreamingResponse(
params: GenerateMessageParams,
res: Response,
): Promise<void> {
const request: QueuedRequest = {
params,
res,
retries: 0,
};

await this.requestQueue.add(() => this.processRequest(request));
}

private async processRequest(request: QueuedRequest): Promise<void> {
const { params, res, retries } = request;
const { model, messages } = params as {
model: string;
messages: ChatCompletionMessageParam[];
};
this.logger.log(`Processing model: ${model}`);
this.logger.log(`Processing request (attempt ${retries + 1})`);
const startTime = Date.now();

try {
res.writeHead(200, {
'Content-Type': 'text/event-stream',
'Cache-Control': 'no-cache',
Connection: 'keep-alive',
});

const systemPrompt =
systemPrompts[this.options.systemPromptKey]?.systemPrompt || '';
const allMessages: ChatCompletionMessageParam[] = [
{ role: 'system', content: systemPrompt },
...messages,
];
console.log(allMessages);
const stream = await this.openai.chat.completions.create({
model,
messages: allMessages,
stream: true,
});

let chunkCount = 0;
for await (const chunk of stream) {
const content = chunk.choices[0]?.delta?.content || '';
if (content) {
chunkCount++;
res.write(`data: ${JSON.stringify(chunk)}\n\n`);
}
}

const endTime = Date.now();
this.logger.log(
`Response completed. Chunks: ${chunkCount}, Time: ${endTime - startTime}ms`,
);
res.write(`data: [DONE]\n\n`);
res.end();
} catch (error) {
const errorMessage =
error instanceof Error ? error.message : String(error);

const isServerError = errorMessage.includes('server had an error');
const isRateLimit = errorMessage.includes('rate_limit');
const isAuthError = errorMessage.includes('authentication');

if ((isServerError || isRateLimit) && retries < this.options.maxRetries) {
this.logger.warn(
`Request failed (attempt ${retries + 1}) with error: ${errorMessage}. Retrying...`,
);
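// Exponential backoff capped at 30 seconds; server errors start from a 5 s base delay.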

const baseDelay = isServerError ? 5000 : this.options.retryDelay;
const delay = Math.min(baseDelay * Math.pow(2, retries), 30000);

await new Promise(resolve => setTimeout(resolve, delay));

request.retries++;
await this.requestQueue.add(() => this.processRequest(request));
return;
}

const errorResponse = {
error: {
message: errorMessage,
code: isServerError
? 'SERVER_ERROR'
: isRateLimit
? 'RATE_LIMIT'
: isAuthError
? 'AUTH_ERROR'
: 'UNKNOWN_ERROR',
retryable: isServerError || isRateLimit,
retries: retries,
},
};

this.logger.error('Error during OpenAI response generation:', {
error: errorResponse,
params: {
model,
messageLength: messages.length,
},
});

res.write(`data: ${JSON.stringify(errorResponse)}\n\n`);
res.write(`data: [DONE]\n\n`);
res.end();
}
}

private shouldRetry(error: any): boolean {
const retryableErrors = [
'rate_limit_exceeded',
'timeout',
'service_unavailable',
];

if (error instanceof Error) {
return retryableErrors.some(e => error.message.includes(e));
}

return false;
}

async getModelTagsResponse(res: Response): Promise<void> {
await this.requestQueue.add(async () => {
this.logger.log('Fetching available models from OpenAI...');
res.writeHead(200, {
'Content-Type': 'text/event-stream',
'Cache-Control': 'no-cache',
Connection: 'keep-alive',
});

try {
const startTime = Date.now();
const models = await this.openai.models.list();
const response = {
models: models,
};
const endTime = Date.now();

this.logger.log(
`Models fetched: ${models.data.length}, Time: ${endTime - startTime}ms`,
);

res.write(JSON.stringify(response));
res.end();
} catch (error) {
this.logger.error('Error fetching models:', error);
const errorResponse = {
error: {
message: 'Failed to fetch models',
code: 'FETCH_MODELS_ERROR',
details: error instanceof Error ? error.message : 'Unknown error',
},
};
res.write(`data: ${JSON.stringify(errorResponse)}\n\n`);
res.write(`data: [DONE]\n\n`);
res.end();
}
});
}

getOptions(): Readonly<OpenAIProviderOptions> {
return { ...this.options };
}

getQueueStatus() {
return {
size: this.requestQueue.size,
pending: this.requestQueue.pending,
isPaused: this.requestQueue.isPaused,
};
}
}
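
To illustrate how this provider is typically wired up, here is a minimal Express sketch. The route paths, port, and request shape are assumptions made for the example, not part of this commit; only `initialize`, `generateStreamingResponse`, and `getModelTagsResponse` come from the class above.

```ts
// Hypothetical wiring sketch, not part of this commit.
import express from 'express';
import { OpenAIModelProvider } from './model/openai-model-provider';

const app = express();
app.use(express.json());

const provider = new OpenAIModelProvider({ maxConcurrentRequests: 5, maxRetries: 3 });

async function main() {
  await provider.initialize(); // throws if OPENAI_API_KEY is not set

  // Stream chat completions back to the caller as server-sent events.
  // req.body is assumed to match GenerateMessageParams, i.e. { model, messages }.
  app.post('/chat/completions', async (req, res) => {
    await provider.generateStreamingResponse(req.body, res);
  });

  // List the models available to the configured API key.
  app.get('/tags', async (_req, res) => {
    await provider.getModelTagsResponse(res);
  });

  app.listen(3001, () => console.log('llm-server listening on :3001'));
}

main().catch(err => {
  console.error(err);
  process.exit(1);
});
```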