feat(nx-dev): move openai call to edge function (#18747)

2023-08-24 18:59:31 +03:00 · 2023-08-24 18:59:31 +03:00 · bd76b6228f
commit bd76b6228f
parent 12db1e0c77
3 changed files with 100 additions and 47 deletions
--- a/nx-dev/data-access-ai/src/lib/data-access-ai.ts
+++ b/nx-dev/data-access-ai/src/lib/data-access-ai.ts
@ -7,13 +7,7 @@ import {
  createClient,
 } from '@supabase/supabase-js';
 import GPT3Tokenizer from 'gpt3-tokenizer';
-import {
+import { CreateEmbeddingResponse, CreateCompletionResponseUsage } from 'openai';
  Configuration,
  OpenAIApi,
  CreateModerationResponse,
  CreateEmbeddingResponse,
  CreateCompletionResponseUsage,
 } from 'openai';
 import {
  ApplicationError,
  ChatItem,
@ -23,6 +17,7 @@ import {
  getListOfSources,
  getMessageFromResponse,
  initializeChat,
  openAiCall,
  sanitizeLinksInResponse,
  toMarkdownList,
 } from './utils';
@ -37,13 +32,8 @@ const MIN_CONTENT_LENGTH = 50;
 // This is a temporary solution
 const MAX_HISTORY_LENGTH = 30;
 const openAiKey = process.env['NX_OPENAI_KEY'];
 const supabaseUrl = process.env['NX_NEXT_PUBLIC_SUPABASE_URL'];
 const supabaseServiceKey = process.env['NX_SUPABASE_SERVICE_ROLE_KEY'];
 const config = new Configuration({
  apiKey: openAiKey,
 });
 const openai = new OpenAIApi(config);
 let chatFullHistory: ChatItem[] = [];
@ -72,7 +62,7 @@ export async function queryAi(
  }
  try {
-    checkEnvVariables(openAiKey, supabaseUrl, supabaseServiceKey);
+    checkEnvVariables(supabaseUrl, supabaseServiceKey);
    if (!query) {
      throw new UserError('Missing query in request data');
@ -80,10 +70,12 @@ export async function queryAi(
    // Moderate the content to comply with OpenAI T&C
    const sanitizedQuery = query.trim();
-    const moderationResponse: CreateModerationResponse = await openai
+    const moderationResponseObj = await openAiCall(
-      .createModeration({ input: sanitizedQuery })
+      { input: sanitizedQuery },
-      .then((res) => res.data);
+      'moderation'
    );
    const moderationResponse = await moderationResponseObj.json();
    const [results] = moderationResponse.results;
    if (results.flagged) {
@ -104,29 +96,29 @@ export async function queryAi(
     *
     * How the solution looks like with previous response:
     *
-     *     const embeddingResponse = await openai.createEmbedding({
+     *     const embeddingResponse = await openAiCall(
-     *         model: 'text-embedding-ada-002',
+     *      { input: sanitizedQuery + aiResponse },
-     *         input: sanitizedQuery + aiResponse,
+     *      'embedding'
-     *       });
+     *     );
     *
-     * This costs more tokens, so if we see conts skyrocket we remove it.
+     * This costs more tokens, so if we see costs skyrocket we remove it.
     * As it says in the docs, it's a design decision, and it may or may not really improve results.
     */
-    const embeddingResponse = await openai.createEmbedding({
+    const embeddingResponseObj = await openAiCall(
-      model: 'text-embedding-ada-002',
+      { input: sanitizedQuery + aiResponse, model: 'text-embedding-ada-002' },
-      input: sanitizedQuery + aiResponse,
+      'embedding'
    });
    if (embeddingResponse.status !== 200) {
      throw new ApplicationError(
        'Failed to create embedding for question',
        embeddingResponse
    );
    if (!embeddingResponseObj.ok) {
      throw new ApplicationError('Failed to create embedding for question', {
        data: embeddingResponseObj.status,
      });
    }
    const embeddingResponse = await embeddingResponseObj.json();
    const {
      data: [{ embedding }],
-    }: CreateEmbeddingResponse = embeddingResponse.data;
+    }: CreateEmbeddingResponse = embeddingResponse;
    const { error: matchError, data: pageSections } = await supabaseClient.rpc(
      'match_page_sections_2',
@ -196,33 +188,39 @@ export async function queryAi(
    chatFullHistory = chatHistory;
-    const response = await openai.createChatCompletion({
+    const responseObj = await openAiCall(
      {
        model: 'gpt-3.5-turbo-16k',
        messages: chatGptMessages,
        temperature: 0,
        stream: false,
-    });
+      },
      'chatCompletion'
    );
-    if (response.status !== 200) {
+    if (!responseObj.ok) {
-      const error = response.data;
+      throw new ApplicationError('Failed to generate completion', {
-      throw new ApplicationError('Failed to generate completion', error);
+        data: responseObj.status,
      });
    }
    const response = await responseObj.json();
    // Message asking to double-check
    const callout: string =
      '{% callout type="warning" title="Always double-check!" %}The results may not be accurate, so please always double check with our documentation.{% /callout %}\n';
    // Append the warning message asking to double-check!
-    const message = [callout, getMessageFromResponse(response.data)].join('');
+    const message = [callout, getMessageFromResponse(response)].join('');
    const responseWithoutBadLinks = await sanitizeLinksInResponse(message);
    const sources = getListOfSources(pageSections);
-    totalTokensSoFar += response.data.usage?.total_tokens ?? 0;
+    totalTokensSoFar += response.usage?.total_tokens ?? 0;
    return {
      textResponse: responseWithoutBadLinks,
-      usage: response.data.usage as CreateCompletionResponseUsage,
+      usage: response.usage as CreateCompletionResponseUsage,
      sources,
      sourcesMarkdown: toMarkdownList(sources),
    };
--- a/nx-dev/data-access-ai/src/lib/utils.ts
+++ b/nx-dev/data-access-ai/src/lib/utils.ts
@ -93,13 +93,9 @@ async function is404(url: string): Promise<boolean> {
 }
 export function checkEnvVariables(
  openAiKey?: string,
  supabaseUrl?: string,
  supabaseServiceKey?: string
 ) {
  if (!openAiKey) {
    throw new ApplicationError('Missing environment variable NX_OPENAI_KEY');
  }
  if (!supabaseUrl) {
    throw new ApplicationError(
      'Missing environment variable NX_NEXT_PUBLIC_SUPABASE_URL'
@ -211,3 +207,17 @@ export interface ChatItem {
  role: ChatCompletionRequestMessageRoleEnum;
  content: string;
 }
 /**
  * Sends an OpenAI request description to the `/api/openai-handler` route.
  *
  * The request is a JSON `POST` whose body carries the `action` name and a
  * shallow copy of `input`. The promise returned by `fetch` is handed back
  * as-is: callers are responsible for checking `ok`/`status` and for decoding
  * the body.
  *
  * @param input Payload to forward under the `input` key of the request body.
  * @param action Which operation the handler should perform.
  * @returns The pending `fetch` call for the handler route.
  */
 export function openAiCall(
  input: object,
  action: 'moderation' | 'embedding' | 'chatCompletion'
 ) {
  // Key order (`action`, then `input`) is kept so the serialized body is unchanged.
  const payload = { action, input: { ...input } };
  const requestInit = {
    method: 'POST',
    headers: { 'Content-Type': 'application/json' },
    body: JSON.stringify(payload),
  };
  return fetch('/api/openai-handler', requestInit);
 }
--- a/nx-dev/nx-dev/pages/api/openai-handler.ts
+++ b/nx-dev/nx-dev/pages/api/openai-handler.ts
@ -0,0 +1,45 @@
 import { NextRequest } from 'next/server';
 const openAiKey = process.env['NX_OPENAI_KEY'];
 export const config = {
  runtime: 'edge',
 };
 // Base URL every supported action is resolved against.
 const OPENAI_API_BASE_URL = 'https://api.openai.com/v1/';
 // Supported `action` values and the OpenAI path each one maps to. A Map is
 // used so that inherited object keys (e.g. "constructor") never match.
 const OPENAI_ENDPOINTS = new Map<string, string>([
  ['embedding', 'embeddings'],
  ['chatCompletion', 'chat/completions'],
  ['moderation', 'moderations'],
 ]);
 /**
  * API route (configured above for the `edge` runtime) that forwards a request
  * to the OpenAI HTTP API using the server-side `NX_OPENAI_KEY`.
  *
  * The request body must be a JSON object of the form `{ action, input }`.
  * `action` selects the OpenAI endpoint; `input` is serialized unchanged and
  * sent as the upstream request body.
  *
  * NOTE(review): nothing in this handler authenticates the caller or validates
  * `input`, so any client that can reach the route can spend the configured
  * key. Confirm that protection exists elsewhere (middleware, rate limiting).
  *
  * @param request Incoming request whose JSON body is `{ action, input }`.
  * @returns
  *  - 400 when the body is not a JSON object or `action` is not supported;
  *  - 500 when `NX_OPENAI_KEY` is not configured, or when the upstream call or
  *    decoding of its JSON body throws;
  *  - otherwise the upstream status code together with the upstream JSON body.
  */
 export default async function handler(request: NextRequest): Promise<Response> {
  // Parse defensively: a malformed body must produce a 400, not an unhandled
  // rejection.
  let payload: unknown;
  try {
    payload = await request.json();
  } catch {
    return new Response('Invalid JSON body', { status: 400 });
  }
  // `null` and primitives are valid JSON but cannot be destructured.
  if (typeof payload !== 'object' || payload === null) {
    return new Response('Invalid JSON body', { status: 400 });
  }
  const { action, input } = payload as { action?: unknown; input?: unknown };
  const endpoint =
    typeof action === 'string' ? OPENAI_ENDPOINTS.get(action) : undefined;
  if (endpoint === undefined) {
    return new Response('Invalid action', { status: 400 });
  }
  // Fail fast instead of sending "Bearer undefined" upstream.
  if (!openAiKey) {
    console.error('Missing environment variable NX_OPENAI_KEY');
    return new Response('Missing environment variable NX_OPENAI_KEY', {
      status: 500,
    });
  }
  try {
    const response = await fetch(OPENAI_API_BASE_URL + endpoint, {
      method: 'POST',
      headers: {
        Authorization: `Bearer ${openAiKey}`,
        'Content-Type': 'application/json',
      },
      body: JSON.stringify(input),
    });
    const responseData: unknown = await response.json();
    // Mirror the upstream status so callers can rely on `ok`/`status`.
    return new Response(JSON.stringify(responseData), {
      status: response.status,
      headers: {
        'content-type': 'application/json',
      },
    });
  } catch (e: unknown) {
    // The caught value is `unknown`; narrow before reading `.message`.
    const message = e instanceof Error ? e.message : String(e);
    console.error('Error processing the request:', message);
    return new Response(message, { status: 500 });
  }
 }