Skip to content

Commit

Permalink
feat(nx-dev): move openai call to edge function (#18747)
Browse files Browse the repository at this point in the history
  • Loading branch information
mandarini authored Aug 24, 2023
1 parent 12db1e0 commit bd76b62
Show file tree
Hide file tree
Showing 3 changed files with 101 additions and 48 deletions.
86 changes: 42 additions & 44 deletions nx-dev/data-access-ai/src/lib/data-access-ai.ts
Original file line number Diff line number Diff line change
Expand Up @@ -7,13 +7,7 @@ import {
createClient,
} from '@supabase/supabase-js';
import GPT3Tokenizer from 'gpt3-tokenizer';
import {
Configuration,
OpenAIApi,
CreateModerationResponse,
CreateEmbeddingResponse,
CreateCompletionResponseUsage,
} from 'openai';
import { CreateEmbeddingResponse, CreateCompletionResponseUsage } from 'openai';
import {
ApplicationError,
ChatItem,
Expand All @@ -23,6 +17,7 @@ import {
getListOfSources,
getMessageFromResponse,
initializeChat,
openAiCall,
sanitizeLinksInResponse,
toMarkdownList,
} from './utils';
Expand All @@ -37,13 +32,8 @@ const MIN_CONTENT_LENGTH = 50;
// This is a temporary solution
const MAX_HISTORY_LENGTH = 30;

const openAiKey = process.env['NX_OPENAI_KEY'];
const supabaseUrl = process.env['NX_NEXT_PUBLIC_SUPABASE_URL'];
const supabaseServiceKey = process.env['NX_SUPABASE_SERVICE_ROLE_KEY'];
const config = new Configuration({
apiKey: openAiKey,
});
const openai = new OpenAIApi(config);

let chatFullHistory: ChatItem[] = [];

Expand Down Expand Up @@ -72,18 +62,20 @@ export async function queryAi(
}

try {
checkEnvVariables(openAiKey, supabaseUrl, supabaseServiceKey);
checkEnvVariables(supabaseUrl, supabaseServiceKey);

if (!query) {
throw new UserError('Missing query in request data');
}

// Moderate the content to comply with OpenAI T&C
const sanitizedQuery = query.trim();
const moderationResponse: CreateModerationResponse = await openai
.createModeration({ input: sanitizedQuery })
.then((res) => res.data);
const moderationResponseObj = await openAiCall(
{ input: sanitizedQuery },
'moderation'
);

const moderationResponse = await moderationResponseObj.json();
const [results] = moderationResponse.results;

if (results.flagged) {
Expand All @@ -104,29 +96,29 @@ export async function queryAi(
*
* What the solution looks like with the previous response:
*
* const embeddingResponse = await openai.createEmbedding({
* model: 'text-embedding-ada-002',
* input: sanitizedQuery + aiResponse,
* });
* const embeddingResponse = await openAiCall(
* { input: sanitizedQuery + aiResponse },
* 'embedding'
* );
*
* This costs more tokens, so if we see conts skyrocket we remove it.
* This costs more tokens, so if we see costs skyrocket we remove it.
* As it says in the docs, it's a design decision, and it may or may not really improve results.
*/
const embeddingResponse = await openai.createEmbedding({
model: 'text-embedding-ada-002',
input: sanitizedQuery + aiResponse,
});

if (embeddingResponse.status !== 200) {
throw new ApplicationError(
'Failed to create embedding for question',
embeddingResponse
);
const embeddingResponseObj = await openAiCall(
{ input: sanitizedQuery + aiResponse, model: 'text-embedding-ada-002' },
'embedding'
);

if (!embeddingResponseObj.ok) {
throw new ApplicationError('Failed to create embedding for question', {
data: embeddingResponseObj.status,
});
}

const embeddingResponse = await embeddingResponseObj.json();
const {
data: [{ embedding }],
}: CreateEmbeddingResponse = embeddingResponse.data;
}: CreateEmbeddingResponse = embeddingResponse;

const { error: matchError, data: pageSections } = await supabaseClient.rpc(
'match_page_sections_2',
Expand Down Expand Up @@ -196,33 +188,39 @@ export async function queryAi(

chatFullHistory = chatHistory;

const response = await openai.createChatCompletion({
model: 'gpt-3.5-turbo-16k',
messages: chatGptMessages,
temperature: 0,
stream: false,
});
const responseObj = await openAiCall(
{
model: 'gpt-3.5-turbo-16k',
messages: chatGptMessages,
temperature: 0,
stream: false,
},
'chatCompletion'
);

if (response.status !== 200) {
const error = response.data;
throw new ApplicationError('Failed to generate completion', error);
if (!responseObj.ok) {
throw new ApplicationError('Failed to generate completion', {
data: responseObj.status,
});
}

const response = await responseObj.json();

// Message asking to double-check
const callout: string =
'{% callout type="warning" title="Always double-check!" %}The results may not be accurate, so please always double check with our documentation.{% /callout %}\n';
// Append the warning message asking to double-check!
const message = [callout, getMessageFromResponse(response.data)].join('');
const message = [callout, getMessageFromResponse(response)].join('');

const responseWithoutBadLinks = await sanitizeLinksInResponse(message);

const sources = getListOfSources(pageSections);

totalTokensSoFar += response.data.usage?.total_tokens ?? 0;
totalTokensSoFar += response.usage?.total_tokens ?? 0;

return {
textResponse: responseWithoutBadLinks,
usage: response.data.usage as CreateCompletionResponseUsage,
usage: response.usage as CreateCompletionResponseUsage,
sources,
sourcesMarkdown: toMarkdownList(sources),
};
Expand Down
18 changes: 14 additions & 4 deletions nx-dev/data-access-ai/src/lib/utils.ts
Original file line number Diff line number Diff line change
Expand Up @@ -93,13 +93,9 @@ async function is404(url: string): Promise<boolean> {
}

export function checkEnvVariables(
openAiKey?: string,
supabaseUrl?: string,
supabaseServiceKey?: string
) {
if (!openAiKey) {
throw new ApplicationError('Missing environment variable NX_OPENAI_KEY');
}
if (!supabaseUrl) {
throw new ApplicationError(
'Missing environment variable NX_NEXT_PUBLIC_SUPABASE_URL'
Expand Down Expand Up @@ -211,3 +207,17 @@ export interface ChatItem {
role: ChatCompletionRequestMessageRoleEnum;
content: string;
}

/**
 * Sends an OpenAI request through the app's own `/api/openai-handler` route.
 *
 * The request is a JSON POST whose body has the shape `{ action, input }`.
 *
 * @param input - Request payload; its own enumerable properties are
 *   shallow-copied into the `input` field of the body.
 * @param action - Which OpenAI operation the handler should perform.
 * @returns The promise produced by `fetch`, passed through untouched — no
 *   status check or body parsing happens here.
 */
export function openAiCall(
  input: object,
  action: 'moderation' | 'embedding' | 'chatCompletion'
) {
  const payload = { action, input: { ...input } };
  const requestInit = {
    method: 'POST',
    headers: { 'Content-Type': 'application/json' },
    body: JSON.stringify(payload),
  };

  return fetch('/api/openai-handler', requestInit);
}
45 changes: 45 additions & 0 deletions nx-dev/nx-dev/pages/api/openai-handler.ts
Original file line number Diff line number Diff line change
@@ -0,0 +1,45 @@
import { NextRequest } from 'next/server';

// OpenAI API key, read from the NX_OPENAI_KEY environment variable when this
// module is evaluated; it is `undefined` when the variable is not set.
const openAiKey = process.env['NX_OPENAI_KEY'];
// Route-level configuration export for this API route.
// NOTE(review): `runtime: 'edge'` presumably opts the route into the Next.js
// Edge runtime, and Next.js is expected to read this export statically — keep
// it a plain object literal and confirm against the Next.js docs.
export const config = {
runtime: 'edge',
};

/**
 * API route that proxies a request to the OpenAI REST API so the API key is
 * attached here rather than by the caller.
 *
 * Expects a JSON body of the shape `{ action, input }`, where `action` selects
 * the OpenAI endpoint (`'embedding'`, `'chatCompletion'` or `'moderation'`)
 * and `input` is forwarded verbatim as the JSON body of the upstream request.
 *
 * @param request - Incoming request carrying the JSON payload.
 * @returns A JSON response mirroring the upstream status and body, or a
 *   plain-text error response:
 *   - 400 when the body is not valid JSON or `action` is not recognised;
 *   - 500 when the API key is not configured, or when the upstream call or
 *     the parsing of its response fails.
 */
export default async function handler(
  request: NextRequest
): Promise<Response> {
  let action: unknown;
  let input: unknown;
  try {
    // Destructuring inside the try also turns a `null` body into a 400
    // instead of an unhandled TypeError.
    ({ action, input } = await request.json());
  } catch {
    return new Response('Invalid JSON body', { status: 400 });
  }

  let apiUrl = 'https://api.openai.com/v1/';

  if (action === 'embedding') {
    apiUrl += 'embeddings';
  } else if (action === 'chatCompletion') {
    apiUrl += 'chat/completions';
  } else if (action === 'moderation') {
    apiUrl += 'moderations';
  } else {
    return new Response('Invalid action', { status: 400 });
  }

  // Fail fast instead of sending `Authorization: Bearer undefined` upstream.
  if (!openAiKey) {
    console.error('Missing environment variable NX_OPENAI_KEY');
    return new Response('OpenAI API key is not configured', { status: 500 });
  }

  try {
    const response = await fetch(apiUrl, {
      method: 'POST',
      headers: {
        Authorization: `Bearer ${openAiKey}`,
        'Content-Type': 'application/json',
      },
      body: JSON.stringify(input),
    });

    const responseData = await response.json();

    // Mirror the upstream status so callers can rely on `response.ok`.
    return new Response(JSON.stringify(responseData), {
      status: response.status,
      headers: {
        'content-type': 'application/json',
      },
    });
  } catch (e: unknown) {
    // A caught value is not guaranteed to be an Error; narrow before use.
    const message = e instanceof Error ? e.message : String(e);
    console.error('Error processing the request:', message);
    return new Response(message, { status: 500 });
  }
}

1 comment on commit bd76b62

@vercel
Copy link

@vercel vercel bot commented on bd76b62 Aug 24, 2023

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Successfully deployed to the following URLs:

nx-dev – ./

nx-dev-git-master-nrwl.vercel.app
nx.dev
nx-dev-nrwl.vercel.app
nx-five.vercel.app

Please sign in to comment.