fix: ai endpoint issues and docs (#3503)

* fix: ai endpoint issues and docs * chore: better error logging * chore: let it crash so i can see logs again * chore: maybe? * fix: use enhanced ai endpoint code from supabase example * chore: more fixes * chore: add two more env vars for ai endpoint * fix: ts * fix: eslint * fix: prompt * chore: pr fixes --------- Co-authored-by: Si Taggart <[email protected]>
twilio-labs · Sep 29, 2023 · b49762c · b49762c
1 parent 0d1ccef
commit b49762c
Show file tree

Hide file tree

Showing 4 changed files with 499 additions and 558 deletions.
diff --git a/internal-docs/engineering/environment-variables.md b/internal-docs/engineering/environment-variables.md
@@ -26,4 +26,8 @@ Full list of Environment variables and where they are needed.
 | CYPRESS_RECORD_KEY                 | Cypress record key so we can record our cypress runs                  | ✅    | ✅         |               |               |
 | PERCY_TOKEN                        | Percy.io token                                                        | ✅    | ✅         |               |               |
 | USE_CYPRESS_VRT                    | Key to enable the cypress vrt integration                             | ✅    |            |               |               |
-| NX_CLOUD_ACCESS_TOKEN             | Token to enable nx cloud cache for builds                             | ✅    | ✅         | ✅            | ✅            |
+| NX_CLOUD_ACCESS_TOKEN              | Token to enable nx cloud cache for builds                             | ✅    | ✅         | ✅            | ✅            |
+| OPENAI_API_KET                     | ChatGPT4 API Key                                                      | ✅    |            | ✅            |               |
+| OPENAI_API_SECRET                  | To prevent unauthorized usage of OpenAI                               | ✅    |            | ✅            |               |
+| SUPABASE_URL                       | Supabase API url                                                      | ✅    |            | ✅            |               |
+| SUPABASE_KEY                       | API Key to query supabase db                                          | ✅    |            | ✅            |               |
diff --git a/packages/paste-website/package.json b/packages/paste-website/package.json
@@ -27,6 +27,7 @@
     "@next/bundle-analyzer": "^13.1.6",
     "@next/mdx": "^13.1.6",
     "@sparticuz/chromium": "^110.0.0",
+    "@supabase/supabase-js": "^2.36.0",
     "@twilio-paste/account-switcher": "^2.0.1",
     "@twilio-paste/alert": "^14.0.0",
     "@twilio-paste/alert-dialog": "^9.1.0",
@@ -133,20 +134,23 @@
     "@types/gtag.js": "^0.0.12",
     "@types/lodash": "^4.14.182",
     "@types/mdx-js__react": "^1.5.5",
+    "ai": "^2.2.13",
     "airtable": "^0.11.6",
     "color": "^3.1.2",
+    "common-tags": "^1.8.2",
     "date-fns": "2.21.3",
     "deepmerge": "4.2.2",
     "dotenv": "^16.0.0",
     "globby-esm": "npm:globby@^13.1.3",
+    "gpt3-tokenizer": "^1.1.5",
     "highcharts": "^9.3.3",
     "highcharts-react-official": "^3.1.0",
-    "langchain": "^0.0.151",
     "lodash": "4.17.21",
     "lottie-web": "^5.7.4",
     "markdown-to-jsx": "^7.3.2",
     "mdast-util-to-string": "^3.1.1",
     "next": "^13.1.6",
+    "openai-edge": "^1.2.2",
     "pretty-format": "^28.1.0",
     "prism-react-renderer": "^1.3.5",
     "puppeteer-core": "^19.6.1",

diff --git a/packages/paste-website/src/pages/api/ai.ts b/packages/paste-website/src/pages/api/ai.ts
@@ -1,80 +1,224 @@
+/* eslint-disable max-classes-per-file */
 /**
  * API endpoint for querying our doc site with ChatGPT4
+ * Copied from Supabase article.
+ * https://supabase.com/blog/chatgpt-supabase-docs
  *
- * Requires two environment variables:
+ * Requires four environment variables:
  * - OPENAI_API_KEY: Your OpenAI API key
  * - OPENAI_API_SECRET: Custom secret to block unauthorized requests
+ * - SUPABASE_URL: Url to your Supabase project
+ * - SUPABASE_KEY: Service role key for your Supabase project
  *
  * Please set these in your .env file and on your deployment boxes configuration.
  */
-import {fileURLToPath} from 'url';
-import path from 'path';
-
-import {loadQAStuffChain} from 'langchain/chains';
-import {OpenAIEmbeddings} from 'langchain/embeddings/openai';
-import {ChatOpenAI} from 'langchain/chat_models/openai';
-import {FaissStore} from 'langchain/vectorstores/faiss';
-import type {NextApiRequest, NextApiResponse} from 'next';
-
-export default async function handler(req: NextApiRequest, res: NextApiResponse): Promise<void> {
-  const {question, secret} = req.body;
-  // Exit early if the required params aren't provided
-  if (!question || secret !== process.env.OPENAI_API_SECRET) {
-    res.status(200).send({answer: 'Please provide a question'});
-    return;
+import type {NextRequest} from 'next/server';
+import {createClient} from '@supabase/supabase-js';
+// @ts-expect-error not typed
+import {codeBlock, oneLine} from 'common-tags';
+import GPT3Tokenizer from 'gpt3-tokenizer';
+import {
+  Configuration,
+  OpenAIApi,
+  type CreateModerationResponse,
+  type CreateEmbeddingResponse,
+  type ChatCompletionRequestMessage,
+} from 'openai-edge';
+import {OpenAIStream, StreamingTextResponse} from 'ai';
+
+class ApplicationError extends Error {
+  // eslint-disable-next-line @typescript-eslint/no-parameter-properties
+  constructor(message: string, public data: Record<string, any> = {}) {
+    super(message);
   }
+}
+class UserError extends ApplicationError {}
+
+const openAiKey = process.env.OPENAI_API_KEY;
+const openAiSecret = process.env.OPENAI_API_SECRET;
+const supabaseUrl = process.env.SUPABASE_URL;
+const supabaseServiceKey = process.env.SUPABASE_KEY;
 
-  /*
-   * Get the FAISS DB
-   */
-  const __filename = fileURLToPath(import.meta.url);
-  const __dirname = path.dirname(__filename);
-  const directory = path.join(__dirname, '../../../indexes/faiss_index');
-  const loadedVectorStore = await FaissStore.loadFromPython(directory, new OpenAIEmbeddings());
-
-  /*
-   * Create the OpenAI model
-   */
-  const model = new ChatOpenAI({
-    modelName: 'gpt-4',
-    temperature: 0,
-  });
-
-  /*
-   * Create the QA stuff chain from our GPT-4 model
-   */
-  const stuffChain = loadQAStuffChain(model);
+const config = new Configuration({
+  apiKey: openAiKey,
+});
+const openai = new OpenAIApi(config);
 
+export const runtime = 'edge';
+
+export default async function handler(req: NextRequest): Promise<void | Response> {
   try {
-    /*
-     * We cannot provide GPT-4 with our entire doc site. For this reason we use the FAISS DB.
-     * This DB is a compressed vector db that allows us to search for similar "documents"
-     * based on a provided question string. We take the top 4 results and provide them to
-     * GPT-4 for further processing.
-     */
-    const inputDocuments = await loadedVectorStore.similaritySearch(question, 4);
-
-    /*
-     * Ask GPT-4 the question and provide the input documents
-     */
-    const answer = await stuffChain.call({
+    if (!openAiKey) {
+      throw new ApplicationError('Missing environment variable OPENAI_API_KEY');
+    }
+    if (!openAiSecret) {
+      throw new ApplicationError('Missing environment variable OPENAI_API_SECRET');
+    }
+
+    if (!supabaseUrl) {
+      throw new ApplicationError('Missing environment variable SUPABASE_URL');
+    }
+
+    if (!supabaseServiceKey) {
+      throw new ApplicationError('Missing environment variable SUPABASE_KEY');
+    }
+
+    const requestData = await req.json();
+
+    if (!requestData) {
+      throw new UserError('Missing request data');
+    }
+
+    const {prompt: query, secret} = requestData;
+
+    if (!secret || secret !== openAiSecret) {
+      throw new UserError("Incorrect 'secret' in request data");
+    }
+
+    if (!query) {
+      throw new UserError("Missing 'prompt' in request data");
+    }
+
+    const supabaseClient = createClient(supabaseUrl, supabaseServiceKey);
+
+    // Moderate the content to comply with OpenAI T&C
+    const sanitizedQuery = query.trim();
+    const moderationResponse: CreateModerationResponse = await openai
+      .createModeration({input: sanitizedQuery})
+      .then((res: any) => res.json());
+
+    // @ts-expect-error this is a bug in the types
+    if (moderationResponse.error) {
+      // @ts-expect-error this is a bug in the types
+      throw new ApplicationError('Failed to moderate content', moderationResponse.error.message);
+    }
+    const [results] = moderationResponse.results;
+
+    if (results.flagged) {
+      throw new UserError('Flagged content', {
+        flagged: true,
+        categories: results.categories,
+      });
+    }
+
+    // Create embedding from query
+    const embeddingResponse = await openai.createEmbedding({
+      model: 'text-embedding-ada-002',
+      input: sanitizedQuery.replaceAll('\n', ' '),
+    });
+
+    if (embeddingResponse.status !== 200) {
+      throw new ApplicationError('Failed to create embedding for question', embeddingResponse);
+    }
+
+    const {
+      data: [{embedding}],
+    }: CreateEmbeddingResponse = await embeddingResponse.json();
+
+    const {error: matchError, data: pageSections} = await supabaseClient.rpc('match_page_sections', {
+      embedding,
+      /* eslint-disable camelcase */
+      match_threshold: 0.78,
+      match_count: 10,
+      min_content_length: 50,
+      /* eslint-enable camelcase */
+    });
+
+    if (matchError) {
+      throw new ApplicationError('Failed to match page sections', matchError);
+    }
+
+    const tokenizer = new GPT3Tokenizer({type: 'gpt3'});
+    let tokenCount = 0;
+    let contextText = '';
+
+    // eslint-disable-next-line unicorn/no-for-loop
+    for (const {content} of pageSections) {
+      const encoded = tokenizer.encode(content);
+      tokenCount += encoded.text.length;
+
+      if (tokenCount >= 1500) {
+        break;
+      }
+
+      contextText += `${content.trim()}\n---\n`;
+    }
+
+    const prompt = codeBlock`
+      ${oneLine`
+        You are a very enthusiastic Paste design system representative who loves
+        to help people! Given the following sections from the Paste
+        documentation, answer the question using only that information,
+        outputted in markdown format. If you are unsure and the answer
+        is not explicitly written in the documentation, say
+        "Sorry, I don't know how to help with that."
+      `}
+
+      Context sections:
+      ${contextText}
+
+      Question: """
+      ${sanitizedQuery}
+      """
+
+      Answer as markdown (including related code snippets if available):
+    `;
+
+    const chatMessage: ChatCompletionRequestMessage = {
+      role: 'user',
+      content: prompt,
+    };
+
+    const response = await openai.createChatCompletion({
+      model: 'gpt-4',
+      messages: [chatMessage],
       // eslint-disable-next-line camelcase
-      input_documents: inputDocuments,
-      question,
+      max_tokens: 512,
+      temperature: 0,
+      stream: true,
     });
 
-    res.status(200).send({answer});
-  } catch (error) {
-    res.status(500).send({error});
+    if (!response.ok) {
+      const error = await response.json();
+      throw new ApplicationError('Failed to generate completion', error);
+    }
+
+    // Transform the response into a readable stream
+    const stream = OpenAIStream(response);
+
+    // Return a StreamingTextResponse, which can be consumed by the client
+    return new StreamingTextResponse(stream);
+  } catch (error: unknown) {
+    if (error instanceof UserError) {
+      return new Response(
+        JSON.stringify({
+          error: error.message,
+          data: error.data,
+        }),
+        {
+          status: 400,
+          headers: {'Content-Type': 'application/json'},
+        }
+      );
+    } else if (error instanceof ApplicationError) {
+      // Print out application errors with their additional data
+      // eslint-disable-next-line no-console
+      console.error(`${error.message}: ${JSON.stringify(error.data)}`);
+    } else {
+      // Print out unexpected errors as is to help with debugging
+      // eslint-disable-next-line no-console
+      console.error(error);
+    }
+
+    return new Response(
+      JSON.stringify({
+        error: 'There was an error processing your request',
+      }),
+      {
+        status: 500,
+        headers: {'Content-Type': 'application/json'},
+      }
+    );
   }
 }
-
-export const config = {
-  api: {
-    bodyParser: {
-      sizeLimit: '10kb',
-    },
-  },
-  // Specifies the maximum allowed duration for this function to execute (in seconds)
-  maxDuration: 15,
-};
+/* eslint-enable max-classes-per-file */