Merge pull request #9 from corbt/sockets

Add streaming for normal text

Kyle Corbitt, 2023-07-03 22:32:57 -07:00 (committed by GitHub)
12 changed files with 1023 additions and 73 deletions

package.json

@@ -5,7 +5,9 @@
   "license": "Apache-2.0",
   "scripts": {
     "build": "next build",
-    "dev": "next dev",
+    "dev:next": "next dev",
+    "dev:wss": "pnpm tsx --watch src/wss-server.ts",
+    "dev": "concurrently --kill-others 'pnpm dev:next' 'pnpm dev:wss'",
     "postinstall": "prisma generate",
     "lint": "next lint",
     "start": "next start",
@@ -27,28 +29,35 @@
     "@trpc/next": "^10.26.0",
     "@trpc/react-query": "^10.26.0",
     "@trpc/server": "^10.26.0",
+    "concurrently": "^8.2.0",
+    "cors": "^2.8.5",
     "dayjs": "^1.11.8",
     "dotenv": "^16.3.1",
+    "express": "^4.18.2",
     "framer-motion": "^10.12.17",
     "json-stringify-pretty-compact": "^4.0.0",
     "lodash": "^4.17.21",
     "next": "^13.4.2",
     "next-auth": "^4.22.1",
     "nextjs-routes": "^2.0.1",
-    "openai": "^3.3.0",
+    "openai": "4.0.0-beta.2",
     "posthog-js": "^1.68.4",
     "react": "18.2.0",
     "react-dom": "18.2.0",
     "react-icons": "^4.10.1",
     "react-syntax-highlighter": "^15.5.0",
     "react-textarea-autosize": "^8.5.0",
+    "socket.io": "^4.7.1",
+    "socket.io-client": "^4.7.1",
     "superjson": "1.12.2",
     "tsx": "^3.12.7",
     "zod": "^3.21.4"
   },
   "devDependencies": {
     "@openapi-contrib/openapi-schema-to-json-schema": "^4.0.5",
+    "@types/cors": "^2.8.13",
     "@types/eslint": "^8.37.0",
+    "@types/express": "^4.17.17",
     "@types/lodash": "^4.14.195",
     "@types/node": "^18.16.0",
     "@types/react": "^18.2.6",

pnpm-lock.yaml (generated, 856 changed lines)

File diff suppressed because it is too large

OutputCell (component)

@@ -2,13 +2,16 @@ import { api } from "~/utils/api";
 import { type PromptVariant, type Scenario } from "./types";
 import { Spinner, Text, Box, Center, Flex, Icon } from "@chakra-ui/react";
 import { useExperiment } from "~/utils/hooks";
-import { type CreateChatCompletionResponse } from "openai";
 import SyntaxHighlighter from "react-syntax-highlighter";
 import { docco } from "react-syntax-highlighter/dist/cjs/styles/hljs";
 import stringify from "json-stringify-pretty-compact";
-import { type ReactElement } from "react";
+import { useMemo, type ReactElement } from "react";
 import { BsClock } from "react-icons/bs";
 import { type ModelOutput } from "@prisma/client";
+import { type ChatCompletion } from "openai/resources/chat";
+import { generateChannel } from "~/utils/generateChannel";
+import { isObject } from "lodash";
+import useSocket from "~/utils/useSocket";
 
 export default function OutputCell({
   scenario,
@@ -33,35 +36,52 @@ export default function OutputCell({
   if (variant.config === null || Object.keys(variant.config).length === 0)
     disabledReason = "Save your prompt variant to see output";
 
+  const shouldStream =
+    isObject(variant) &&
+    "config" in variant &&
+    isObject(variant.config) &&
+    "stream" in variant.config &&
+    variant.config.stream === true;
+
+  const channel = useMemo(() => {
+    if (!shouldStream) return;
+    return generateChannel();
+  }, [shouldStream]);
+
   const output = api.outputs.get.useQuery(
     {
       scenarioId: scenario.id,
       variantId: variant.id,
+      channel,
     },
     { enabled: disabledReason === null }
   );
 
+  // Disconnect from socket if we're not streaming anymore
+  const streamedMessage = useSocket(output.isLoading ? channel : undefined);
+  const streamedContent = streamedMessage?.choices?.[0]?.message?.content;
+
   if (!vars) return null;
 
   if (disabledReason) return <Text color="gray.500">{disabledReason}</Text>;
 
-  if (output.isLoading)
+  if (output.isLoading && !streamedMessage)
     return (
       <Center h="100%" w="100%">
         <Spinner />
       </Center>
     );
 
-  if (!output.data) return <Text color="gray.500">Error retrieving output</Text>;
+  if (!output.data && !output.isLoading)
+    return <Text color="gray.500">Error retrieving output</Text>;
 
-  if (output.data.errorMessage) {
+  if (output.data && output.data.errorMessage) {
     return <Text color="red.600">Error: {output.data.errorMessage}</Text>;
   }
 
-  const response = output.data?.output as unknown as CreateChatCompletionResponse;
+  const response = output.data?.output as unknown as ChatCompletion;
   const message = response?.choices?.[0]?.message;
 
-  if (message?.function_call) {
+  if (output.data && message?.function_call) {
     const rawArgs = message.function_call.arguments ?? "null";
     let parsedArgs: string;
     try {
@@ -94,10 +114,12 @@ export default function OutputCell({
     );
   }
 
+  const contentToDisplay = message?.content ?? streamedContent ?? JSON.stringify(output.data?.output);
+
   return (
     <Flex w="100%" h="100%" direction="column" justifyContent="space-between" whiteSpace="pre-wrap">
-      {message?.content ?? JSON.stringify(output.data.output)}
-      <OutputStats modelOutput={output.data} />
+      {contentToDisplay}
+      {output.data && <OutputStats modelOutput={output.data} />}
     </Flex>
   );
 }

src/env.mjs

@@ -24,6 +24,7 @@ export const env = createEnv({
       .optional()
       .default("false")
       .transform((val) => val.toLowerCase() === "true"),
+    NEXT_PUBLIC_SOCKET_URL: z.string().url().default("http://localhost:3318"),
   },
 
   /**
@@ -36,6 +37,7 @@ export const env = createEnv({
     OPENAI_API_KEY: process.env.OPENAI_API_KEY,
     NEXT_PUBLIC_POSTHOG_KEY: process.env.NEXT_PUBLIC_POSTHOG_KEY,
     NEXT_PUBLIC_IS_PUBLIC_PLAYGROUND: process.env.NEXT_PUBLIC_IS_PUBLIC_PLAYGROUND,
+    NEXT_PUBLIC_SOCKET_URL: process.env.NEXT_PUBLIC_SOCKET_URL,
   },
 
   /**
    * Run `build` or `dev` with `SKIP_ENV_VALIDATION` to skip env validation.

autogenerateScenarioValues (server)

@@ -1,4 +1,5 @@
-import { type CreateChatCompletionRequest } from "openai";
+import { type CompletionCreateParams } from "openai/resources/chat";
 import { prisma } from "../db";
 import { openai } from "../utils/openai";
 import { pick } from "lodash";
@@ -62,7 +63,7 @@ export const autogenerateScenarioValues = async (
   if (!experiment || !(variables?.length > 0) || !prompt) return {};
 
-  const messages: CreateChatCompletionRequest["messages"] = [
+  const messages: CompletionCreateParams.CreateChatCompletionRequestNonStreaming["messages"] = [
     {
       role: "system",
       content:
@@ -90,7 +91,6 @@ export const autogenerateScenarioValues = async (
     .forEach((vals) => {
       messages.push({
         role: "assistant",
-        // @ts-expect-error the openai type definition is wrong, the content field is required
        content: null,
        function_call: {
          name: "add_scenario",
@@ -105,7 +105,7 @@ export const autogenerateScenarioValues = async (
   }, {} as Record<string, { type: "string" }>);
 
   try {
-    const completion = await openai.createChatCompletion({
+    const completion = await openai.chat.completions.create({
       model: "gpt-3.5-turbo-0613",
       messages,
       functions: [
@@ -123,7 +123,7 @@ export const autogenerateScenarioValues = async (
     });
     const parsed = JSON.parse(
-      completion.data.choices[0]?.message?.function_call?.arguments ?? "{}"
+      completion.choices[0]?.message?.function_call?.arguments ?? "{}"
     ) as Record<string, string>;
     return parsed;
   } catch (e) {

modelOutputsRouter (server)

@@ -12,7 +12,7 @@ env;
 export const modelOutputsRouter = createTRPCRouter({
   get: publicProcedure
-    .input(z.object({ scenarioId: z.string(), variantId: z.string() }))
+    .input(z.object({ scenarioId: z.string(), variantId: z.string(), channel: z.string().optional() }))
     .query(async ({ input }) => {
       const existing = await prisma.modelOutput.findUnique({
         where: {
@@ -64,7 +64,7 @@
         timeToComplete: existingResponse.timeToComplete,
       };
     } else {
-      modelResponse = await getChatCompletion(filledTemplate, env.OPENAI_API_KEY);
+      modelResponse = await getChatCompletion(filledTemplate, env.OPENAI_API_KEY, input.channel);
     }
 
     const modelOutput = await prisma.modelOutput.create({

getChatCompletion (server)

@@ -1,6 +1,10 @@
+/* eslint-disable @typescript-eslint/no-unsafe-call */
 import { isObject } from "lodash";
 import { type JSONSerializable } from "../types";
 import { Prisma } from "@prisma/client";
+import { streamChatCompletion } from "./openai";
+import { wsConnection } from "~/utils/wsConnection";
+import { type ChatCompletion, type CompletionCreateParams } from "openai/resources/chat";
 
 type CompletionResponse = {
   output: Prisma.InputJsonValue | typeof Prisma.JsonNull;
@@ -11,7 +15,8 @@ type CompletionResponse = {
 export async function getChatCompletion(
   payload: JSONSerializable,
-  apiKey: string
+  apiKey: string,
+  channel?: string,
 ): Promise<CompletionResponse> {
   const start = Date.now();
   const response = await fetch("https://api.openai.com/v1/chat/completions", {
@@ -31,8 +36,21 @@
   };
 
   try {
+    if (channel) {
+      const completion = streamChatCompletion(payload as unknown as CompletionCreateParams);
+      let finalOutput: ChatCompletion | null = null;
+      await (async () => {
+        for await (const partialCompletion of completion) {
+          finalOutput = partialCompletion;
+          wsConnection.emit("message", { channel, payload: partialCompletion });
+        }
+      })().catch((err) => console.error(err));
+      resp.output = finalOutput as unknown as Prisma.InputJsonValue;
+      resp.timeToComplete = Date.now() - start;
+    } else {
       resp.timeToComplete = Date.now() - start;
       resp.output = await response.json();
+    }
 
     if (!response.ok) {
       // If it's an object, try to get the error message

utils/openai.ts

@@ -1,8 +1,59 @@
-import { Configuration, OpenAIApi } from "openai";
+import { omit } from "lodash";
 import { env } from "~/env.mjs";
+import OpenAI from "openai";
+import { type ChatCompletion, type ChatCompletionChunk, type CompletionCreateParams } from "openai/resources/chat";
 
-const configuration = new Configuration({
-  apiKey: env.OPENAI_API_KEY,
-});
-export const openai = new OpenAIApi(configuration);
+// console.log("creating openai client");
+export const openai = new OpenAI({ apiKey: env.OPENAI_API_KEY });
+
+export const mergeStreamedChunks = (
+  base: ChatCompletion | null,
+  chunk: ChatCompletionChunk
+): ChatCompletion => {
+  if (base === null) {
+    return mergeStreamedChunks({ ...chunk, choices: [] }, chunk);
+  }
+
+  const choices = [...base.choices];
+  for (const choice of chunk.choices) {
+    const baseChoice = choices.find((c) => c.index === choice.index);
+    if (baseChoice) {
+      baseChoice.finish_reason = choice.finish_reason ?? baseChoice.finish_reason;
+      baseChoice.message = baseChoice.message ?? { role: "assistant" };
+
+      if (choice.delta?.content)
+        baseChoice.message.content =
+          (baseChoice.message.content as string ?? "") + (choice.delta.content ?? "");
+      if (choice.delta?.function_call) {
+        const fnCall = baseChoice.message.function_call ?? {};
+        fnCall.name = (fnCall.name as string ?? "") + (choice.delta.function_call.name as string ?? "");
+        fnCall.arguments =
+          (fnCall.arguments as string ?? "") + (choice.delta.function_call.arguments as string ?? "");
+      }
+    } else {
+      choices.push({ ...omit(choice, "delta"), message: { role: "assistant", ...choice.delta } });
+    }
+  }
+
+  const merged: ChatCompletion = {
+    ...base,
+    choices,
+  };
+
+  return merged;
+};
+
+export const streamChatCompletion = async function* (body: CompletionCreateParams) {
+  // eslint-disable-next-line @typescript-eslint/no-unsafe-call
+  const resp = await openai.chat.completions.create({
+    ...body,
+    stream: true,
+  });
+
+  let mergedChunks: ChatCompletion | null = null;
+  for await (const part of resp) {
+    mergedChunks = mergeStreamedChunks(mergedChunks, part);
+    yield mergedChunks;
+  }
+};
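
For illustration, here is how mergeStreamedChunks folds a stream of deltas into a single completion. This is a minimal sketch: the two chunks below are invented examples in the shape the beta SDK streams back, not captured API output, and the import path is assumed.

import { mergeStreamedChunks } from "./openai"; // assumed module path
import { type ChatCompletionChunk } from "openai/resources/chat";

// Invented chunk 1: the first delta carries the role and "Hel".
const first = {
  id: "chatcmpl-example",
  object: "chat.completion.chunk",
  created: 0,
  model: "gpt-3.5-turbo-0613",
  choices: [{ index: 0, delta: { role: "assistant", content: "Hel" }, finish_reason: null }],
} as unknown as ChatCompletionChunk;

// Invented chunk 2: the second delta carries "lo" and the finish_reason.
const second = {
  ...first,
  choices: [{ index: 0, delta: { content: "lo" }, finish_reason: "stop" }],
} as unknown as ChatCompletionChunk;

let merged = mergeStreamedChunks(null, first);  // choices[0].message.content === "Hel"
merged = mergeStreamedChunks(merged, second);   // content === "Hello", finish_reason === "stop"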

src/utils/generateChannel.ts

@@ -0,0 +1,5 @@
+// generate random channel id
+export const generateChannel = () => {
+  return Math.random().toString(36).substring(2, 15) + Math.random().toString(36).substring(2, 15);
+};
+

src/utils/useSocket.ts (new file, 41 lines)

@@ -0,0 +1,41 @@
+import { type ChatCompletion } from "openai/resources/chat";
+import { useRef, useState, useEffect } from "react";
+import { io, type Socket } from "socket.io-client";
+import { env } from "~/env.mjs";
+
+const url = env.NEXT_PUBLIC_SOCKET_URL;
+
+export default function useSocket(channel?: string) {
+  const socketRef = useRef<Socket>();
+  const [message, setMessage] = useState<ChatCompletion | null>(null);
+
+  useEffect(() => {
+    // Create websocket connection
+    socketRef.current = io(url);
+
+    socketRef.current.on("connect", () => {
+      // Join the specific room
+      if (channel) {
+        socketRef.current?.emit("join", channel);
+
+        // Listen for 'message' events
+        socketRef.current?.on("message", (message: ChatCompletion) => {
+          setMessage(message);
+        });
+      }
+    });
+
+    // Unsubscribe and disconnect on cleanup
+    return () => {
+      if (socketRef.current) {
+        if (channel) {
+          socketRef.current.off("message");
+        }
+        socketRef.current.disconnect();
+      }
+      setMessage(null);
+    };
+  }, [channel]);
+
+  return message;
+}

src/utils/wsConnection.ts

@@ -0,0 +1,4 @@
+import { io } from "socket.io-client";
+import { env } from "~/env.mjs";
+
+export const wsConnection = io(env.NEXT_PUBLIC_SOCKET_URL);

src/wss-server.ts (new file, 36 lines)

@@ -0,0 +1,36 @@
+import "dotenv/config";
+import express from "express";
+import { createServer } from "http";
+import { Server } from "socket.io";
+import { env } from "./env.mjs";
+import cors from "cors";
+
+// Get the port from SOCKET_URL
+const port = env.NEXT_PUBLIC_SOCKET_URL?.split(":")[2] || 3318;
+
+const app = express();
+app.use(cors());
+
+const server = createServer(app);
+const io = new Server(server, {
+  cors: {
+    origin: "*",
+    methods: ["GET", "POST"],
+  },
+});
+
+io.on("connection", (socket) => {
+  // Listen to 'join' event to add this socket to a specific room.
+  socket.on("join", (room: string) => {
+    socket.join(room)?.catch((err) => console.log(err));
+  });
+
+  // When a 'message' event is received, emit it to the room specified
+  socket.on("message", (msg: { channel: string; payload: any }) => {
+    socket.to(msg.channel).emit("message", msg.payload);
+  });
+});
+
+server.listen(port, () => {
+  console.log(`listening on *:${port}`);
+});
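
Putting the pieces together: the Next.js server produces partial completions and relays them through this socket server to the browser. A minimal sketch of that flow, assuming both sides use the default http://localhost:3318 and with an invented channel id and payload:

import { io } from "socket.io-client";

const channel = "example-channel"; // invented; the app uses generateChannel()

// Consumer (browser, as in useSocket): join the room, then listen for messages.
const consumer = io("http://localhost:3318");
consumer.on("connect", () => {
  consumer.emit("join", channel);
  consumer.on("message", (payload) => {
    console.log("partial completion:", payload);
  });
});

// Producer (Next.js server, as in getChatCompletion via wsConnection): emit each
// partial completion into the channel. The consumer must join before these emits
// arrive; in the app that holds because the client generates the channel id and
// sends it with the query that kicks off the completion.
const producer = io("http://localhost:3318");
producer.emit("message", { channel, payload: { choices: [] } }); // invented payload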