Compare commits
15 Commits
proj-styli
...
project-me
| Author | SHA1 | Date | |
|---|---|---|---|
|
|
4e176088e9 | ||
|
|
3cec1f7786 | ||
|
|
81fbaeae44 | ||
|
|
b3d8f96fa8 | ||
|
|
5277afa199 | ||
|
|
54d97ddfa8 | ||
|
|
1f8e3b820f | ||
|
|
76c34d64e6 | ||
|
|
454ac9a0d3 | ||
|
|
5ed7adadf9 | ||
|
|
b8e0f392ab | ||
|
|
b2af83341d | ||
|
|
e6d229d5f9 | ||
|
|
1a6ae3aef7 | ||
|
|
6c060c6ea0 |
@@ -65,7 +65,14 @@ OpenPipe includes a tool to generate new test scenarios based on your existing p
|
|||||||
4. Clone this repository: `git clone https://github.com/openpipe/openpipe`
|
4. Clone this repository: `git clone https://github.com/openpipe/openpipe`
|
||||||
5. Install the dependencies: `cd openpipe && pnpm install`
|
5. Install the dependencies: `cd openpipe && pnpm install`
|
||||||
6. Create a `.env` file (`cp .env.example .env`) and enter your `OPENAI_API_KEY`.
|
6. Create a `.env` file (`cp .env.example .env`) and enter your `OPENAI_API_KEY`.
|
||||||
7. Update `DATABASE_URL` if necessary to point to your Postgres instance and run `pnpm prisma db push` to create the database.
|
7. Update `DATABASE_URL` if necessary to point to your Postgres instance and run `pnpm prisma migrate dev` to create the database.
|
||||||
8. Create a [GitHub OAuth App](https://docs.github.com/en/apps/oauth-apps/building-oauth-apps/creating-an-oauth-app) and update the `GITHUB_CLIENT_ID` and `GITHUB_CLIENT_SECRET` values. (Note: a PR to make auth optional when running locally would be a great contribution!)
|
8. Create a [GitHub OAuth App](https://docs.github.com/en/apps/oauth-apps/building-oauth-apps/creating-an-oauth-app) and update the `GITHUB_CLIENT_ID` and `GITHUB_CLIENT_SECRET` values. (Note: a PR to make auth optional when running locally would be a great contribution!)
|
||||||
9. Start the app: `pnpm dev`.
|
9. Start the app: `pnpm dev`.
|
||||||
10. Navigate to [http://localhost:3000](http://localhost:3000)
|
10. Navigate to [http://localhost:3000](http://localhost:3000)
|
||||||
|
|
||||||
|
## Testing Locally
|
||||||
|
|
||||||
|
1. Copy your `.env` file to `.env.test`.
|
||||||
|
2. Update the `DATABASE_URL` to have a different database name than your development one.
|
||||||
|
3. Run `DATABASE_URL=[your new database url] pnpm prisma migrate dev --skip-seed --skip-generate`
|
||||||
|
4. Run `pnpm test`
|
||||||
1
app/.gitignore
vendored
@@ -34,6 +34,7 @@ yarn-error.log*
|
|||||||
# do not commit any .env files to git, except for the .env.example file. https://create.t3.gg/en/usage/env-variables#using-environment-variables
|
# do not commit any .env files to git, except for the .env.example file. https://create.t3.gg/en/usage/env-variables#using-environment-variables
|
||||||
.env
|
.env
|
||||||
.env*.local
|
.env*.local
|
||||||
|
.env.test
|
||||||
|
|
||||||
# vercel
|
# vercel
|
||||||
.vercel
|
.vercel
|
||||||
|
|||||||
@@ -19,7 +19,7 @@
|
|||||||
"codegen": "tsx src/server/scripts/client-codegen.ts",
|
"codegen": "tsx src/server/scripts/client-codegen.ts",
|
||||||
"seed": "tsx prisma/seed.ts",
|
"seed": "tsx prisma/seed.ts",
|
||||||
"check": "concurrently 'pnpm lint' 'pnpm tsc' 'pnpm prettier . --check'",
|
"check": "concurrently 'pnpm lint' 'pnpm tsc' 'pnpm prettier . --check'",
|
||||||
"test": "pnpm vitest --no-threads"
|
"test": "pnpm vitest"
|
||||||
},
|
},
|
||||||
"dependencies": {
|
"dependencies": {
|
||||||
"@anthropic-ai/sdk": "^0.5.8",
|
"@anthropic-ai/sdk": "^0.5.8",
|
||||||
|
|||||||
@@ -0,0 +1 @@
|
|||||||
|
CREATE EXTENSION IF NOT EXISTS "uuid-ossp";
|
||||||
@@ -0,0 +1,15 @@
|
|||||||
|
/*
|
||||||
|
Warnings:
|
||||||
|
|
||||||
|
- You are about to rename the column `completionTokens` to `outputTokens` on the `ModelResponse` table.
|
||||||
|
- You are about to rename the column `promptTokens` to `inputTokens` on the `ModelResponse` table.
|
||||||
|
|
||||||
|
*/
|
||||||
|
|
||||||
|
-- Rename completionTokens to outputTokens
|
||||||
|
ALTER TABLE "ModelResponse"
|
||||||
|
RENAME COLUMN "completionTokens" TO "outputTokens";
|
||||||
|
|
||||||
|
-- Rename promptTokens to inputTokens
|
||||||
|
ALTER TABLE "ModelResponse"
|
||||||
|
RENAME COLUMN "promptTokens" TO "inputTokens";
|
||||||
@@ -117,8 +117,8 @@ model ModelResponse {
|
|||||||
receivedAt DateTime?
|
receivedAt DateTime?
|
||||||
output Json?
|
output Json?
|
||||||
cost Float?
|
cost Float?
|
||||||
promptTokens Int?
|
inputTokens Int?
|
||||||
completionTokens Int?
|
outputTokens Int?
|
||||||
statusCode Int?
|
statusCode Int?
|
||||||
errorMessage String?
|
errorMessage String?
|
||||||
retryTime DateTime?
|
retryTime DateTime?
|
||||||
|
|||||||
|
Before Width: | Height: | Size: 15 KiB After Width: | Height: | Size: 15 KiB |
|
Before Width: | Height: | Size: 6.8 KiB After Width: | Height: | Size: 6.1 KiB |
|
Before Width: | Height: | Size: 22 KiB After Width: | Height: | Size: 49 KiB |
|
Before Width: | Height: | Size: 6.1 KiB After Width: | Height: | Size: 5.3 KiB |
|
Before Width: | Height: | Size: 704 B After Width: | Height: | Size: 800 B |
|
Before Width: | Height: | Size: 1.1 KiB After Width: | Height: | Size: 1.3 KiB |
|
Before Width: | Height: | Size: 15 KiB After Width: | Height: | Size: 15 KiB |
|
Before Width: | Height: | Size: 3.0 KiB After Width: | Height: | Size: 3.4 KiB |
@@ -9,10 +9,9 @@ Created by potrace 1.14, written by Peter Selinger 2001-2017
|
|||||||
</metadata>
|
</metadata>
|
||||||
<g transform="translate(0.000000,550.000000) scale(0.100000,-0.100000)"
|
<g transform="translate(0.000000,550.000000) scale(0.100000,-0.100000)"
|
||||||
fill="#000000" stroke="none">
|
fill="#000000" stroke="none">
|
||||||
<path d="M813 5478 c-18 -13 -37 -36 -43 -52 -6 -19 -10 -236 -10 -603 0 -638
|
<path d="M785 5474 l-25 -27 0 -622 0 -622 25 -27 24 -26 171 0 170 0 0 -2050
|
||||||
-1 -626 65 -657 25 -12 67 -16 179 -16 l146 0 0 -2032 0 -2032 23 -33 c12 -18
|
0 -2051 25 -25 24 -24 1557 2 1556 3 19 24 c19 23 19 70 19 2072 l0 2049 169
|
||||||
35 -37 51 -43 19 -7 539 -10 1528 -10 1663 0 1549 -5 1582 65 14 30 16 235 16
|
0 c165 0 169 1 195 25 l26 24 0 626 0 626 -26 24 -27 25 -1939 0 -1939 0 -24
|
||||||
2059 l0 2026 156 0 156 0 39 39 39 39 0 587 c0 651 1 638 -65 669 -30 14 -223
|
-26z"/>
|
||||||
16 -1932 16 l-1898 0 -32 -22z"/>
|
|
||||||
</g>
|
</g>
|
||||||
</svg>
|
</svg>
|
||||||
|
|||||||
|
Before Width: | Height: | Size: 858 B After Width: | Height: | Size: 755 B |
@@ -1,5 +1,28 @@
|
|||||||
<svg width="380" height="320" viewBox="0 0 380 320" fill="none" xmlns="http://www.w3.org/2000/svg">
|
<svg width="398" height="550" viewBox="0 0 398 550" fill="none" xmlns="http://www.w3.org/2000/svg">
|
||||||
<path d="M72 320L122.5 231L130.5 150.5L115 73L72 0H312L265 64.5L257 158.5L265 249L312 320H72Z" fill="#FF5733"/>
|
<path d="M39 125H359V542C359 546.418 355.418 550 351 550H47C42.5817 550 39 546.418 39 542V125Z" fill="black"/>
|
||||||
<path d="M67.027 9.5C72.9909 9.5 79.5196 12.3449 86.3672 19.2588C93.2495 26.2075 99.8845 36.7468 105.66 50.5336C117.194 78.0671 124.554 116.764 124.554 160C124.554 203.236 117.194 241.933 105.66 269.466C99.8845 283.253 93.2495 293.793 86.3672 300.741C79.5196 307.655 72.9909 310.5 67.027 310.5C61.0632 310.5 54.5345 307.655 47.6868 300.741C40.8045 293.793 34.1695 283.253 28.394 269.466C16.8596 241.933 9.5 203.236 9.5 160C9.5 116.764 16.8596 78.0671 28.394 50.5336C34.1695 36.7468 40.8045 26.2075 47.6868 19.2588C54.5345 12.3449 61.0632 9.5 67.027 9.5Z" stroke="#FF5733" stroke-width="19"/>
|
<path d="M0 8C0 3.58172 3.58172 0 8 0H390C394.418 0 398 3.58172 398 8V127C398 131.418 394.418 135 390 135H7.99999C3.58171 135 0 131.418 0 127V8Z" fill="black"/>
|
||||||
<path d="M312.027 9.5C317.991 9.5 324.52 12.3449 331.367 19.2588C338.25 26.2075 344.885 36.7468 350.66 50.5336C362.194 78.0671 369.554 116.764 369.554 160C369.554 203.236 362.194 241.933 350.66 269.466C344.885 283.253 338.25 293.793 331.367 300.741C324.52 307.655 317.991 310.5 312.027 310.5C306.063 310.5 299.534 307.655 292.687 300.741C285.805 293.793 279.17 283.253 273.394 269.466C261.86 241.933 254.5 203.236 254.5 160C254.5 116.764 261.86 78.0671 273.394 50.5336C279.17 36.7468 285.805 26.2075 292.687 19.2588C299.534 12.3449 306.063 9.5 312.027 9.5Z" stroke="#FF5733" stroke-width="19"/>
|
<path d="M50 135H348V535C348 537.209 346.209 539 344 539H54C51.7909 539 50 537.209 50 535V135Z" fill="#FF5733"/>
|
||||||
|
<path d="M11 14.0001C11 11.791 12.7909 10.0001 15 10.0001H384C386.209 10.0001 388 11.791 388 14.0001V120C388 122.209 386.209 124 384 124H15C12.7909 124 11 122.209 11 120V14.0001Z" fill="#FF5733"/>
|
||||||
|
<path d="M11 14.0001C11 11.791 12.7909 10.0001 15 10.0001H384C386.209 10.0001 388 11.791 388 14.0001V120C388 122.209 386.209 124 384 124H15C12.7909 124 11 122.209 11 120V14.0001Z" fill="url(#paint0_linear_102_49)"/>
|
||||||
|
<path d="M50 134H348V535C348 537.209 346.209 539 344 539H54C51.7909 539 50 537.209 50 535V134Z" fill="url(#paint1_linear_102_49)"/>
|
||||||
|
<path d="M108 142H156V535H108V142Z" fill="white"/>
|
||||||
|
<path d="M300 135H348V535C348 537.209 346.209 539 344 539H300V135Z" fill="white" fill-opacity="0.25"/>
|
||||||
|
<path d="M96 142H108V535H96V142Z" fill="white" fill-opacity="0.5"/>
|
||||||
|
<path d="M84 10.0001H133V120H84V10.0001Z" fill="white"/>
|
||||||
|
<path d="M339 10.0001H384C386.209 10.0001 388 11.791 388 14.0001V120C388 122.209 386.209 124 384 124H339V10.0001Z" fill="white" fill-opacity="0.25"/>
|
||||||
|
<path d="M71.9995 10.0001H83.9995V120H71.9995V10.0001Z" fill="white" fill-opacity="0.5"/>
|
||||||
|
<path d="M108 534.529H156V539.019H108V534.529Z" fill="#AAAAAA"/>
|
||||||
|
<path opacity="0.5" d="M95.9927 534.529H107.982V539.019H95.9927V534.529Z" fill="#AAAAAA"/>
|
||||||
|
<path d="M84.0029 119.887H133.007V124.027H84.0029V119.887Z" fill="#AAAAAA"/>
|
||||||
|
<path opacity="0.5" d="M71.9883 119.887H83.978V124.027H71.9883V119.887Z" fill="#AAAAAA"/>
|
||||||
|
<defs>
|
||||||
|
<linearGradient id="paint0_linear_102_49" x1="335" y1="67.0001" x2="137" y2="67.0001" gradientUnits="userSpaceOnUse">
|
||||||
|
<stop stop-color="#D62600"/>
|
||||||
|
<stop offset="1" stop-color="#FF5733" stop-opacity="0"/>
|
||||||
|
</linearGradient>
|
||||||
|
<linearGradient id="paint1_linear_102_49" x1="306.106" y1="336.5" x2="149.597" y2="336.5" gradientUnits="userSpaceOnUse">
|
||||||
|
<stop stop-color="#D62600"/>
|
||||||
|
<stop offset="1" stop-color="#FF5733" stop-opacity="0"/>
|
||||||
|
</linearGradient>
|
||||||
|
</defs>
|
||||||
</svg>
|
</svg>
|
||||||
|
|||||||
|
Before Width: | Height: | Size: 1.4 KiB After Width: | Height: | Size: 2.3 KiB |
|
Before Width: | Height: | Size: 62 KiB After Width: | Height: | Size: 26 KiB |
@@ -19,7 +19,7 @@ const CopiableCode = ({ code }: { code: string }) => {
|
|||||||
w="full"
|
w="full"
|
||||||
justifyContent="space-between"
|
justifyContent="space-between"
|
||||||
>
|
>
|
||||||
<Text fontFamily="inconsolata" fontWeight="bold" letterSpacing={0.5}>
|
<Text fontFamily="inconsolata" fontWeight="bold" letterSpacing={0.5} overflowX="auto">
|
||||||
{code}
|
{code}
|
||||||
</Text>
|
</Text>
|
||||||
<Tooltip closeOnClick={false} label={copied ? "Copied!" : "Copy to clipboard"}>
|
<Tooltip closeOnClick={false} label={copied ? "Copied!" : "Copy to clipboard"}>
|
||||||
|
|||||||
@@ -8,8 +8,8 @@ export default function Favicon() {
|
|||||||
<link rel="icon" type="image/png" sizes="16x16" href="/favicons/favicon-16x16.png" />
|
<link rel="icon" type="image/png" sizes="16x16" href="/favicons/favicon-16x16.png" />
|
||||||
<link rel="manifest" href="/favicons/site.webmanifest" />
|
<link rel="manifest" href="/favicons/site.webmanifest" />
|
||||||
<link rel="shortcut icon" href="/favicons/favicon.ico" />
|
<link rel="shortcut icon" href="/favicons/favicon.ico" />
|
||||||
|
<link rel="mask-icon" href="/favicons/safari-pinned-tab.svg" color="#5bbad5" />
|
||||||
<meta name="msapplication-TileColor" content="#da532c" />
|
<meta name="msapplication-TileColor" content="#da532c" />
|
||||||
<meta name="msapplication-config" content="/favicons/browserconfig.xml" />
|
|
||||||
<meta name="theme-color" content="#ffffff" />
|
<meta name="theme-color" content="#ffffff" />
|
||||||
</Head>
|
</Head>
|
||||||
);
|
);
|
||||||
|
|||||||
@@ -12,6 +12,7 @@ import {
|
|||||||
Select,
|
Select,
|
||||||
FormHelperText,
|
FormHelperText,
|
||||||
Code,
|
Code,
|
||||||
|
IconButton,
|
||||||
} from "@chakra-ui/react";
|
} from "@chakra-ui/react";
|
||||||
import { type Evaluation, EvalType } from "@prisma/client";
|
import { type Evaluation, EvalType } from "@prisma/client";
|
||||||
import { useCallback, useState } from "react";
|
import { useCallback, useState } from "react";
|
||||||
@@ -183,46 +184,37 @@ export default function EditEvaluations() {
|
|||||||
<Text flex={1}>
|
<Text flex={1}>
|
||||||
{evaluation.evalType}: "{evaluation.value}"
|
{evaluation.evalType}: "{evaluation.value}"
|
||||||
</Text>
|
</Text>
|
||||||
<Button
|
|
||||||
|
<IconButton
|
||||||
|
aria-label="Edit"
|
||||||
variant="unstyled"
|
variant="unstyled"
|
||||||
color="gray.400"
|
|
||||||
height="unset"
|
|
||||||
width="unset"
|
|
||||||
minW="unset"
|
minW="unset"
|
||||||
|
color="gray.400"
|
||||||
onClick={() => setEditingId(evaluation.id)}
|
onClick={() => setEditingId(evaluation.id)}
|
||||||
_hover={{
|
_hover={{ color: "gray.800", cursor: "pointer" }}
|
||||||
color: "gray.800",
|
icon={<Icon as={BsPencil} />}
|
||||||
cursor: "pointer",
|
/>
|
||||||
}}
|
<IconButton
|
||||||
>
|
aria-label="Delete"
|
||||||
<Icon as={BsPencil} boxSize={4} />
|
|
||||||
</Button>
|
|
||||||
<Button
|
|
||||||
variant="unstyled"
|
variant="unstyled"
|
||||||
color="gray.400"
|
|
||||||
height="unset"
|
|
||||||
width="unset"
|
|
||||||
minW="unset"
|
minW="unset"
|
||||||
|
color="gray.400"
|
||||||
onClick={() => onDelete(evaluation.id)}
|
onClick={() => onDelete(evaluation.id)}
|
||||||
_hover={{
|
_hover={{ color: "gray.800", cursor: "pointer" }}
|
||||||
color: "gray.800",
|
icon={<Icon as={BsX} boxSize={6} />}
|
||||||
cursor: "pointer",
|
/>
|
||||||
}}
|
|
||||||
>
|
|
||||||
<Icon as={BsX} boxSize={6} />
|
|
||||||
</Button>
|
|
||||||
</HStack>
|
</HStack>
|
||||||
),
|
),
|
||||||
)}
|
)}
|
||||||
{editingId == null && (
|
{editingId == null && (
|
||||||
<Button
|
<Button
|
||||||
onClick={() => setEditingId("new")}
|
onClick={() => setEditingId("new")}
|
||||||
alignSelf="flex-start"
|
alignSelf="end"
|
||||||
size="sm"
|
size="sm"
|
||||||
mt={4}
|
mt={4}
|
||||||
colorScheme="blue"
|
colorScheme="blue"
|
||||||
>
|
>
|
||||||
Add Evaluation
|
New Evaluation
|
||||||
</Button>
|
</Button>
|
||||||
)}
|
)}
|
||||||
{editingId == "new" && (
|
{editingId == "new" && (
|
||||||
|
|||||||
@@ -1,103 +1,185 @@
|
|||||||
import { Text, Button, HStack, Heading, Icon, Input, Stack } from "@chakra-ui/react";
|
import { Text, Button, HStack, Heading, Icon, IconButton, Stack, VStack } from "@chakra-ui/react";
|
||||||
import { useState } from "react";
|
import { type TemplateVariable } from "@prisma/client";
|
||||||
import { BsCheck, BsX } from "react-icons/bs";
|
import { useEffect, useState } from "react";
|
||||||
|
import { BsPencil, BsX } from "react-icons/bs";
|
||||||
import { api } from "~/utils/api";
|
import { api } from "~/utils/api";
|
||||||
import { useExperiment, useHandledAsyncCallback } from "~/utils/hooks";
|
import { useExperiment, useHandledAsyncCallback, useScenarioVars } from "~/utils/hooks";
|
||||||
|
import { maybeReportError } from "~/utils/standardResponses";
|
||||||
|
import { FloatingLabelInput } from "./FloatingLabelInput";
|
||||||
|
|
||||||
|
export const ScenarioVar = ({
|
||||||
|
variable,
|
||||||
|
isEditing,
|
||||||
|
setIsEditing,
|
||||||
|
}: {
|
||||||
|
variable: Pick<TemplateVariable, "id" | "label">;
|
||||||
|
isEditing: boolean;
|
||||||
|
setIsEditing: (isEditing: boolean) => void;
|
||||||
|
}) => {
|
||||||
|
const utils = api.useContext();
|
||||||
|
|
||||||
|
const [label, setLabel] = useState(variable.label);
|
||||||
|
|
||||||
|
useEffect(() => {
|
||||||
|
setLabel(variable.label);
|
||||||
|
}, [variable.label]);
|
||||||
|
|
||||||
|
const renameVarMutation = api.scenarioVars.rename.useMutation();
|
||||||
|
const [onRename] = useHandledAsyncCallback(async () => {
|
||||||
|
const resp = await renameVarMutation.mutateAsync({ id: variable.id, label });
|
||||||
|
if (maybeReportError(resp)) return;
|
||||||
|
|
||||||
|
setIsEditing(false);
|
||||||
|
await utils.scenarioVars.list.invalidate();
|
||||||
|
await utils.scenarios.list.invalidate();
|
||||||
|
}, [label, variable.id]);
|
||||||
|
|
||||||
|
const deleteMutation = api.scenarioVars.delete.useMutation();
|
||||||
|
const [onDeleteVar] = useHandledAsyncCallback(async () => {
|
||||||
|
await deleteMutation.mutateAsync({ id: variable.id });
|
||||||
|
await utils.scenarioVars.list.invalidate();
|
||||||
|
}, [variable.id]);
|
||||||
|
|
||||||
|
if (isEditing) {
|
||||||
|
return (
|
||||||
|
<HStack w="full">
|
||||||
|
<FloatingLabelInput
|
||||||
|
flex={1}
|
||||||
|
label="Renamed Variable"
|
||||||
|
value={label}
|
||||||
|
onChange={(e) => setLabel(e.target.value)}
|
||||||
|
onKeyDown={(e) => {
|
||||||
|
if (e.key === "Enter") {
|
||||||
|
e.preventDefault();
|
||||||
|
onRename();
|
||||||
|
}
|
||||||
|
// If the user types a space, replace it with an underscore
|
||||||
|
if (e.key === " ") {
|
||||||
|
e.preventDefault();
|
||||||
|
setLabel((label) => label && `${label}_`);
|
||||||
|
}
|
||||||
|
}}
|
||||||
|
/>
|
||||||
|
<Button size="sm" onClick={() => setIsEditing(false)}>
|
||||||
|
Cancel
|
||||||
|
</Button>
|
||||||
|
<Button size="sm" colorScheme="blue" onClick={onRename}>
|
||||||
|
Save
|
||||||
|
</Button>
|
||||||
|
</HStack>
|
||||||
|
);
|
||||||
|
} else {
|
||||||
|
return (
|
||||||
|
<HStack w="full" borderTopWidth={1} borderColor="gray.200">
|
||||||
|
<Text flex={1}>{variable.label}</Text>
|
||||||
|
<IconButton
|
||||||
|
aria-label="Edit"
|
||||||
|
variant="unstyled"
|
||||||
|
minW="unset"
|
||||||
|
color="gray.400"
|
||||||
|
onClick={() => setIsEditing(true)}
|
||||||
|
_hover={{ color: "gray.800", cursor: "pointer" }}
|
||||||
|
icon={<Icon as={BsPencil} />}
|
||||||
|
/>
|
||||||
|
<IconButton
|
||||||
|
aria-label="Delete"
|
||||||
|
variant="unstyled"
|
||||||
|
minW="unset"
|
||||||
|
color="gray.400"
|
||||||
|
onClick={onDeleteVar}
|
||||||
|
_hover={{ color: "gray.800", cursor: "pointer" }}
|
||||||
|
icon={<Icon as={BsX} boxSize={6} />}
|
||||||
|
/>
|
||||||
|
</HStack>
|
||||||
|
);
|
||||||
|
}
|
||||||
|
};
|
||||||
|
|
||||||
export default function EditScenarioVars() {
|
export default function EditScenarioVars() {
|
||||||
const experiment = useExperiment();
|
const experiment = useExperiment();
|
||||||
const vars =
|
const vars = useScenarioVars();
|
||||||
api.templateVars.list.useQuery({ experimentId: experiment.data?.id ?? "" }).data ?? [];
|
|
||||||
|
const [currentlyEditingId, setCurrentlyEditingId] = useState<string | null>(null);
|
||||||
|
|
||||||
const [newVariable, setNewVariable] = useState<string>("");
|
const [newVariable, setNewVariable] = useState<string>("");
|
||||||
const newVarIsValid = newVariable.length > 0 && !vars.map((v) => v.label).includes(newVariable);
|
const newVarIsValid = newVariable?.length ?? 0 > 0;
|
||||||
|
|
||||||
const utils = api.useContext();
|
const utils = api.useContext();
|
||||||
const addVarMutation = api.templateVars.create.useMutation();
|
const addVarMutation = api.scenarioVars.create.useMutation();
|
||||||
const [onAddVar] = useHandledAsyncCallback(async () => {
|
const [onAddVar] = useHandledAsyncCallback(async () => {
|
||||||
if (!experiment.data?.id) return;
|
if (!experiment.data?.id) return;
|
||||||
if (!newVarIsValid) return;
|
if (!newVariable) return;
|
||||||
await addVarMutation.mutateAsync({
|
const resp = await addVarMutation.mutateAsync({
|
||||||
experimentId: experiment.data.id,
|
experimentId: experiment.data.id,
|
||||||
label: newVariable,
|
label: newVariable,
|
||||||
});
|
});
|
||||||
await utils.templateVars.list.invalidate();
|
if (maybeReportError(resp)) return;
|
||||||
|
|
||||||
|
await utils.scenarioVars.list.invalidate();
|
||||||
setNewVariable("");
|
setNewVariable("");
|
||||||
}, [addVarMutation, experiment.data?.id, newVarIsValid, newVariable]);
|
}, [addVarMutation, experiment.data?.id, newVarIsValid, newVariable]);
|
||||||
|
|
||||||
const deleteMutation = api.templateVars.delete.useMutation();
|
|
||||||
const [onDeleteVar] = useHandledAsyncCallback(async (id: string) => {
|
|
||||||
await deleteMutation.mutateAsync({ id });
|
|
||||||
await utils.templateVars.list.invalidate();
|
|
||||||
}, []);
|
|
||||||
|
|
||||||
return (
|
return (
|
||||||
<Stack>
|
<Stack>
|
||||||
<Heading size="sm">Scenario Variables</Heading>
|
<Heading size="sm">Scenario Variables</Heading>
|
||||||
<Stack spacing={2}>
|
<VStack spacing={4}>
|
||||||
<Text fontSize="sm">
|
<Text fontSize="sm">
|
||||||
Scenario variables can be used in your prompt variants as well as evaluations.
|
Scenario variables can be used in your prompt variants as well as evaluations.
|
||||||
</Text>
|
</Text>
|
||||||
<HStack spacing={0}>
|
<VStack spacing={0} w="full">
|
||||||
<Input
|
{vars.data?.map((variable) => (
|
||||||
placeholder="Add Scenario Variable"
|
<ScenarioVar
|
||||||
size="sm"
|
variable={variable}
|
||||||
borderTopRadius={0}
|
|
||||||
borderRightRadius={0}
|
|
||||||
value={newVariable}
|
|
||||||
onChange={(e) => setNewVariable(e.target.value)}
|
|
||||||
onKeyDown={(e) => {
|
|
||||||
if (e.key === "Enter") {
|
|
||||||
e.preventDefault();
|
|
||||||
onAddVar();
|
|
||||||
}
|
|
||||||
// If the user types a space, replace it with an underscore
|
|
||||||
if (e.key === " ") {
|
|
||||||
e.preventDefault();
|
|
||||||
setNewVariable((v) => v + "_");
|
|
||||||
}
|
|
||||||
}}
|
|
||||||
/>
|
|
||||||
<Button
|
|
||||||
size="xs"
|
|
||||||
height="100%"
|
|
||||||
borderLeftRadius={0}
|
|
||||||
isDisabled={!newVarIsValid}
|
|
||||||
onClick={onAddVar}
|
|
||||||
>
|
|
||||||
<Icon as={BsCheck} boxSize={8} />
|
|
||||||
</Button>
|
|
||||||
</HStack>
|
|
||||||
|
|
||||||
<HStack spacing={2} py={4} wrap="wrap">
|
|
||||||
{vars.map((variable) => (
|
|
||||||
<HStack
|
|
||||||
key={variable.id}
|
key={variable.id}
|
||||||
spacing={0}
|
isEditing={currentlyEditingId === variable.id}
|
||||||
bgColor="blue.100"
|
setIsEditing={(isEditing) => {
|
||||||
color="blue.600"
|
if (isEditing) {
|
||||||
pl={2}
|
setCurrentlyEditingId(variable.id);
|
||||||
pr={0}
|
} else {
|
||||||
fontWeight="bold"
|
setCurrentlyEditingId(null);
|
||||||
>
|
}
|
||||||
<Text fontSize="sm" flex={1}>
|
}}
|
||||||
{variable.label}
|
/>
|
||||||
</Text>
|
|
||||||
<Button
|
|
||||||
size="xs"
|
|
||||||
variant="ghost"
|
|
||||||
colorScheme="blue"
|
|
||||||
p="unset"
|
|
||||||
minW="unset"
|
|
||||||
px="unset"
|
|
||||||
onClick={() => onDeleteVar(variable.id)}
|
|
||||||
>
|
|
||||||
<Icon as={BsX} boxSize={6} color="blue.800" />
|
|
||||||
</Button>
|
|
||||||
</HStack>
|
|
||||||
))}
|
))}
|
||||||
</HStack>
|
</VStack>
|
||||||
</Stack>
|
{currentlyEditingId !== "new" && (
|
||||||
|
<Button
|
||||||
|
colorScheme="blue"
|
||||||
|
size="sm"
|
||||||
|
onClick={() => setCurrentlyEditingId("new")}
|
||||||
|
alignSelf="end"
|
||||||
|
>
|
||||||
|
New Variable
|
||||||
|
</Button>
|
||||||
|
)}
|
||||||
|
{currentlyEditingId === "new" && (
|
||||||
|
<HStack w="full">
|
||||||
|
<FloatingLabelInput
|
||||||
|
flex={1}
|
||||||
|
label="New Variable"
|
||||||
|
value={newVariable}
|
||||||
|
onChange={(e) => setNewVariable(e.target.value)}
|
||||||
|
onKeyDown={(e) => {
|
||||||
|
if (e.key === "Enter") {
|
||||||
|
e.preventDefault();
|
||||||
|
onAddVar();
|
||||||
|
}
|
||||||
|
// If the user types a space, replace it with an underscore
|
||||||
|
if (e.key === " ") {
|
||||||
|
e.preventDefault();
|
||||||
|
setNewVariable((v) => v && `${v}_`);
|
||||||
|
}
|
||||||
|
}}
|
||||||
|
/>
|
||||||
|
<Button size="sm" onClick={() => setCurrentlyEditingId(null)}>
|
||||||
|
Cancel
|
||||||
|
</Button>
|
||||||
|
<Button size="sm" colorScheme="blue" onClick={onAddVar}>
|
||||||
|
Save
|
||||||
|
</Button>
|
||||||
|
</HStack>
|
||||||
|
)}
|
||||||
|
</VStack>
|
||||||
</Stack>
|
</Stack>
|
||||||
);
|
);
|
||||||
}
|
}
|
||||||
|
|||||||
@@ -1,7 +1,7 @@
|
|||||||
import { api } from "~/utils/api";
|
import { api } from "~/utils/api";
|
||||||
import { type PromptVariant, type Scenario } from "../types";
|
import { type PromptVariant, type Scenario } from "../types";
|
||||||
import { type StackProps, Text, VStack } from "@chakra-ui/react";
|
import { type StackProps, Text, VStack } from "@chakra-ui/react";
|
||||||
import { useExperiment, useHandledAsyncCallback } from "~/utils/hooks";
|
import { useScenarioVars, useHandledAsyncCallback } from "~/utils/hooks";
|
||||||
import SyntaxHighlighter from "react-syntax-highlighter";
|
import SyntaxHighlighter from "react-syntax-highlighter";
|
||||||
import { docco } from "react-syntax-highlighter/dist/cjs/styles/hljs";
|
import { docco } from "react-syntax-highlighter/dist/cjs/styles/hljs";
|
||||||
import stringify from "json-stringify-pretty-compact";
|
import stringify from "json-stringify-pretty-compact";
|
||||||
@@ -23,10 +23,7 @@ export default function OutputCell({
|
|||||||
variant: PromptVariant;
|
variant: PromptVariant;
|
||||||
}): ReactElement | null {
|
}): ReactElement | null {
|
||||||
const utils = api.useContext();
|
const utils = api.useContext();
|
||||||
const experiment = useExperiment();
|
const vars = useScenarioVars().data;
|
||||||
const vars = api.templateVars.list.useQuery({
|
|
||||||
experimentId: experiment.data?.id ?? "",
|
|
||||||
}).data;
|
|
||||||
|
|
||||||
const scenarioVariables = scenario.variableValues as Record<string, string>;
|
const scenarioVariables = scenario.variableValues as Record<string, string>;
|
||||||
const templateHasVariables =
|
const templateHasVariables =
|
||||||
@@ -191,7 +188,7 @@ export default function OutputCell({
|
|||||||
|
|
||||||
return (
|
return (
|
||||||
<CellWrapper>
|
<CellWrapper>
|
||||||
<Text>{contentToDisplay}</Text>
|
<Text whiteSpace="pre-wrap">{contentToDisplay}</Text>
|
||||||
</CellWrapper>
|
</CellWrapper>
|
||||||
);
|
);
|
||||||
}
|
}
|
||||||
|
|||||||
@@ -19,8 +19,8 @@ export const OutputStats = ({
|
|||||||
? modelResponse.receivedAt.getTime() - modelResponse.requestedAt.getTime()
|
? modelResponse.receivedAt.getTime() - modelResponse.requestedAt.getTime()
|
||||||
: 0;
|
: 0;
|
||||||
|
|
||||||
const promptTokens = modelResponse.promptTokens;
|
const inputTokens = modelResponse.inputTokens;
|
||||||
const completionTokens = modelResponse.completionTokens;
|
const outputTokens = modelResponse.outputTokens;
|
||||||
|
|
||||||
return (
|
return (
|
||||||
<HStack
|
<HStack
|
||||||
@@ -55,8 +55,8 @@ export const OutputStats = ({
|
|||||||
</HStack>
|
</HStack>
|
||||||
{modelResponse.cost && (
|
{modelResponse.cost && (
|
||||||
<CostTooltip
|
<CostTooltip
|
||||||
promptTokens={promptTokens}
|
inputTokens={inputTokens}
|
||||||
completionTokens={completionTokens}
|
outputTokens={outputTokens}
|
||||||
cost={modelResponse.cost}
|
cost={modelResponse.cost}
|
||||||
>
|
>
|
||||||
<HStack spacing={0}>
|
<HStack spacing={0}>
|
||||||
|
|||||||
@@ -1,7 +1,7 @@
|
|||||||
import { isEqual } from "lodash-es";
|
import { isEqual } from "lodash-es";
|
||||||
import { useEffect, useState, type DragEvent } from "react";
|
import { useEffect, useState, type DragEvent } from "react";
|
||||||
import { api } from "~/utils/api";
|
import { api } from "~/utils/api";
|
||||||
import { useExperiment, useExperimentAccess, useHandledAsyncCallback } from "~/utils/hooks";
|
import { useExperimentAccess, useHandledAsyncCallback, useScenarioVars } from "~/utils/hooks";
|
||||||
import { type Scenario } from "./types";
|
import { type Scenario } from "./types";
|
||||||
|
|
||||||
import {
|
import {
|
||||||
@@ -41,8 +41,7 @@ export default function ScenarioEditor({
|
|||||||
if (savedValues) setValues(savedValues);
|
if (savedValues) setValues(savedValues);
|
||||||
}, [savedValues]);
|
}, [savedValues]);
|
||||||
|
|
||||||
const experiment = useExperiment();
|
const vars = useScenarioVars();
|
||||||
const vars = api.templateVars.list.useQuery({ experimentId: experiment.data?.id ?? "" });
|
|
||||||
|
|
||||||
const variableLabels = vars.data?.map((v) => v.label) ?? [];
|
const variableLabels = vars.data?.map((v) => v.label) ?? [];
|
||||||
|
|
||||||
|
|||||||
@@ -58,7 +58,7 @@ export const ScenarioEditorModal = ({
|
|||||||
await utils.scenarios.list.invalidate();
|
await utils.scenarios.list.invalidate();
|
||||||
}, [mutation, values]);
|
}, [mutation, values]);
|
||||||
|
|
||||||
const vars = api.templateVars.list.useQuery({ experimentId: experiment.data?.id ?? "" });
|
const vars = api.scenarioVars.list.useQuery({ experimentId: experiment.data?.id ?? "" });
|
||||||
const variableLabels = vars.data?.map((v) => v.label) ?? [];
|
const variableLabels = vars.data?.map((v) => v.label) ?? [];
|
||||||
|
|
||||||
return (
|
return (
|
||||||
|
|||||||
@@ -72,7 +72,7 @@ export const ScenariosHeader = () => {
|
|||||||
Autogenerate Scenario
|
Autogenerate Scenario
|
||||||
</MenuItem>
|
</MenuItem>
|
||||||
<MenuItem icon={<BsPencil />} onClick={openDrawer}>
|
<MenuItem icon={<BsPencil />} onClick={openDrawer}>
|
||||||
Edit Vars
|
Add or Remove Variables
|
||||||
</MenuItem>
|
</MenuItem>
|
||||||
</MenuList>
|
</MenuList>
|
||||||
</Menu>
|
</Menu>
|
||||||
|
|||||||
@@ -17,8 +17,8 @@ export default function VariantStats(props: { variant: PromptVariant }) {
|
|||||||
initialData: {
|
initialData: {
|
||||||
evalResults: [],
|
evalResults: [],
|
||||||
overallCost: 0,
|
overallCost: 0,
|
||||||
promptTokens: 0,
|
inputTokens: 0,
|
||||||
completionTokens: 0,
|
outputTokens: 0,
|
||||||
scenarioCount: 0,
|
scenarioCount: 0,
|
||||||
outputCount: 0,
|
outputCount: 0,
|
||||||
awaitingEvals: false,
|
awaitingEvals: false,
|
||||||
@@ -68,8 +68,8 @@ export default function VariantStats(props: { variant: PromptVariant }) {
|
|||||||
</HStack>
|
</HStack>
|
||||||
{data.overallCost && (
|
{data.overallCost && (
|
||||||
<CostTooltip
|
<CostTooltip
|
||||||
promptTokens={data.promptTokens}
|
inputTokens={data.inputTokens}
|
||||||
completionTokens={data.completionTokens}
|
outputTokens={data.outputTokens}
|
||||||
cost={data.overallCost}
|
cost={data.overallCost}
|
||||||
>
|
>
|
||||||
<HStack spacing={0} align="center" color="gray.500">
|
<HStack spacing={0} align="center" color="gray.500">
|
||||||
|
|||||||
@@ -40,8 +40,15 @@ const NavSidebar = () => {
|
|||||||
borderRightWidth={1}
|
borderRightWidth={1}
|
||||||
borderColor="gray.300"
|
borderColor="gray.300"
|
||||||
>
|
>
|
||||||
<HStack as={Link} href="/" _hover={{ textDecoration: "none" }} spacing={0} px={2} py={2}>
|
<HStack
|
||||||
<Image src="/logo.svg" alt="" boxSize={6} mr={4} />
|
as={Link}
|
||||||
|
href="/"
|
||||||
|
_hover={{ textDecoration: "none" }}
|
||||||
|
spacing={{ base: 1, md: 0 }}
|
||||||
|
mx={2}
|
||||||
|
py={{ base: 1, md: 2 }}
|
||||||
|
>
|
||||||
|
<Image src="/logo.svg" alt="" boxSize={6} mr={4} ml={{ base: 0.5, md: 0 }} />
|
||||||
<Heading size="md" fontFamily="inconsolata, monospace">
|
<Heading size="md" fontFamily="inconsolata, monospace">
|
||||||
OpenPipe
|
OpenPipe
|
||||||
</Heading>
|
</Heading>
|
||||||
|
|||||||
@@ -67,7 +67,7 @@ export default function ProjectMenu() {
|
|||||||
>
|
>
|
||||||
PROJECT
|
PROJECT
|
||||||
</Text>
|
</Text>
|
||||||
<Popover placement="right" isOpen={popover.isOpen} onClose={popover.onClose} closeOnBlur>
|
<Popover placement="right-end" isOpen={popover.isOpen} onClose={popover.onClose} closeOnBlur>
|
||||||
<PopoverTrigger>
|
<PopoverTrigger>
|
||||||
<NavSidebarOption>
|
<NavSidebarOption>
|
||||||
<HStack w="full" onClick={popover.onToggle}>
|
<HStack w="full" onClick={popover.onToggle}>
|
||||||
@@ -90,7 +90,7 @@ export default function ProjectMenu() {
|
|||||||
</HStack>
|
</HStack>
|
||||||
</NavSidebarOption>
|
</NavSidebarOption>
|
||||||
</PopoverTrigger>
|
</PopoverTrigger>
|
||||||
<PopoverContent _focusVisible={{ outline: "unset" }} ml={-1}>
|
<PopoverContent _focusVisible={{ outline: "unset" }} ml={-1} w="auto" minW={100} maxW={280}>
|
||||||
<VStack alignItems="flex-start" spacing={2} py={4} px={2}>
|
<VStack alignItems="flex-start" spacing={2} py={4} px={2}>
|
||||||
<Text color="gray.500" fontSize="xs" fontWeight="bold" pb={1}>
|
<Text color="gray.500" fontSize="xs" fontWeight="bold" pb={1}>
|
||||||
PROJECTS
|
PROJECTS
|
||||||
@@ -149,6 +149,8 @@ const ProjectOption = ({
|
|||||||
bgColor={isActive ? "gray.100" : "transparent"}
|
bgColor={isActive ? "gray.100" : "transparent"}
|
||||||
_hover={gearHovered ? undefined : { bgColor: "gray.200", textDecoration: "none" }}
|
_hover={gearHovered ? undefined : { bgColor: "gray.200", textDecoration: "none" }}
|
||||||
p={2}
|
p={2}
|
||||||
|
borderRadius={4}
|
||||||
|
spacing={4}
|
||||||
>
|
>
|
||||||
<Text>{proj.name}</Text>
|
<Text>{proj.name}</Text>
|
||||||
<IconButton
|
<IconButton
|
||||||
|
|||||||
@@ -47,7 +47,7 @@ export default function UserMenu({ user, ...rest }: { user: Session } & StackPro
|
|||||||
</HStack>
|
</HStack>
|
||||||
</NavSidebarOption>
|
</NavSidebarOption>
|
||||||
</PopoverTrigger>
|
</PopoverTrigger>
|
||||||
<PopoverContent _focusVisible={{ outline: "unset" }} ml={-1}>
|
<PopoverContent _focusVisible={{ outline: "unset" }} ml={-1} minW={48} w="full">
|
||||||
<VStack align="stretch" spacing={0}>
|
<VStack align="stretch" spacing={0}>
|
||||||
{/* sign out */}
|
{/* sign out */}
|
||||||
<HStack
|
<HStack
|
||||||
|
|||||||
@@ -2,14 +2,14 @@ import { HStack, Icon, Text, Tooltip, type TooltipProps, VStack, Divider } from
|
|||||||
import { BsCurrencyDollar } from "react-icons/bs";
|
import { BsCurrencyDollar } from "react-icons/bs";
|
||||||
|
|
||||||
type CostTooltipProps = {
|
type CostTooltipProps = {
|
||||||
promptTokens: number | null;
|
inputTokens: number | null;
|
||||||
completionTokens: number | null;
|
outputTokens: number | null;
|
||||||
cost: number;
|
cost: number;
|
||||||
} & TooltipProps;
|
} & TooltipProps;
|
||||||
|
|
||||||
export const CostTooltip = ({
|
export const CostTooltip = ({
|
||||||
promptTokens,
|
inputTokens,
|
||||||
completionTokens,
|
outputTokens,
|
||||||
cost,
|
cost,
|
||||||
children,
|
children,
|
||||||
...props
|
...props
|
||||||
@@ -36,12 +36,12 @@ export const CostTooltip = ({
|
|||||||
<HStack>
|
<HStack>
|
||||||
<VStack w="28" spacing={1}>
|
<VStack w="28" spacing={1}>
|
||||||
<Text>Prompt</Text>
|
<Text>Prompt</Text>
|
||||||
<Text>{promptTokens ?? 0}</Text>
|
<Text>{inputTokens ?? 0}</Text>
|
||||||
</VStack>
|
</VStack>
|
||||||
<Divider borderColor="gray.200" h={8} orientation="vertical" />
|
<Divider borderColor="gray.200" h={8} orientation="vertical" />
|
||||||
<VStack w="28" spacing={1}>
|
<VStack w="28" spacing={1}>
|
||||||
<Text whiteSpace="nowrap">Completion</Text>
|
<Text whiteSpace="nowrap">Completion</Text>
|
||||||
<Text>{completionTokens ?? 0}</Text>
|
<Text>{outputTokens ?? 0}</Text>
|
||||||
</VStack>
|
</VStack>
|
||||||
</HStack>
|
</HStack>
|
||||||
</VStack>
|
</VStack>
|
||||||
|
|||||||
@@ -28,6 +28,10 @@ const modelProvider: AnthropicProvider = {
|
|||||||
inputSchema: inputSchema as JSONSchema4,
|
inputSchema: inputSchema as JSONSchema4,
|
||||||
canStream: true,
|
canStream: true,
|
||||||
getCompletion,
|
getCompletion,
|
||||||
|
// Usage reporting hook for this provider. Nothing is computed yet, so every
// call yields `null`.
// TODO: add usage logic
getUsage: (input, output) => null,
|
||||||
...frontendModelProvider,
|
...frontendModelProvider,
|
||||||
};
|
};
|
||||||
|
|
||||||
|
|||||||
@@ -4,11 +4,9 @@ import {
|
|||||||
type ChatCompletion,
|
type ChatCompletion,
|
||||||
type CompletionCreateParams,
|
type CompletionCreateParams,
|
||||||
} from "openai/resources/chat";
|
} from "openai/resources/chat";
|
||||||
import { countOpenAIChatTokens } from "~/utils/countTokens";
|
|
||||||
import { type CompletionResponse } from "../types";
|
import { type CompletionResponse } from "../types";
|
||||||
import { isArray, isString, omit } from "lodash-es";
|
import { isArray, isString, omit } from "lodash-es";
|
||||||
import { openai } from "~/server/utils/openai";
|
import { openai } from "~/server/utils/openai";
|
||||||
import { truthyFilter } from "~/utils/utils";
|
|
||||||
import { APIError } from "openai";
|
import { APIError } from "openai";
|
||||||
import frontendModelProvider from "./frontend";
|
import frontendModelProvider from "./frontend";
|
||||||
import modelProvider, { type SupportedModel } from ".";
|
import modelProvider, { type SupportedModel } from ".";
|
||||||
@@ -60,9 +58,6 @@ export async function getCompletion(
|
|||||||
): Promise<CompletionResponse<ChatCompletion>> {
|
): Promise<CompletionResponse<ChatCompletion>> {
|
||||||
const start = Date.now();
|
const start = Date.now();
|
||||||
let finalCompletion: ChatCompletion | null = null;
|
let finalCompletion: ChatCompletion | null = null;
|
||||||
let promptTokens: number | undefined = undefined;
|
|
||||||
let completionTokens: number | undefined = undefined;
|
|
||||||
const modelName = modelProvider.getModel(input) as SupportedModel;
|
|
||||||
|
|
||||||
try {
|
try {
|
||||||
if (onStream) {
|
if (onStream) {
|
||||||
@@ -86,16 +81,6 @@ export async function getCompletion(
|
|||||||
autoRetry: false,
|
autoRetry: false,
|
||||||
};
|
};
|
||||||
}
|
}
|
||||||
try {
|
|
||||||
promptTokens = countOpenAIChatTokens(modelName, input.messages);
|
|
||||||
completionTokens = countOpenAIChatTokens(
|
|
||||||
modelName,
|
|
||||||
finalCompletion.choices.map((c) => c.message).filter(truthyFilter),
|
|
||||||
);
|
|
||||||
} catch (err) {
|
|
||||||
// TODO handle this, library seems like maybe it doesn't work with function calls?
|
|
||||||
console.error(err);
|
|
||||||
}
|
|
||||||
} else {
|
} else {
|
||||||
const resp = await openai.chat.completions.create(
|
const resp = await openai.chat.completions.create(
|
||||||
{ ...input, stream: false },
|
{ ...input, stream: false },
|
||||||
@@ -104,25 +89,14 @@ export async function getCompletion(
|
|||||||
},
|
},
|
||||||
);
|
);
|
||||||
finalCompletion = resp;
|
finalCompletion = resp;
|
||||||
promptTokens = resp.usage?.prompt_tokens ?? 0;
|
|
||||||
completionTokens = resp.usage?.completion_tokens ?? 0;
|
|
||||||
}
|
}
|
||||||
const timeToComplete = Date.now() - start;
|
const timeToComplete = Date.now() - start;
|
||||||
|
|
||||||
const { promptTokenPrice, completionTokenPrice } = frontendModelProvider.models[modelName];
|
|
||||||
let cost = undefined;
|
|
||||||
if (promptTokenPrice && completionTokenPrice && promptTokens && completionTokens) {
|
|
||||||
cost = promptTokens * promptTokenPrice + completionTokens * completionTokenPrice;
|
|
||||||
}
|
|
||||||
|
|
||||||
return {
|
return {
|
||||||
type: "success",
|
type: "success",
|
||||||
statusCode: 200,
|
statusCode: 200,
|
||||||
value: finalCompletion,
|
value: finalCompletion,
|
||||||
timeToComplete,
|
timeToComplete,
|
||||||
promptTokens,
|
|
||||||
completionTokens,
|
|
||||||
cost,
|
|
||||||
};
|
};
|
||||||
} catch (error: unknown) {
|
} catch (error: unknown) {
|
||||||
if (error instanceof APIError) {
|
if (error instanceof APIError) {
|
||||||
|
|||||||
@@ -4,6 +4,8 @@ import inputSchema from "./codegen/input.schema.json";
|
|||||||
import { type ChatCompletion, type CompletionCreateParams } from "openai/resources/chat";
|
import { type ChatCompletion, type CompletionCreateParams } from "openai/resources/chat";
|
||||||
import { getCompletion } from "./getCompletion";
|
import { getCompletion } from "./getCompletion";
|
||||||
import frontendModelProvider from "./frontend";
|
import frontendModelProvider from "./frontend";
|
||||||
|
import { countOpenAIChatTokens } from "~/utils/countTokens";
|
||||||
|
import { truthyFilter } from "~/utils/utils";
|
||||||
|
|
||||||
const supportedModels = [
|
const supportedModels = [
|
||||||
"gpt-4-0613",
|
"gpt-4-0613",
|
||||||
@@ -39,6 +41,41 @@ const modelProvider: OpenaiChatModelProvider = {
|
|||||||
inputSchema: inputSchema as JSONSchema4,
|
inputSchema: inputSchema as JSONSchema4,
|
||||||
canStream: true,
|
canStream: true,
|
||||||
getCompletion,
|
getCompletion,
|
||||||
|
// Reports token usage and cost for a finished chat completion.
//
// Returns `null` when the output has no choices or the model cannot be
// resolved from the input. Otherwise returns `{ inputTokens, outputTokens, cost }`,
// where any field may be `undefined` if it could not be determined.
getUsage: (input, output) => {
  if (output.choices.length === 0) return null;

  const model = modelProvider.getModel(input);
  if (!model) return null;

  let inputTokens: number | undefined;
  let outputTokens: number | undefined;

  if (output.usage) {
    // Prefer the counts reported in the response itself.
    inputTokens = output.usage.prompt_tokens;
    outputTokens = output.usage.completion_tokens;
  } else {
    // No usage block in the output: fall back to counting tokens locally.
    try {
      inputTokens = countOpenAIChatTokens(model, input.messages);
      outputTokens = countOpenAIChatTokens(
        model,
        output.choices.map((c) => c.message).filter(truthyFilter),
      );
    } catch (err) {
      // Leave whatever could not be counted as `undefined` rather than
      // recording a misleading 0 that would later be summed as real usage.
      // TODO: handle this properly; the token-counting library may not
      // support function calls.
      console.error(err);
    }
  }

  const { promptTokenPrice, completionTokenPrice } = frontendModelProvider.models[model];

  let cost = undefined;
  // Compare token counts against `undefined` (not truthiness) so that a
  // legitimate count of 0 on either side still produces a cost.
  if (
    promptTokenPrice &&
    completionTokenPrice &&
    inputTokens !== undefined &&
    outputTokens !== undefined
  ) {
    cost = inputTokens * promptTokenPrice + outputTokens * completionTokenPrice;
  }

  return { inputTokens, outputTokens, cost };
},
|
||||||
...frontendModelProvider,
|
...frontendModelProvider,
|
||||||
};
|
};
|
||||||
|
|
||||||
|
|||||||
@@ -75,6 +75,10 @@ const modelProvider: ReplicateLlama2Provider = {
|
|||||||
},
|
},
|
||||||
canStream: true,
|
canStream: true,
|
||||||
getCompletion,
|
getCompletion,
|
||||||
|
// Usage reporting hook for this provider. Nothing is computed yet, so every
// call yields `null`.
// TODO: add usage logic
getUsage: (input, output) => null,
|
||||||
...frontendModelProvider,
|
...frontendModelProvider,
|
||||||
};
|
};
|
||||||
|
|
||||||
|
|||||||
@@ -43,9 +43,6 @@ export type CompletionResponse<T> =
|
|||||||
value: T;
|
value: T;
|
||||||
timeToComplete: number;
|
timeToComplete: number;
|
||||||
statusCode: number;
|
statusCode: number;
|
||||||
promptTokens?: number;
|
|
||||||
completionTokens?: number;
|
|
||||||
cost?: number;
|
|
||||||
};
|
};
|
||||||
|
|
||||||
export type ModelProvider<SupportedModels extends string, InputSchema, OutputSchema> = {
|
export type ModelProvider<SupportedModels extends string, InputSchema, OutputSchema> = {
|
||||||
@@ -56,6 +53,10 @@ export type ModelProvider<SupportedModels extends string, InputSchema, OutputSch
|
|||||||
input: InputSchema,
|
input: InputSchema,
|
||||||
onStream: ((partialOutput: OutputSchema) => void) | null,
|
onStream: ((partialOutput: OutputSchema) => void) | null,
|
||||||
) => Promise<CompletionResponse<OutputSchema>>;
|
) => Promise<CompletionResponse<OutputSchema>>;
|
||||||
|
getUsage: (
|
||||||
|
input: InputSchema,
|
||||||
|
output: OutputSchema,
|
||||||
|
) => { gpuRuntime?: number; inputTokens?: number; outputTokens?: number; cost?: number } | null;
|
||||||
|
|
||||||
// This is just a convenience for type inference, don't use it at runtime
|
// This is just a convenience for type inference, don't use it at runtime
|
||||||
_outputSchema?: OutputSchema | null;
|
_outputSchema?: OutputSchema | null;
|
||||||
|
|||||||
@@ -5,7 +5,6 @@ import {
|
|||||||
type TextProps,
|
type TextProps,
|
||||||
VStack,
|
VStack,
|
||||||
HStack,
|
HStack,
|
||||||
Input,
|
|
||||||
Button,
|
Button,
|
||||||
Divider,
|
Divider,
|
||||||
Icon,
|
Icon,
|
||||||
@@ -21,6 +20,7 @@ import { useHandledAsyncCallback, useSelectedProject } from "~/utils/hooks";
|
|||||||
import ProjectBreadcrumbContents from "~/components/nav/ProjectBreadcrumbContents";
|
import ProjectBreadcrumbContents from "~/components/nav/ProjectBreadcrumbContents";
|
||||||
import CopiableCode from "~/components/CopiableCode";
|
import CopiableCode from "~/components/CopiableCode";
|
||||||
import { DeleteProjectDialog } from "~/components/projectSettings/DeleteProjectDialog";
|
import { DeleteProjectDialog } from "~/components/projectSettings/DeleteProjectDialog";
|
||||||
|
import AutoResizeTextArea from "~/components/AutoResizeTextArea";
|
||||||
|
|
||||||
export default function Settings() {
|
export default function Settings() {
|
||||||
const utils = api.useContext();
|
const utils = api.useContext();
|
||||||
@@ -84,7 +84,7 @@ export default function Settings() {
|
|||||||
<Text fontWeight="bold" fontSize="xl">
|
<Text fontWeight="bold" fontSize="xl">
|
||||||
Display Name
|
Display Name
|
||||||
</Text>
|
</Text>
|
||||||
<Input
|
<AutoResizeTextArea
|
||||||
w="full"
|
w="full"
|
||||||
maxW={600}
|
maxW={600}
|
||||||
value={name}
|
value={name}
|
||||||
@@ -136,10 +136,13 @@ export default function Settings() {
|
|||||||
variant="outline"
|
variant="outline"
|
||||||
borderRadius={4}
|
borderRadius={4}
|
||||||
mt={2}
|
mt={2}
|
||||||
|
height="auto"
|
||||||
onClick={deleteProjectOpen.onOpen}
|
onClick={deleteProjectOpen.onOpen}
|
||||||
>
|
>
|
||||||
<Icon as={BsTrash} />
|
<Icon as={BsTrash} />
|
||||||
<Text>Delete {selectedProject?.name}</Text>
|
<Text overflowWrap="break-word" whiteSpace="normal" py={2}>
|
||||||
|
Delete {selectedProject?.name}
|
||||||
|
</Text>
|
||||||
</HStack>
|
</HStack>
|
||||||
</VStack>
|
</VStack>
|
||||||
)}
|
)}
|
||||||
|
|||||||
@@ -3,7 +3,7 @@ import { createTRPCRouter } from "~/server/api/trpc";
|
|||||||
import { experimentsRouter } from "./routers/experiments.router";
|
import { experimentsRouter } from "./routers/experiments.router";
|
||||||
import { scenariosRouter } from "./routers/scenarios.router";
|
import { scenariosRouter } from "./routers/scenarios.router";
|
||||||
import { scenarioVariantCellsRouter } from "./routers/scenarioVariantCells.router";
|
import { scenarioVariantCellsRouter } from "./routers/scenarioVariantCells.router";
|
||||||
import { templateVarsRouter } from "./routers/templateVariables.router";
|
import { scenarioVarsRouter } from "./routers/scenarioVariables.router";
|
||||||
import { evaluationsRouter } from "./routers/evaluations.router";
|
import { evaluationsRouter } from "./routers/evaluations.router";
|
||||||
import { worldChampsRouter } from "./routers/worldChamps.router";
|
import { worldChampsRouter } from "./routers/worldChamps.router";
|
||||||
import { datasetsRouter } from "./routers/datasets.router";
|
import { datasetsRouter } from "./routers/datasets.router";
|
||||||
@@ -22,7 +22,7 @@ export const appRouter = createTRPCRouter({
|
|||||||
experiments: experimentsRouter,
|
experiments: experimentsRouter,
|
||||||
scenarios: scenariosRouter,
|
scenarios: scenariosRouter,
|
||||||
scenarioVariantCells: scenarioVariantCellsRouter,
|
scenarioVariantCells: scenarioVariantCellsRouter,
|
||||||
templateVars: templateVarsRouter,
|
scenarioVars: scenarioVarsRouter,
|
||||||
evaluations: evaluationsRouter,
|
evaluations: evaluationsRouter,
|
||||||
worldChamps: worldChampsRouter,
|
worldChamps: worldChampsRouter,
|
||||||
datasets: datasetsRouter,
|
datasets: datasetsRouter,
|
||||||
|
|||||||
@@ -3,7 +3,7 @@ import { createTRPCRouter, protectedProcedure, publicProcedure } from "~/server/
|
|||||||
import { prisma } from "~/server/db";
|
import { prisma } from "~/server/db";
|
||||||
import { Prisma } from "@prisma/client";
|
import { Prisma } from "@prisma/client";
|
||||||
import { generateNewCell } from "~/server/utils/generateNewCell";
|
import { generateNewCell } from "~/server/utils/generateNewCell";
|
||||||
import userError from "~/server/utils/error";
|
import { error, success } from "~/utils/standardResponses";
|
||||||
import { recordExperimentUpdated } from "~/server/utils/recordExperimentUpdated";
|
import { recordExperimentUpdated } from "~/server/utils/recordExperimentUpdated";
|
||||||
import { reorderPromptVariants } from "~/server/utils/reorderPromptVariants";
|
import { reorderPromptVariants } from "~/server/utils/reorderPromptVariants";
|
||||||
import { type PromptVariant } from "@prisma/client";
|
import { type PromptVariant } from "@prisma/client";
|
||||||
@@ -123,13 +123,13 @@ export const promptVariantsRouter = createTRPCRouter({
|
|||||||
},
|
},
|
||||||
_sum: {
|
_sum: {
|
||||||
cost: true,
|
cost: true,
|
||||||
promptTokens: true,
|
inputTokens: true,
|
||||||
completionTokens: true,
|
outputTokens: true,
|
||||||
},
|
},
|
||||||
});
|
});
|
||||||
|
|
||||||
const promptTokens = overallTokens._sum?.promptTokens ?? 0;
|
const inputTokens = overallTokens._sum?.inputTokens ?? 0;
|
||||||
const completionTokens = overallTokens._sum?.completionTokens ?? 0;
|
const outputTokens = overallTokens._sum?.outputTokens ?? 0;
|
||||||
|
|
||||||
const awaitingEvals = !!evalResults.find(
|
const awaitingEvals = !!evalResults.find(
|
||||||
(result) => result.totalCount < scenarioCount * evals.length,
|
(result) => result.totalCount < scenarioCount * evals.length,
|
||||||
@@ -137,8 +137,8 @@ export const promptVariantsRouter = createTRPCRouter({
|
|||||||
|
|
||||||
return {
|
return {
|
||||||
evalResults,
|
evalResults,
|
||||||
promptTokens,
|
inputTokens,
|
||||||
completionTokens,
|
outputTokens,
|
||||||
overallCost: overallTokens._sum?.cost ?? 0,
|
overallCost: overallTokens._sum?.cost ?? 0,
|
||||||
scenarioCount,
|
scenarioCount,
|
||||||
outputCount,
|
outputCount,
|
||||||
@@ -315,7 +315,7 @@ export const promptVariantsRouter = createTRPCRouter({
|
|||||||
const constructedPrompt = await parsePromptConstructor(existing.promptConstructor);
|
const constructedPrompt = await parsePromptConstructor(existing.promptConstructor);
|
||||||
|
|
||||||
if ("error" in constructedPrompt) {
|
if ("error" in constructedPrompt) {
|
||||||
return userError(constructedPrompt.error);
|
return error(constructedPrompt.error);
|
||||||
}
|
}
|
||||||
|
|
||||||
const model = input.newModel
|
const model = input.newModel
|
||||||
@@ -353,7 +353,7 @@ export const promptVariantsRouter = createTRPCRouter({
|
|||||||
const parsedPrompt = await parsePromptConstructor(input.promptConstructor);
|
const parsedPrompt = await parsePromptConstructor(input.promptConstructor);
|
||||||
|
|
||||||
if ("error" in parsedPrompt) {
|
if ("error" in parsedPrompt) {
|
||||||
return userError(parsedPrompt.error);
|
return error(parsedPrompt.error);
|
||||||
}
|
}
|
||||||
|
|
||||||
// Create a duplicate with only the config changed
|
// Create a duplicate with only the config changed
|
||||||
@@ -398,7 +398,7 @@ export const promptVariantsRouter = createTRPCRouter({
|
|||||||
});
|
});
|
||||||
}
|
}
|
||||||
|
|
||||||
return { status: "ok" } as const;
|
return success();
|
||||||
}),
|
}),
|
||||||
|
|
||||||
reorder: protectedProcedure
|
reorder: protectedProcedure
|
||||||
|
|||||||
143
app/src/server/api/routers/scenarioVariables.router.ts
Normal file
@@ -0,0 +1,143 @@
|
|||||||
|
import { type TemplateVariable } from "@prisma/client";
|
||||||
|
import { sql } from "kysely";
|
||||||
|
import { z } from "zod";
|
||||||
|
import { createTRPCRouter, protectedProcedure, publicProcedure } from "~/server/api/trpc";
|
||||||
|
import { kysely, prisma } from "~/server/db";
|
||||||
|
import { error, success } from "~/utils/standardResponses";
|
||||||
|
import { requireCanModifyExperiment, requireCanViewExperiment } from "~/utils/accessControl";
|
||||||
|
|
||||||
|
// Finds the variable of `experimentId` whose label is exactly `label`, or null if there is none.
const findVariableByLabel = (experimentId: string, label: string) =>
  prisma.templateVariable.findFirst({ where: { experimentId, label } });

/**
 * tRPC router for an experiment's scenario (template) variables.
 *
 * - `create` / `rename` refuse a label that is already used within the same experiment and
 *   report that through `error(...)`; on success they return `success()`.
 * - `delete` removes a variable by id.
 * - `list` returns the `id` and `label` of an experiment's variables, oldest first.
 *
 * Mutations require modify access to the owning experiment; `list` requires view access.
 */
export const scenarioVarsRouter = createTRPCRouter({
  create: protectedProcedure
    .input(z.object({ experimentId: z.string(), label: z.string() }))
    .mutation(async ({ input, ctx }) => {
      const { experimentId, label } = input;
      await requireCanModifyExperiment(experimentId, ctx);

      // Labels must be unique within an experiment.
      const clash = await findVariableByLabel(experimentId, label);
      if (clash) {
        return error(`A variable named ${label} already exists.`);
      }

      await prisma.templateVariable.create({ data: { experimentId, label } });

      return success();
    }),

  rename: protectedProcedure
    .input(z.object({ id: z.string(), label: z.string() }))
    .mutation(async ({ input, ctx }) => {
      const { id, label } = input;

      // The experiment is only known once the variable has been loaded, so the
      // access check has to come after this lookup.
      const variable = await prisma.templateVariable.findUniqueOrThrow({ where: { id } });
      await requireCanModifyExperiment(variable.experimentId, ctx);

      // Labels must be unique within an experiment.
      const clash = await findVariableByLabel(variable.experimentId, label);
      if (clash) {
        return error(`A variable named ${label} already exists.`);
      }

      await renameTemplateVariable(variable, label);
      return success();
    }),

  delete: protectedProcedure
    .input(z.object({ id: z.string() }))
    .mutation(async ({ input, ctx }) => {
      const { id } = input;
      const variable = await prisma.templateVariable.findUniqueOrThrow({ where: { id } });

      await requireCanModifyExperiment(variable.experimentId, ctx);

      await prisma.templateVariable.delete({ where: { id } });
    }),

  list: publicProcedure
    .input(z.object({ experimentId: z.string() }))
    .query(async ({ input, ctx }) => {
      const { experimentId } = input;
      await requireCanViewExperiment(experimentId, ctx);

      const variables = await prisma.templateVariable.findMany({
        where: { experimentId },
        orderBy: { createdAt: "asc" },
        select: { id: true, label: true },
      });
      return variables;
    }),
});
|
||||||
|
|
||||||
|
/**
 * Renames a template variable and carries the new name over to the scenarios that use it.
 *
 * All steps run inside a single transaction:
 *  1. the `TemplateVariable` row gets the new label;
 *  2. every scenario of the experiment that has a value stored under the old label is copied
 *     into a temporary table, where the copy receives a fresh id and its value is moved from
 *     the old key to the new key;
 *  3. the original rows of those scenarios are hidden (`visible = false`), not deleted;
 *  4. the rewritten copies are inserted as new `TestScenario` rows.
 *
 * Scenarios that hold no value for the variable are neither copied nor hidden.
 * This function does not check whether `newLabel` is already in use.
 *
 * @param templateVariable the variable as currently stored; its `label` is the old name
 * @param newLabel the label to rename the variable to
 */
export const renameTemplateVariable = async (
  templateVariable: TemplateVariable,
  newLabel: string,
): Promise<void> => {
  const { experimentId, label: oldLabel } = templateVariable;

  // Moving a value onto its own key and then removing that key would delete the value.
  if (newLabel === oldLabel) return;

  await kysely.transaction().execute(async (trx) => {
    await trx
      .updateTable("TemplateVariable")
      .set({ label: newLabel })
      .where("id", "=", templateVariable.id)
      .execute();

    // ON COMMIT DROP: a temp table otherwise lives as long as the database session, so the
    // next rename that lands on the same pooled connection would fail because the table
    // already exists.
    await sql`
      CREATE TEMP TABLE "TempTestScenario" ON COMMIT DROP AS
      SELECT *
      FROM "TestScenario"
      WHERE "experimentId" = ${experimentId}
      -- Only copy the rows that actually have a value for the variable; there is no reason to churn the rest, and it simplifies the update.
      AND "variableValues"->${oldLabel} IS NOT NULL
    `.execute(trx);

    // The path is built with ARRAY[...] instead of a '{label}' text literal so that labels
    // containing commas, braces or quotes are still treated as one single key.
    await sql`
      UPDATE "TempTestScenario"
      SET "variableValues" = jsonb_set(
        "variableValues",
        ARRAY[${newLabel}::text],
        "variableValues"->${oldLabel}
      ) - ${oldLabel},
      "updatedAt" = NOW(),
      "id" = uuid_generate_v4()
    `.execute(trx);

    // Hide only the scenarios that are being replaced. Scenarios without a value for the
    // variable get no replacement row, so hiding them would make them disappear.
    await sql`
      UPDATE "TestScenario"
      SET visible = false
      WHERE "experimentId" = ${experimentId}
      AND "variableValues"->${oldLabel} IS NOT NULL
    `.execute(trx);

    // Columns are named on both sides so the insert does not depend on the physical column
    // order of "TestScenario".
    await sql`
      INSERT INTO "TestScenario" (id, "variableValues", "uiId", visible, "sortIndex", "experimentId", "createdAt", "updatedAt")
      SELECT id, "variableValues", "uiId", visible, "sortIndex", "experimentId", "createdAt", "updatedAt"
      FROM "TempTestScenario";
    `.execute(trx);
  });
};
|
||||||
110
app/src/server/api/routers/templateVariables.router.test.ts
Normal file
@@ -0,0 +1,110 @@
|
|||||||
|
import { expect, it } from "vitest";
|
||||||
|
import { prisma } from "~/server/db";
|
||||||
|
import { renameTemplateVariable } from "./scenarioVariables.router";
|
||||||
|
|
||||||
|
// Test fixture: inserts an experiment labelled "Test Experiment" together with a
// new, empty project to own it, and resolves to the created experiment row.
const createExperiment = async () => {
  const experiment = await prisma.experiment.create({
    data: { label: "Test Experiment", project: { create: {} } },
  });
  return experiment;
};
|
||||||
|
|
||||||
|
// Test fixture: inserts a template variable with the given label into the given
// experiment and resolves to the created row.
const createTemplateVar = async (experimentId: string, label: string) => {
  const templateVar = await prisma.templateVariable.create({ data: { experimentId, label } });
  return templateVar;
};
|
||||||
|
|
||||||
|
it("renames templateVariables", async () => {
  // Small local helpers to keep the setup and the assertions readable.
  const createScenario = (
    experimentId: string,
    visible: boolean,
    variableValues: Record<string, string>,
  ) => prisma.testScenario.create({ data: { experimentId, visible, variableValues } });

  const scenarioById = (id: string) => prisma.testScenario.findUnique({ where: { id } });

  const scenarioWithValues = (experimentId: string, values: Record<string, string>) =>
    prisma.testScenario.findFirst({
      where: { experimentId, variableValues: { equals: values } },
    });

  // Two experiments, created concurrently: exp2 is the one being renamed in, exp1 is a bystander.
  const [exp1, exp2] = await Promise.all([createExperiment(), createExperiment()]);

  // Template variables, created concurrently. Only exp2's "input1" gets renamed below.
  const [, varToRename] = await Promise.all([
    createTemplateVar(exp1.id, "input1"),
    createTemplateVar(exp2.id, "input1"),
    createTemplateVar(exp2.id, "input2"),
  ]);

  // Test scenarios, created concurrently: one in exp1, and in exp2 a visible one that uses
  // "input1" plus a hidden one that does not.
  const [exp1Scenario, exp2Scenario] = await Promise.all([
    createScenario(exp1.id, true, { input1: "test" }),
    createScenario(exp2.id, true, { input1: "test1", otherInput: "otherTest" }),
    createScenario(exp2.id, false, { otherInput: "otherTest2" }),
  ]);

  await renameTemplateVariable(varToRename, "input1-renamed");

  // The variable itself carries the new label.
  const renamedVar = await prisma.templateVariable.findUnique({ where: { id: varToRename.id } });
  expect(renamedVar).toMatchObject({ label: "input1-renamed" });

  // Scenarios of unrelated experiments must be left alone.
  expect(await scenarioById(exp1Scenario.id)).toMatchObject({
    visible: true,
    variableValues: { input1: "test" },
  });

  // exp2 now has 3 scenarios in total: the two originals plus the renamed copy.
  const exp2ScenarioCount = await prisma.testScenario.count({
    where: { experimentId: exp2.id },
  });
  expect(exp2ScenarioCount).toBe(3);

  // The original scenario keeps its old values and is only hidden.
  expect(await scenarioById(exp2Scenario.id)).toMatchObject({
    visible: false,
    variableValues: { input1: "test1", otherInput: "otherTest" },
  });

  // A new, visible scenario exists with the value stored under the new variable name.
  const renamedCopy = await scenarioWithValues(exp2.id, {
    "input1-renamed": "test1",
    otherInput: "otherTest",
  });
  expect(renamedCopy).toMatchObject({ visible: true });

  // The scenario that never used the variable is still there and still hidden.
  const untouchedHidden = await scenarioWithValues(exp2.id, { otherInput: "otherTest2" });
  expect(untouchedHidden).toMatchObject({ visible: false });
});
|
||||||
@@ -1,49 +0,0 @@
|
|||||||
import { z } from "zod";
|
|
||||||
import { createTRPCRouter, protectedProcedure, publicProcedure } from "~/server/api/trpc";
|
|
||||||
import { prisma } from "~/server/db";
|
|
||||||
import { requireCanModifyExperiment, requireCanViewExperiment } from "~/utils/accessControl";
|
|
||||||
|
|
||||||
export const templateVarsRouter = createTRPCRouter({
|
|
||||||
create: protectedProcedure
|
|
||||||
.input(z.object({ experimentId: z.string(), label: z.string() }))
|
|
||||||
.mutation(async ({ input, ctx }) => {
|
|
||||||
await requireCanModifyExperiment(input.experimentId, ctx);
|
|
||||||
|
|
||||||
await prisma.templateVariable.create({
|
|
||||||
data: {
|
|
||||||
experimentId: input.experimentId,
|
|
||||||
label: input.label,
|
|
||||||
},
|
|
||||||
});
|
|
||||||
}),
|
|
||||||
|
|
||||||
delete: protectedProcedure
|
|
||||||
.input(z.object({ id: z.string() }))
|
|
||||||
.mutation(async ({ input, ctx }) => {
|
|
||||||
const { experimentId } = await prisma.templateVariable.findUniqueOrThrow({
|
|
||||||
where: { id: input.id },
|
|
||||||
});
|
|
||||||
|
|
||||||
await requireCanModifyExperiment(experimentId, ctx);
|
|
||||||
|
|
||||||
await prisma.templateVariable.delete({ where: { id: input.id } });
|
|
||||||
}),
|
|
||||||
|
|
||||||
list: publicProcedure
|
|
||||||
.input(z.object({ experimentId: z.string() }))
|
|
||||||
.query(async ({ input, ctx }) => {
|
|
||||||
await requireCanViewExperiment(input.experimentId, ctx);
|
|
||||||
return await prisma.templateVariable.findMany({
|
|
||||||
where: {
|
|
||||||
experimentId: input.experimentId,
|
|
||||||
},
|
|
||||||
orderBy: {
|
|
||||||
createdAt: "asc",
|
|
||||||
},
|
|
||||||
select: {
|
|
||||||
id: true,
|
|
||||||
label: true,
|
|
||||||
},
|
|
||||||
});
|
|
||||||
}),
|
|
||||||
});
|
|
||||||
@@ -1,63 +0,0 @@
|
|||||||
import dayjs from "dayjs";
|
|
||||||
import { prisma } from "../db";
|
|
||||||
|
|
||||||
const projectId = "1234";
|
|
||||||
|
|
||||||
// Find all calls in the last 24 hours
|
|
||||||
const responses = await prisma.loggedCall.findMany({
|
|
||||||
where: {
|
|
||||||
projectId: projectId,
|
|
||||||
startTime: {
|
|
||||||
gt: dayjs()
|
|
||||||
.subtract(24 * 3600)
|
|
||||||
.toDate(),
|
|
||||||
},
|
|
||||||
},
|
|
||||||
include: {
|
|
||||||
modelResponse: true,
|
|
||||||
},
|
|
||||||
orderBy: {
|
|
||||||
startTime: "desc",
|
|
||||||
},
|
|
||||||
});
|
|
||||||
|
|
||||||
// Find all calls in the last 24 hours with promptId 'hello-world'
|
|
||||||
const helloWorld = await prisma.loggedCall.findMany({
|
|
||||||
where: {
|
|
||||||
projectId: projectId,
|
|
||||||
startTime: {
|
|
||||||
gt: dayjs()
|
|
||||||
.subtract(24 * 3600)
|
|
||||||
.toDate(),
|
|
||||||
},
|
|
||||||
tags: {
|
|
||||||
some: {
|
|
||||||
name: "promptId",
|
|
||||||
value: "hello-world",
|
|
||||||
},
|
|
||||||
},
|
|
||||||
},
|
|
||||||
include: {
|
|
||||||
modelResponse: true,
|
|
||||||
},
|
|
||||||
orderBy: {
|
|
||||||
startTime: "desc",
|
|
||||||
},
|
|
||||||
});
|
|
||||||
|
|
||||||
// Total spent on OpenAI in the last month
|
|
||||||
const totalSpent = await prisma.loggedCallModelResponse.aggregate({
|
|
||||||
_sum: {
|
|
||||||
totalCost: true,
|
|
||||||
},
|
|
||||||
where: {
|
|
||||||
originalLoggedCall: {
|
|
||||||
projectId: projectId,
|
|
||||||
},
|
|
||||||
startTime: {
|
|
||||||
gt: dayjs()
|
|
||||||
.subtract(30 * 24 * 3600)
|
|
||||||
.toDate(),
|
|
||||||
},
|
|
||||||
},
|
|
||||||
});
|
|
||||||
@@ -110,15 +110,16 @@ export const queryModel = defineTask<QueryModelJob>("queryModel", async (task) =
|
|||||||
});
|
});
|
||||||
const response = await provider.getCompletion(prompt.modelInput, onStream);
|
const response = await provider.getCompletion(prompt.modelInput, onStream);
|
||||||
if (response.type === "success") {
|
if (response.type === "success") {
|
||||||
|
const usage = provider.getUsage(prompt.modelInput, response.value);
|
||||||
modelResponse = await prisma.modelResponse.update({
|
modelResponse = await prisma.modelResponse.update({
|
||||||
where: { id: modelResponse.id },
|
where: { id: modelResponse.id },
|
||||||
data: {
|
data: {
|
||||||
output: response.value as Prisma.InputJsonObject,
|
output: response.value as Prisma.InputJsonObject,
|
||||||
statusCode: response.statusCode,
|
statusCode: response.statusCode,
|
||||||
receivedAt: new Date(),
|
receivedAt: new Date(),
|
||||||
promptTokens: response.promptTokens,
|
inputTokens: usage?.inputTokens,
|
||||||
completionTokens: response.completionTokens,
|
outputTokens: usage?.outputTokens,
|
||||||
cost: response.cost,
|
cost: usage?.cost,
|
||||||
},
|
},
|
||||||
});
|
});
|
||||||
|
|
||||||
|
|||||||
@@ -1,6 +0,0 @@
|
|||||||
/**
 * Wraps a message in an error-result object.
 *
 * @param message - Human-readable description of what went wrong.
 * @returns An object tagged with `status: "error"` that carries the message.
 */
export default function userError(message: string): { status: "error"; message: string } {
  const result: { status: "error"; message: string } = { status: "error", message };
  return result;
}
|
|
||||||
13
app/src/state/persist.ts
Normal file
@@ -0,0 +1,13 @@
|
|||||||
|
import { type PersistOptions } from "zustand/middleware/persist";
|
||||||
|
import { type State } from "./store";
|
||||||
|
|
||||||
|
// Shape and default values of the state subset referenced by the persist options.
export const stateToPersist: { selectedProjectId: string | null } = {
  selectedProjectId: null,
};
|
||||||
|
|
||||||
|
// Options handed to zustand's `persist` middleware for the app store.
export const persistOptions: PersistOptions<State, typeof stateToPersist> = {
  name: "persisted-app-store",
  // Only the selected project id is picked out of the full state.
  partialize: ({ selectedProjectId }) => ({ selectedProjectId }),
};
|
||||||
@@ -8,9 +8,9 @@ export const editorBackground = "#fafafa";
|
|||||||
export type SharedVariantEditorSlice = {
|
export type SharedVariantEditorSlice = {
|
||||||
monaco: null | ReturnType<typeof loader.__getMonacoInstance>;
|
monaco: null | ReturnType<typeof loader.__getMonacoInstance>;
|
||||||
loadMonaco: () => Promise<void>;
|
loadMonaco: () => Promise<void>;
|
||||||
scenarios: RouterOutputs["scenarios"]["list"]["scenarios"];
|
scenarioVars: RouterOutputs["scenarioVars"]["list"];
|
||||||
updateScenariosModel: () => void;
|
updateScenariosModel: () => void;
|
||||||
setScenarios: (scenarios: RouterOutputs["scenarios"]["list"]["scenarios"]) => void;
|
setScenarioVars: (scenarioVars: RouterOutputs["scenarioVars"]["list"]) => void;
|
||||||
};
|
};
|
||||||
|
|
||||||
export const createVariantEditorSlice: SliceCreator<SharedVariantEditorSlice> = (set, get) => ({
|
export const createVariantEditorSlice: SliceCreator<SharedVariantEditorSlice> = (set, get) => ({
|
||||||
@@ -60,10 +60,10 @@ export const createVariantEditorSlice: SliceCreator<SharedVariantEditorSlice> =
|
|||||||
});
|
});
|
||||||
get().sharedVariantEditor.updateScenariosModel();
|
get().sharedVariantEditor.updateScenariosModel();
|
||||||
},
|
},
|
||||||
scenarios: [],
|
scenarioVars: [],
|
||||||
setScenarios: (scenarios) => {
|
setScenarioVars: (scenarios) => {
|
||||||
set((state) => {
|
set((state) => {
|
||||||
state.sharedVariantEditor.scenarios = scenarios;
|
state.sharedVariantEditor.scenarioVars = scenarios;
|
||||||
});
|
});
|
||||||
|
|
||||||
get().sharedVariantEditor.updateScenariosModel();
|
get().sharedVariantEditor.updateScenariosModel();
|
||||||
@@ -73,17 +73,16 @@ export const createVariantEditorSlice: SliceCreator<SharedVariantEditorSlice> =
|
|||||||
const monaco = get().sharedVariantEditor.monaco;
|
const monaco = get().sharedVariantEditor.monaco;
|
||||||
if (!monaco) return;
|
if (!monaco) return;
|
||||||
|
|
||||||
const modelContents = `
|
const modelContents = `
|
||||||
const scenarios = ${JSON.stringify(
|
declare var scenario: {
|
||||||
get().sharedVariantEditor.scenarios.map((s) => s.variableValues),
|
${get()
|
||||||
null,
|
.sharedVariantEditor.scenarioVars.map((s) => `${s.label}: string;`)
|
||||||
2,
|
.join("\n")}
|
||||||
)} as const;
|
};
|
||||||
|
|
||||||
type Scenario = typeof scenarios[number];
|
|
||||||
declare var scenario: Scenario | { [key: string]: string };
|
|
||||||
`;
|
`;
|
||||||
|
|
||||||
|
console.log(modelContents);
|
||||||
|
|
||||||
const scenariosModel = monaco.editor.getModel(monaco.Uri.parse("file:///scenarios.ts"));
|
const scenariosModel = monaco.editor.getModel(monaco.Uri.parse("file:///scenarios.ts"));
|
||||||
|
|
||||||
if (scenariosModel) {
|
if (scenariosModel) {
|
||||||
|
|||||||
@@ -1,11 +1,13 @@
|
|||||||
import { type StateCreator, create } from "zustand";
|
import { type StateCreator, create } from "zustand";
|
||||||
import { immer } from "zustand/middleware/immer";
|
import { immer } from "zustand/middleware/immer";
|
||||||
|
import { persist } from "zustand/middleware";
|
||||||
import { createSelectors } from "./createSelectors";
|
import { createSelectors } from "./createSelectors";
|
||||||
import {
|
import {
|
||||||
type SharedVariantEditorSlice,
|
type SharedVariantEditorSlice,
|
||||||
createVariantEditorSlice,
|
createVariantEditorSlice,
|
||||||
} from "./sharedVariantEditor.slice";
|
} from "./sharedVariantEditor.slice";
|
||||||
import { type APIClient } from "~/utils/api";
|
import { type APIClient } from "~/utils/api";
|
||||||
|
import { persistOptions, type stateToPersist } from "./persist";
|
||||||
|
|
||||||
export type State = {
|
export type State = {
|
||||||
drawerOpen: boolean;
|
drawerOpen: boolean;
|
||||||
@@ -23,30 +25,36 @@ export type SliceCreator<T> = StateCreator<State, [["zustand/immer", never]], []
|
|||||||
export type SetFn = Parameters<SliceCreator<unknown>>[0];
|
export type SetFn = Parameters<SliceCreator<unknown>>[0];
|
||||||
export type GetFn = Parameters<SliceCreator<unknown>>[1];
|
export type GetFn = Parameters<SliceCreator<unknown>>[1];
|
||||||
|
|
||||||
const useBaseStore = create<State, [["zustand/immer", never]]>(
|
const useBaseStore = create<
|
||||||
immer((set, get, ...rest) => ({
|
State,
|
||||||
api: null,
|
[["zustand/persist", typeof stateToPersist], ["zustand/immer", never]]
|
||||||
setApi: (api) =>
|
>(
|
||||||
set((state) => {
|
persist(
|
||||||
state.api = api;
|
immer((set, get, ...rest) => ({
|
||||||
}),
|
api: null,
|
||||||
|
setApi: (api) =>
|
||||||
|
set((state) => {
|
||||||
|
state.api = api;
|
||||||
|
}),
|
||||||
|
|
||||||
drawerOpen: false,
|
drawerOpen: false,
|
||||||
openDrawer: () =>
|
openDrawer: () =>
|
||||||
set((state) => {
|
set((state) => {
|
||||||
state.drawerOpen = true;
|
state.drawerOpen = true;
|
||||||
}),
|
}),
|
||||||
closeDrawer: () =>
|
closeDrawer: () =>
|
||||||
set((state) => {
|
set((state) => {
|
||||||
state.drawerOpen = false;
|
state.drawerOpen = false;
|
||||||
}),
|
}),
|
||||||
sharedVariantEditor: createVariantEditorSlice(set, get, ...rest),
|
sharedVariantEditor: createVariantEditorSlice(set, get, ...rest),
|
||||||
selectedProjectId: null,
|
selectedProjectId: null,
|
||||||
setselectedProjectId: (id: string) =>
|
setselectedProjectId: (id: string) =>
|
||||||
set((state) => {
|
set((state) => {
|
||||||
state.selectedProjectId = id;
|
state.selectedProjectId = id;
|
||||||
}),
|
}),
|
||||||
})),
|
})),
|
||||||
|
persistOptions,
|
||||||
|
),
|
||||||
);
|
);
|
||||||
|
|
||||||
export const useAppStore = createSelectors(useBaseStore);
|
export const useAppStore = createSelectors(useBaseStore);
|
||||||
|
|||||||
@@ -1,16 +1,16 @@
|
|||||||
import { useEffect } from "react";
|
import { useEffect } from "react";
|
||||||
import { api } from "~/utils/api";
|
import { api } from "~/utils/api";
|
||||||
import { useScenarios } from "~/utils/hooks";
|
import { useScenarioVars } from "~/utils/hooks";
|
||||||
import { useAppStore } from "./store";
|
import { useAppStore } from "./store";
|
||||||
|
|
||||||
export function useSyncVariantEditor() {
|
export function useSyncVariantEditor() {
|
||||||
const scenarios = useScenarios();
|
const scenarioVars = useScenarioVars();
|
||||||
|
|
||||||
useEffect(() => {
|
useEffect(() => {
|
||||||
if (scenarios.data) {
|
if (scenarioVars.data) {
|
||||||
useAppStore.getState().sharedVariantEditor.setScenarios(scenarios.data.scenarios);
|
useAppStore.getState().sharedVariantEditor.setScenarioVars(scenarioVars.data);
|
||||||
}
|
}
|
||||||
}, [scenarios.data]);
|
}, [scenarioVars.data]);
|
||||||
}
|
}
|
||||||
|
|
||||||
export function SyncAppStore() {
|
export function SyncAppStore() {
|
||||||
|
|||||||
5
app/src/tests/helpers/loadEnv.ts
Normal file
@@ -0,0 +1,5 @@
|
|||||||
|
import { configDotenv } from "dotenv";
|
||||||
|
|
||||||
|
// Load environment variables from the test-specific dotenv file.
const testEnvPath = ".env.test";

configDotenv({ path: testEnvPath });
|
||||||
13
app/src/tests/helpers/setup.ts
Normal file
@@ -0,0 +1,13 @@
|
|||||||
|
import "./loadEnv";
|
||||||
|
import { sql } from "kysely";
|
||||||
|
import { beforeEach } from "vitest";
|
||||||
|
import { kysely } from "~/server/db";
|
||||||
|
|
||||||
|
/**
 * Resets test data by truncating the "Experiment" table; `cascade` extends the
 * truncation to tables that reference it through foreign keys.
 */
async function resetDb(): Promise<void> {
  const truncateExperiments = sql`truncate "Experiment" cascade;`;
  await truncateExperiments.execute(kysely);
}

// Start every test from a freshly reset database.
beforeEach(async () => {
  await resetDb();
});
|
||||||
@@ -1,4 +1,9 @@
|
|||||||
import { extendTheme, defineStyleConfig, ChakraProvider } from "@chakra-ui/react";
|
import {
|
||||||
|
extendTheme,
|
||||||
|
defineStyleConfig,
|
||||||
|
ChakraProvider,
|
||||||
|
createStandaloneToast,
|
||||||
|
} from "@chakra-ui/react";
|
||||||
import "@fontsource/inconsolata";
|
import "@fontsource/inconsolata";
|
||||||
import { modalAnatomy } from "@chakra-ui/anatomy";
|
import { modalAnatomy } from "@chakra-ui/anatomy";
|
||||||
import { createMultiStyleConfigHelpers } from "@chakra-ui/styled-system";
|
import { createMultiStyleConfigHelpers } from "@chakra-ui/styled-system";
|
||||||
@@ -63,6 +68,15 @@ const theme = extendTheme({
|
|||||||
},
|
},
|
||||||
});
|
});
|
||||||
|
|
||||||
|
const { ToastContainer, toast } = createStandaloneToast(theme);
|
||||||
|
|
||||||
|
export { toast };
|
||||||
|
|
||||||
export const ChakraThemeProvider = ({ children }: { children: JSX.Element }) => {
|
export const ChakraThemeProvider = ({ children }: { children: JSX.Element }) => {
|
||||||
return <ChakraProvider theme={theme}>{children}</ChakraProvider>;
|
return (
|
||||||
|
<ChakraProvider theme={theme}>
|
||||||
|
<ToastContainer />
|
||||||
|
{children}
|
||||||
|
</ChakraProvider>
|
||||||
|
);
|
||||||
};
|
};
|
||||||
|
|||||||
@@ -157,3 +157,12 @@ export const useSelectedProject = () => {
|
|||||||
{ enabled: !!selectedProjectId },
|
{ enabled: !!selectedProjectId },
|
||||||
);
|
);
|
||||||
};
|
};
|
||||||
|
|
||||||
|
/**
 * Queries `scenarioVars.list` for the current experiment.
 *
 * The query stays disabled until the experiment id is available; the empty
 * string is only a placeholder input for that disabled state.
 */
export const useScenarioVars = () => {
  const experimentId = useExperiment().data?.id;
  const queryEnabled = experimentId != null;

  return api.scenarioVars.list.useQuery(
    { experimentId: experimentId ?? "" },
    { enabled: queryEnabled },
  );
};
|
||||||
|
|||||||
31
app/src/utils/standardResponses.ts
Normal file
@@ -0,0 +1,31 @@
|
|||||||
|
import { toast } from "~/theme/ChakraThemeProvider";
|
||||||
|
|
||||||
|
/**
 * Builds an error response object.
 *
 * @param message - Description of the failure.
 * @returns An object tagged with `status: "error"` that carries the message.
 */
export function error(message: string): { status: "error"; message: string } {
  const response: { status: "error"; message: string } = { status: "error", message };
  return response;
}
|
||||||
|
/** Builds a success response carrying the given payload. */
export function success<T>(payload: T): { status: "success"; payload: T };
/** Builds a success response with no payload. */
export function success(payload?: undefined): { status: "success"; payload: undefined };
export function success<T>(payload?: T) {
  const response = { status: "success", payload };
  return response;
}
|
||||||
|
|
||||||
|
type SuccessType<T> = ReturnType<typeof success<T>>;
|
||||||
|
type ErrorType = ReturnType<typeof error>;
|
||||||
|
|
||||||
|
/**
 * Used client-side to report generic errors.
 *
 * When the response is an error, shows its message in an error toast.
 *
 * @param response - A success or error response object.
 * @returns `true` (narrowing `response` to the error type) if an error was
 *   reported, otherwise `false`.
 */
export function maybeReportError<T>(response: SuccessType<T> | ErrorType): response is ErrorType {
  // Nothing to report for successful responses.
  if (response.status !== "error") return false;

  toast({
    description: response.message,
    status: "error",
    duration: 5000,
    isClosable: true,
  });
  return true;
}
|
||||||
@@ -4,6 +4,10 @@ import { configDefaults, defineConfig, type UserConfig } from "vitest/config";
|
|||||||
const config = defineConfig({
|
const config = defineConfig({
|
||||||
test: {
|
test: {
|
||||||
...configDefaults, // Extending Vitest's default options
|
...configDefaults, // Extending Vitest's default options
|
||||||
|
setupFiles: ["./src/tests/helpers/setup.ts"],
|
||||||
|
|
||||||
|
// Unfortunately using threads seems to cause issues with isolated-vm
|
||||||
|
threads: false,
|
||||||
},
|
},
|
||||||
plugins: [tsconfigPaths()],
|
plugins: [tsconfigPaths()],
|
||||||
}) as UserConfig;
|
}) as UserConfig;
|
||||||
|
|||||||