Skip to content

Commit

Permalink
Merge branch 'gh/vision-gpt-llm-app-temp' of https://github.com/Agent…
Browse files Browse the repository at this point in the history
…a-AI/agenta into feat/file-input-support-playground
  • Loading branch information
MohammedMaaz committed Dec 1, 2023
2 parents cc39449 + 521d2e8 commit 9caa502
Show file tree
Hide file tree
Showing 14 changed files with 128 additions and 27 deletions.
9 changes: 9 additions & 0 deletions .all-contributorsrc
Original file line number Diff line number Diff line change
Expand Up @@ -345,6 +345,15 @@
"contributions": [
"code"
]
},
{
"login": "brockWith",
"name": "brockWith",
"avatar_url": "https://avatars.githubusercontent.com/u/105627491?v=4",
"profile": "https://github.com/brockWith",
"contributions": [
"code"
]
}
],
"contributorsPerLine": 7,
Expand Down
3 changes: 2 additions & 1 deletion README.md
Original file line number Diff line number Diff line change
Expand Up @@ -231,7 +231,7 @@ Check out our [Contributing Guide](https://docs.agenta.ai/contributing/getting-s
## Contributors ✨

<!-- ALL-CONTRIBUTORS-BADGE:START - Do not remove or modify this section -->
[![All Contributors](https://img.shields.io/badge/all_contributors-36-orange.svg?style=flat-square)](#contributors-)
[![All Contributors](https://img.shields.io/badge/all_contributors-37-orange.svg?style=flat-square)](#contributors-)
<!-- ALL-CONTRIBUTORS-BADGE:END -->

Thanks goes to these wonderful people ([emoji key](https://allcontributors.org/docs/en/emoji-key)):
Expand Down Expand Up @@ -288,6 +288,7 @@ Thanks goes to these wonderful people ([emoji key](https://allcontributors.org/d
</tr>
<tr>
<td align="center" valign="top" width="14.28%"><a href="https://diegolikescode.me/"><img src="https://avatars.githubusercontent.com/u/57499868?v=4?s=100" width="100px;" alt="diego"/><br /><sub><b>diego</b></sub></a><br /><a href="https://github.com/Agenta-AI/agenta/commits?author=diegolikescode" title="Code">💻</a></td>
<td align="center" valign="top" width="14.28%"><a href="https://github.com/brockWith"><img src="https://avatars.githubusercontent.com/u/105627491?v=4?s=100" width="100px;" alt="brockWith"/><br /><sub><b>brockWith</b></sub></a><br /><a href="https://github.com/Agenta-AI/agenta/commits?author=brockWith" title="Code">💻</a></td>
</tr>
</tbody>
</table>
Expand Down
4 changes: 2 additions & 2 deletions agenta-web/prod.Dockerfile
Original file line number Diff line number Diff line change
Expand Up @@ -12,8 +12,8 @@ COPY public ./public
COPY next.config.js .
COPY tsconfig.json .
COPY postcss.config.js .
COPY .env .
# used in cloud
COPY .env.production .
# used in cloud
COPY sentry.* .
# Build the Next.js app for production
RUN npm run build
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -31,7 +31,7 @@ import {createUseStyles} from "react-jss"
import {exportAICritiqueEvaluationData} from "@/lib/helpers/evaluate"
import SecondaryButton from "../SecondaryButton/SecondaryButton"
import {useAppTheme} from "../Layout/ThemeContextProvider"
import {testsetRowToChatMessages} from "@/lib/helpers/testset"
import {contentToChatMessageString, testsetRowToChatMessages} from "@/lib/helpers/testset"

const {Title} = Typography

Expand Down Expand Up @@ -257,6 +257,7 @@ Answer ONLY with one of the given grading or evaluation options.
? testsetRowToChatMessages(evaluation.testset.csvdata[rowIndex], false)
: [],
)
if (variantData[idx].isChatVariant) result = contentToChatMessageString(result)

setRowValue(rowIndex, columnName as any, result)
await evaluate(rowIndex)
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -35,7 +35,7 @@ import {createUseStyles} from "react-jss"
import SecondaryButton from "../SecondaryButton/SecondaryButton"
import {exportCustomCodeEvaluationData} from "@/lib/helpers/evaluate"
import CodeBlock from "../DynamicCodeBlock/CodeBlock"
import {testsetRowToChatMessages} from "@/lib/helpers/testset"
import {contentToChatMessageString, testsetRowToChatMessages} from "@/lib/helpers/testset"

const {Title} = Typography

Expand Down Expand Up @@ -251,6 +251,7 @@ const CustomCodeRunEvaluationTable: React.FC<CustomCodeEvaluationTableProps> = (
? testsetRowToChatMessages(evaluation.testset.csvdata[rowIndex], false)
: [],
)
if (variantData[idx].isChatVariant) result = contentToChatMessageString(result)

setRowValue(rowIndex, columnName as any, result)
await evaluate(rowIndex)
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -28,7 +28,7 @@ import {evaluateWithExactMatch} from "@/lib/services/evaluations"
import {createUseStyles} from "react-jss"
import {exportExactEvaluationData} from "@/lib/helpers/evaluate"
import SecondaryButton from "../SecondaryButton/SecondaryButton"
import {testsetRowToChatMessages} from "@/lib/helpers/testset"
import {contentToChatMessageString, testsetRowToChatMessages} from "@/lib/helpers/testset"
import {Evaluation} from "@/lib/Types"

const {Title} = Typography
Expand Down Expand Up @@ -198,6 +198,7 @@ const ExactMatchEvaluationTable: React.FC<ExactMatchEvaluationTableProps> = ({
? testsetRowToChatMessages(evaluation.testset.csvdata[rowIndex], false)
: [],
)
if (variantData[idx].isChatVariant) result = contentToChatMessageString(result)

setRowValue(rowIndex, columnName, result)
setRowValue(rowIndex, "evaluationFlow", EvaluationFlow.COMPARISON_RUN_STARTED)
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -29,7 +29,7 @@ import {globalErrorHandler} from "@/lib/helpers/errorHandler"
import SecondaryButton from "../SecondaryButton/SecondaryButton"
import {exportRegexEvaluationData} from "@/lib/helpers/evaluate"
import {isValidRegex} from "@/lib/helpers/validators"
import {testsetRowToChatMessages} from "@/lib/helpers/testset"
import {contentToChatMessageString, testsetRowToChatMessages} from "@/lib/helpers/testset"

const {Title} = Typography

Expand Down Expand Up @@ -227,6 +227,7 @@ const RegexEvaluationTable: React.FC<RegexEvaluationTableProps> = ({
? testsetRowToChatMessages(evaluation.testset.csvdata[rowIndex], false)
: [],
)
if (variantData[idx].isChatVariant) result = contentToChatMessageString(result)

const {regexPattern, regexShouldMatch} = form.getFieldsValue()
const isCorrect = evaluateWithRegex(result, regexPattern, regexShouldMatch)
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -25,7 +25,7 @@ import {Typography} from "antd"
import {createUseStyles} from "react-jss"
import {exportSimilarityEvaluationData} from "@/lib/helpers/evaluate"
import SecondaryButton from "../SecondaryButton/SecondaryButton"
import {testsetRowToChatMessages} from "@/lib/helpers/testset"
import {contentToChatMessageString, testsetRowToChatMessages} from "@/lib/helpers/testset"

const {Title} = Typography

Expand Down Expand Up @@ -223,6 +223,7 @@ const SimilarityMatchEvaluationTable: React.FC<SimilarityMatchEvaluationTablePro
? testsetRowToChatMessages(evaluation.testset.csvdata[rowIndex], false)
: [],
)
if (variantData[idx].isChatVariant) result = contentToChatMessageString(result)

const {similarityThreshold} = form.getFieldsValue()
const similarity = evaluateWithSimilarityMatch(result, rows[rowIndex].correctAnswer)
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -28,7 +28,7 @@ import {globalErrorHandler} from "@/lib/helpers/errorHandler"
import {isValidUrl} from "@/lib/helpers/validators"
import SecondaryButton from "../SecondaryButton/SecondaryButton"
import {exportWebhookEvaluationData} from "@/lib/helpers/evaluate"
import {testsetRowToChatMessages} from "@/lib/helpers/testset"
import {contentToChatMessageString, testsetRowToChatMessages} from "@/lib/helpers/testset"

const {Title} = Typography

Expand Down Expand Up @@ -206,6 +206,7 @@ const WebhookEvaluationTable: React.FC<WebhookEvaluationTableProps> = ({
? testsetRowToChatMessages(evaluation.testset.csvdata[rowIndex], false)
: [],
)
if (variantData[idx].isChatVariant) result = contentToChatMessageString(result)

const {webhookUrl} = form.getFieldsValue()
const score = await evaluateWithWebhook(webhookUrl, {
Expand Down
10 changes: 10 additions & 0 deletions agenta-web/src/lib/helpers/axiosConfig.ts
Original file line number Diff line number Diff line change
@@ -1,5 +1,7 @@
import axiosApi from "axios"
import {getErrorMessage, globalErrorHandler} from "./errorHandler"
import {signOut} from "supertokens-auth-react/recipe/thirdpartypasswordless"
import router from "next/router"

const axios = axiosApi.create({
headers: {
Expand All @@ -20,6 +22,14 @@ axios.interceptors.response.use(
}`
error.message = msg

if (error.response?.status === 401) {
signOut()
.then(() => {
router.push("/auth")
})
.catch(console.error)
}

globalErrorHandler(error)

throw error
Expand Down
52 changes: 34 additions & 18 deletions agenta-web/src/lib/helpers/evaluate.ts
Original file line number Diff line number Diff line change
Expand Up @@ -2,10 +2,12 @@ import {HumanEvaluationListTableDataType} from "@/components/Evaluations/HumanEv
import {Evaluation, GenericObject, Variant} from "../Types"
import {convertToCsv, downloadCsv} from "./utils"

export const exportExactEvaluationData = (evaluation: any, rows: any[]) => {
const exportRow = rows.map((data) => {
export const exportExactEvaluationData = (evaluation: Evaluation, rows: GenericObject[]) => {
const exportRow = rows.map((data, ix) => {
return {
["Inputs"]: data.inputs[0].input_value,
["Inputs"]:
evaluation.testset.csvdata[ix]?.[evaluation.testset.testsetChatColumn] ||
data.inputs[0].input_value,
[`App Variant ${evaluation.variants[0].variantName} Output`]: data?.columnData0
? data?.columnData0
: data.outputs[0]?.variant_output,
Expand All @@ -20,10 +22,12 @@ export const exportExactEvaluationData = (evaluation: any, rows: any[]) => {
downloadCsv(csvData, filename)
}

export const exportSimilarityEvaluationData = (evaluation: any, rows: any[]) => {
const exportRow = rows.map((data) => {
export const exportSimilarityEvaluationData = (evaluation: Evaluation, rows: GenericObject[]) => {
const exportRow = rows.map((data, ix) => {
return {
["Inputs"]: data.inputs[0].input_value,
["Inputs"]:
evaluation.testset.csvdata[ix]?.[evaluation.testset.testsetChatColumn] ||
data.inputs[0].input_value,
[`App Variant ${evaluation.variants[0].variantName} Output`]: data?.columnData0
? data?.columnData0
: data.outputs[0]?.variant_output,
Expand All @@ -39,10 +43,12 @@ export const exportSimilarityEvaluationData = (evaluation: any, rows: any[]) =>
downloadCsv(csvData, filename)
}

export const exportAICritiqueEvaluationData = (evaluation: any, rows: any[]) => {
const exportRow = rows.map((data) => {
export const exportAICritiqueEvaluationData = (evaluation: Evaluation, rows: GenericObject[]) => {
const exportRow = rows.map((data, ix) => {
return {
["Inputs"]: data.inputs[0].input_value,
["Inputs"]:
evaluation.testset.csvdata[ix]?.[evaluation.testset.testsetChatColumn] ||
data.inputs[0].input_value,
[`App Variant ${evaluation.variants[0].variantName} Output`]: data?.columnData0
? data?.columnData0
: data.outputs[0]?.variant_output,
Expand Down Expand Up @@ -101,13 +107,19 @@ export const exportSingleModelEvaluationData = (evaluation: Evaluation, rows: Ge
downloadCsv(csvData, filename)
}

export const exportRegexEvaluationData = (evaluation: any, rows: any[], settings: any) => {
const exportRow = rows.map((data) => {
export const exportRegexEvaluationData = (
evaluation: Evaluation,
rows: GenericObject[],
settings: GenericObject,
) => {
const exportRow = rows.map((data, ix) => {
const isCorrect = data.score === "correct"
const isMatch = settings.regexShouldMatch ? isCorrect : !isCorrect

return {
["Inputs"]: data.inputs[0].input_value,
["Inputs"]:
evaluation.testset.csvdata[ix]?.[evaluation.testset.testsetChatColumn] ||
data.inputs[0].input_value,
[`App Variant ${evaluation.variants[0].variantName} Output`]: data?.columnData0
? data?.columnData0
: data.outputs[0]?.variant_output,
Expand All @@ -122,10 +134,12 @@ export const exportRegexEvaluationData = (evaluation: any, rows: any[], settings
downloadCsv(csvData, filename)
}

export const exportWebhookEvaluationData = (evaluation: any, rows: any[]) => {
const exportRow = rows.map((data) => {
export const exportWebhookEvaluationData = (evaluation: Evaluation, rows: GenericObject[]) => {
const exportRow = rows.map((data, ix) => {
return {
["Inputs"]: data.inputs[0].input_value,
["Inputs"]:
evaluation.testset.csvdata[ix]?.[evaluation.testset.testsetChatColumn] ||
data.inputs[0].input_value,
[`App Variant ${evaluation.variants[0].variantName} Output`]: data?.columnData0
? data?.columnData0
: data.outputs[0]?.variant_output,
Expand All @@ -140,10 +154,12 @@ export const exportWebhookEvaluationData = (evaluation: any, rows: any[]) => {
downloadCsv(csvData, filename)
}

export const exportCustomCodeEvaluationData = (evaluation: any, rows: any[]) => {
const exportRow = rows.map((data) => {
export const exportCustomCodeEvaluationData = (evaluation: Evaluation, rows: GenericObject[]) => {
const exportRow = rows.map((data, ix) => {
return {
["Inputs"]: data.inputs[0].input_value,
["Inputs"]:
evaluation.testset.csvdata[ix]?.[evaluation.testset.testsetChatColumn] ||
data.inputs[0].input_value,
[`App Variant ${evaluation.variants[0].variantName} Output`]: data?.columnData0
? data?.columnData0
: data.outputs[0]?.variant_output,
Expand Down
7 changes: 7 additions & 0 deletions agenta-web/src/lib/helpers/testset.ts
Original file line number Diff line number Diff line change
Expand Up @@ -52,3 +52,10 @@ export function testsetRowToChatMessages(rowData: KeyValuePair, includeCorrectAn

return chat
}

export function contentToChatMessageString(content: string, role: ChatRole = ChatRole.Assistant) {
return JSON.stringify({
content,
role,
})
}
50 changes: 50 additions & 0 deletions examples/vision_gpt_explain_image/app.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,50 @@
import agenta as ag
from openai import OpenAI


client = OpenAI()


SYSTEM_PROMPT = "You are an expert in reading images you look into details, you answer in accurate language."
HUMAN_PROMPT = "Please compare two images"

ag.init(app_name="explain_image", base_name="app")
ag.config.default(
temperature=ag.FloatParam(0.5, 0, 1),
max_tokens=ag.IntParam(300, 1, 4000),
prompt_system=ag.TextParam(SYSTEM_PROMPT),
prompt_human=ag.TextParam(HUMAN_PROMPT),
)


@ag.entrypoint
def explain(
image_one: ag.FileInputURL,
image_two: ag.FileInputURL,
) -> str:
messages = [{"role": "system", "content": ag.config.prompt_system}] + [
{
"role": "user",
"content": [
{"type": "text", "text": ag.config.prompt_human},
{
"type": "image_url",
"image_url": {
"url": image_one,
},
},
{
"type": "image_url",
"image_url": {
"url": image_two,
},
},
],
}
]
chat_completion = client.chat.completions.create(
model="gpt-4-vision-preview",
messages=messages,
max_tokens=max_tokens,
)
return chat_completion.choices[0].message.content
2 changes: 2 additions & 0 deletions examples/vision_gpt_explain_image/requirements.txt
Original file line number Diff line number Diff line change
@@ -0,0 +1,2 @@
agenta
openai

0 comments on commit 9caa502

Please sign in to comment.