diff --git a/agenta-web/src/components/EvaluationTable/ABTestingEvaluationTable.tsx b/agenta-web/src/components/EvaluationTable/ABTestingEvaluationTable.tsx index 1d5651738f..b1610a4aa9 100644 --- a/agenta-web/src/components/EvaluationTable/ABTestingEvaluationTable.tsx +++ b/agenta-web/src/components/EvaluationTable/ABTestingEvaluationTable.tsx @@ -387,7 +387,13 @@ const ABTestingEvaluationTable: React.FC = ({ Run All exportABTestingEvaluationData(evaluation, rows)} + onClick={() => + exportABTestingEvaluationData( + evaluation, + evaluationScenarios, + rows, + ) + } disabled={false} > Export results diff --git a/agenta-web/src/components/EvaluationTable/SingleModelEvaluationTable.tsx b/agenta-web/src/components/EvaluationTable/SingleModelEvaluationTable.tsx index 6154060c01..8b731dad74 100644 --- a/agenta-web/src/components/EvaluationTable/SingleModelEvaluationTable.tsx +++ b/agenta-web/src/components/EvaluationTable/SingleModelEvaluationTable.tsx @@ -454,7 +454,13 @@ const SingleModelEvaluationTable: React.FC = ({ Run All exportSingleModelEvaluationData(evaluation, rows)} + onClick={() => + exportSingleModelEvaluationData( + evaluation, + evaluationScenarios, + rows, + ) + } disabled={false} > Export results diff --git a/agenta-web/src/lib/helpers/evaluate.ts b/agenta-web/src/lib/helpers/evaluate.ts index fb1b932da6..c4ce8f95b1 100644 --- a/agenta-web/src/lib/helpers/evaluate.ts +++ b/agenta-web/src/lib/helpers/evaluate.ts @@ -1,13 +1,24 @@ import {HumanEvaluationListTableDataType} from "@/components/Evaluations/HumanEvaluationResult" -import {Evaluation, GenericObject, Variant} from "../Types" +import {Evaluation, EvaluationScenario, GenericObject, Variant} from "../Types" import {convertToCsv, downloadCsv} from "./fileManipulations" -export const exportABTestingEvaluationData = (evaluation: Evaluation, rows: GenericObject[]) => { +export const exportABTestingEvaluationData = ( + evaluation: Evaluation, + scenarios: EvaluationScenario[], + rows: GenericObject[], +) => { const exportRow = rows.map((data, ix) => { + const inputColumns = evaluation.testset.testsetChatColumn + ? {Input: evaluation.testset.csvdata[ix]?.[evaluation.testset.testsetChatColumn]} + : data.inputs.reduce( + (columns: any, input: {input_name: string; input_value: string}) => { + columns[`${input.input_name}`] = input.input_value + return columns + }, + {}, + ) return { - ["Inputs"]: - evaluation.testset.csvdata[ix]?.[evaluation.testset.testsetChatColumn] || - data.inputs[0].input_value, + ...inputColumns, [`App Variant ${evaluation.variants[0].variantName} Output 0`]: data?.columnData0 ? data?.columnData0 : data.outputs[0]?.variant_output, @@ -17,6 +28,9 @@ export const exportABTestingEvaluationData = (evaluation: Evaluation, rows: Gene ["Vote"]: evaluation.variants.find((v: Variant) => v.variantId === data.vote)?.variantName || data.vote, + ["Expected answer"]: + scenarios[ix]?.correctAnswer || evaluation.testset.csvdata[ix].correct_answer, + ["Additional notes"]: scenarios[ix]?.note, } }) const exportCol = Object.keys(exportRow[0]) @@ -26,17 +40,31 @@ export const exportABTestingEvaluationData = (evaluation: Evaluation, rows: Gene downloadCsv(csvData, filename) } -export const exportSingleModelEvaluationData = (evaluation: Evaluation, rows: GenericObject[]) => { +export const exportSingleModelEvaluationData = ( + evaluation: Evaluation, + scenarios: EvaluationScenario[], + rows: GenericObject[], +) => { const exportRow = rows.map((data, ix) => { + const inputColumns = evaluation.testset.testsetChatColumn + ? {Input: evaluation.testset.csvdata[ix]?.[evaluation.testset.testsetChatColumn]} + : data.inputs.reduce( + (columns: any, input: {input_name: string; input_value: string}) => { + columns[`${input.input_name}`] = input.input_value + return columns + }, + {}, + ) const numericScore = parseInt(data.score) return { - ["Inputs"]: - evaluation.testset.csvdata[ix]?.[evaluation.testset.testsetChatColumn] || - data.inputs[0].input_value, + ...inputColumns, [`App Variant ${evaluation.variants[0].variantName} Output 0`]: data?.columnData0 ? data?.columnData0 : data.outputs[0]?.variant_output, ["Score"]: isNaN(numericScore) ? "-" : numericScore, + ["Expected answer"]: + scenarios[ix]?.correctAnswer || evaluation.testset.csvdata[ix].correct_answer, + ["Additional notes"]: scenarios[ix]?.note, } }) const exportCol = Object.keys(exportRow[0])