agsamantha/node_modules/langsmith/dist/evaluation/evaluator.js

95 lines
3.2 KiB
JavaScript
Raw Normal View History

2024-10-02 20:15:21 +00:00
import { v4 as uuidv4 } from "uuid";
import { traceable } from "../traceable.js";
/**
* Wraps an evaluator function + implements the RunEvaluator interface.
*/
export class DynamicRunEvaluator {
constructor(evaluator) {
Object.defineProperty(this, "func", {
enumerable: true,
configurable: true,
writable: true,
value: void 0
});
this.func = ((input) => {
const { run, example } = input.langSmithRunAndExample;
return evaluator(run, example);
});
}
isEvaluationResults(x) {
return (typeof x === "object" &&
x != null &&
"results" in x &&
Array.isArray(x.results) &&
x.results.length > 0);
}
coerceEvaluationResults(results, sourceRunId) {
if (this.isEvaluationResults(results)) {
return {
results: results.results.map((r) => this.coerceEvaluationResult(r, sourceRunId, false)),
};
}
return this.coerceEvaluationResult(results, sourceRunId, true);
}
coerceEvaluationResult(result, sourceRunId, allowNoKey = false) {
if ("key" in result) {
if (!result.sourceRunId) {
result.sourceRunId = sourceRunId;
}
return result;
}
if (!("key" in result)) {
if (allowNoKey) {
result["key"] = this.func.name;
}
}
return {
sourceRunId,
...result,
};
}
/**
* Evaluates a run with an optional example and returns the evaluation result.
* @param run The run to evaluate.
* @param example The optional example to use for evaluation.
* @returns A promise that extracts to the evaluation result.
*/
async evaluateRun(run, example, options) {
const sourceRunId = uuidv4();
const metadata = {
targetRunId: run.id,
};
if ("session_id" in run) {
metadata["experiment"] = run.session_id;
}
if (typeof this.func !== "function") {
throw new Error("Target must be runnable function");
}
const wrappedTraceableFunc = traceable(this.func, {
project_name: "evaluators",
name: "evaluator",
id: sourceRunId,
...options,
});
const result = (await wrappedTraceableFunc(
// Pass data via `langSmithRunAndExample` key to avoid conflicts with other
// inputs. This key is extracted in the wrapped function, with `run` and
// `example` passed to evaluator function as arguments.
{ langSmithRunAndExample: { run, example } }, { metadata }));
// Check the one required property of EvaluationResult since 'instanceof' is not possible
if ("key" in result) {
if (!result.sourceRunId) {
result.sourceRunId = sourceRunId;
}
return result;
}
if (typeof result !== "object") {
throw new Error("Evaluator function must return an object.");
}
return this.coerceEvaluationResults(result, sourceRunId);
}
}
export function runEvaluator(func) {
return new DynamicRunEvaluator(func);
}