Dagger
Search

evaluator

No long description provided.

Installation

dagger install github.com/dagger/dagger/modules/evaluator@89166d06f037ebdf273caaba4ca2976f86d4e9c7

Entrypoint

Return Type
Evaluator !
Arguments
Name | Type | Default Value | Description
docs | File | - | The documentation for the tool calling scheme to generate a prompt for.
initialPrompt | File | - | An initial system prompt to evaluate and use as a starting point.
model | String | - | Model to use for the evaluator agent.
Example
dagger -m github.com/dagger/dagger/modules/evaluator@89166d06f037ebdf273caaba4ca2976f86d4e9c7 call
func (m *MyModule) Example() *dagger.Evaluator  {
	return dag.
			Evaluator()
}
@function
def example() -> dagger.Evaluator:
	return (
		dag.evaluator()
	)
@func()
example(): Evaluator {
	return dag
		.evaluator()
}

Types

Evaluator 🔗

docs() 🔗

Return Type
File !
Example
dagger -m github.com/dagger/dagger/modules/evaluator@89166d06f037ebdf273caaba4ca2976f86d4e9c7 call \
 docs
func (m *MyModule) Example() *dagger.File  {
	return dag.
			Evaluator().
			Docs()
}
@function
def example() -> dagger.File:
	return (
		dag.evaluator()
		.docs()
	)
@func()
example(): File {
	return dag
		.evaluator()
		.docs()
}

initialPrompt() 🔗

Return Type
File !
Example
dagger -m github.com/dagger/dagger/modules/evaluator@89166d06f037ebdf273caaba4ca2976f86d4e9c7 call \
 initial-prompt
func (m *MyModule) Example() *dagger.File  {
	return dag.
			Evaluator().
			InitialPrompt()
}
@function
def example() -> dagger.File:
	return (
		dag.evaluator()
		.initial_prompt()
	)
@func()
example(): File {
	return dag
		.evaluator()
		.initialPrompt()
}

evaluatorModel() 🔗

Return Type
String !
Example
dagger -m github.com/dagger/dagger/modules/evaluator@89166d06f037ebdf273caaba4ca2976f86d4e9c7 call \
 evaluator-model
func (m *MyModule) Example(ctx context.Context) string  {
	return dag.
			Evaluator().
			EvaluatorModel(ctx)
}
@function
async def example() -> str:
	return await (
		dag.evaluator()
		.evaluator_model()
	)
@func()
async example(): Promise<string> {
	return dag
		.evaluator()
		.evaluatorModel()
}

withEval() 🔗

Return Type
Evaluator !
Arguments
Name | Type | Default Value | Description
eval | Interface ! | - | No description provided
Example
dagger -m github.com/dagger/dagger/modules/evaluator@89166d06f037ebdf273caaba4ca2976f86d4e9c7 call \
 with-eval
func (m *MyModule) Example(eval ) *dagger.Evaluator  {
	return dag.
			Evaluator().
			WithEval(eval)
}
@function
def example(eval: ) -> dagger.Evaluator:
	return (
		dag.evaluator()
		.with_eval(eval)
	)
@func()
example(eval: ): Evaluator {
	return dag
		.evaluator()
		.withEval(eval)
}

withEvals() 🔗

Return Type
Evaluator !
Arguments
Name | Type | Default Value | Description
evals | [Interface ! ] ! | - | No description provided
Example
dagger -m github.com/dagger/dagger/modules/evaluator@89166d06f037ebdf273caaba4ca2976f86d4e9c7 call \
 with-evals
func (m *MyModule) Example(evals []) *dagger.Evaluator  {
	return dag.
			Evaluator().
			WithEvals(evals)
}
@function
def example(evals: List[]) -> dagger.Evaluator:
	return (
		dag.evaluator()
		.with_evals(evals)
	)
@func()
example(evals: []): Evaluator {
	return dag
		.evaluator()
		.withEvals(evals)
}

evalsAcrossModels() 🔗

Run evals across models.

Models run in parallel, and evals run in series, with all attempts in parallel.

Return Type
EvalsAcrossModels !
Arguments
Name | Type | Default Value | Description
evals | [String ! ] | - | Evals to run. Defaults to all.
models | [String ! ] | - | Models to run evals across. Defaults to all.
attempts | Integer | - | Attempts to run each eval. Defaults to a per-provider value.
systemPrompt | File | - | A system prompt to use.
Example
dagger -m github.com/dagger/dagger/modules/evaluator@89166d06f037ebdf273caaba4ca2976f86d4e9c7 call \
 evals-across-models
func (m *MyModule) Example() *dagger.EvaluatorEvalsAcrossModels  {
	return dag.
			Evaluator().
			EvalsAcrossModels()
}
@function
def example() -> dagger.EvaluatorEvalsAcrossModels:
	return (
		dag.evaluator()
		.evals_across_models()
	)
@func()
example(): EvaluatorEvalsAcrossModels {
	return dag
		.evaluator()
		.evalsAcrossModels()
}

systemPrompt() 🔗

Return Type
String !
Arguments
Name | Type | Default Value | Description
evalName | String | - | Run a particular eval, instead of leaving it open-ended.
Example
dagger -m github.com/dagger/dagger/modules/evaluator@89166d06f037ebdf273caaba4ca2976f86d4e9c7 call \
 system-prompt
func (m *MyModule) Example(ctx context.Context) string  {
	return dag.
			Evaluator().
			SystemPrompt(ctx)
}
@function
async def example() -> str:
	return await (
		dag.evaluator()
		.system_prompt()
	)
@func()
async example(): Promise<string> {
	return dag
		.evaluator()
		.systemPrompt()
}

explore() 🔗

Return Type
[String ! ] !
Example
dagger -m github.com/dagger/dagger/modules/evaluator@89166d06f037ebdf273caaba4ca2976f86d4e9c7 call \
 explore
func (m *MyModule) Example(ctx context.Context) []string  {
	return dag.
			Evaluator().
			Explore(ctx)
}
@function
async def example() -> List[str]:
	return await (
		dag.evaluator()
		.explore()
	)
@func()
async example(): Promise<string[]> {
	return dag
		.evaluator()
		.explore()
}

generateSystemPrompt() 🔗

Return Type
String !
Example
dagger -m github.com/dagger/dagger/modules/evaluator@89166d06f037ebdf273caaba4ca2976f86d4e9c7 call \
 generate-system-prompt
func (m *MyModule) Example(ctx context.Context) string  {
	return dag.
			Evaluator().
			GenerateSystemPrompt(ctx)
}
@function
async def example() -> str:
	return await (
		dag.evaluator()
		.generate_system_prompt()
	)
@func()
async example(): Promise<string> {
	return dag
		.evaluator()
		.generateSystemPrompt()
}

evaluate() 🔗

Return Type
String !
Arguments
Name | Type | Default Value | Description
model | String ! | - | No description provided
name | String ! | - | No description provided
attempts | Integer ! | 0 | No description provided
Example
dagger -m github.com/dagger/dagger/modules/evaluator@89166d06f037ebdf273caaba4ca2976f86d4e9c7 call \
 evaluate --model string --name string --attempts integer
func (m *MyModule) Example(ctx context.Context, model string, name string, attempts int) string  {
	return dag.
			Evaluator().
			Evaluate(ctx, model, name, attempts)
}
@function
async def example(model: str, name: str, attempts: int) -> str:
	return await (
		dag.evaluator()
		.evaluate(model, name, attempts)
	)
@func()
async example(model: string, name: string, attempts: number): Promise<string> {
	return dag
		.evaluator()
		.evaluate(model, name, attempts)
}

iterate() 🔗

Iterate continuously runs evals across all models.

Return Type
String !
Example
dagger -m github.com/dagger/dagger/modules/evaluator@89166d06f037ebdf273caaba4ca2976f86d4e9c7 call \
 iterate
func (m *MyModule) Example(ctx context.Context) string  {
	return dag.
			Evaluator().
			Iterate(ctx)
}
@function
async def example() -> str:
	return await (
		dag.evaluator()
		.iterate()
	)
@func()
async example(): Promise<string> {
	return dag
		.evaluator()
		.iterate()
}

compare() 🔗

Return Type
String !
Arguments
Name | Type | Default Value | Description
before | File ! | - | No description provided
after | File ! | - | No description provided
Example
dagger -m github.com/dagger/dagger/modules/evaluator@89166d06f037ebdf273caaba4ca2976f86d4e9c7 call \
 compare --before file:path --after file:path
func (m *MyModule) Example(ctx context.Context, before *dagger.File, after *dagger.File) string  {
	return dag.
			Evaluator().
			Compare(ctx, before, after)
}
@function
async def example(before: dagger.File, after: dagger.File) -> str:
	return await (
		dag.evaluator()
		.compare(before, after)
	)
@func()
async example(before: File, after: File): Promise<string> {
	return dag
		.evaluator()
		.compare(before, after)
}

EvalsAcrossModels 🔗

traceId() 🔗

Return Type
String !
Example
dagger -m github.com/dagger/dagger/modules/evaluator@89166d06f037ebdf273caaba4ca2976f86d4e9c7 call \
 evals-across-models \
 trace-id
func (m *MyModule) Example(ctx context.Context) string  {
	return dag.
			Evaluator().
			EvalsAcrossModels().
			TraceId(ctx)
}
@function
async def example() -> str:
	return await (
		dag.evaluator()
		.evals_across_models()
		.trace_id()
	)
@func()
async example(): Promise<string> {
	return dag
		.evaluator()
		.evalsAcrossModels()
		.traceId()
}

modelResults() 🔗

Return Type
[ModelResult ! ] !
Example
dagger -m github.com/dagger/dagger/modules/evaluator@89166d06f037ebdf273caaba4ca2976f86d4e9c7 call \
 evals-across-models \
 model-results
func (m *MyModule) Example() []*dagger.EvaluatorModelResult  {
	return dag.
			Evaluator().
			EvalsAcrossModels().
			ModelResults()
}
@function
def example() -> List[dagger.EvaluatorModelResult]:
	return (
		dag.evaluator()
		.evals_across_models()
		.model_results()
	)
@func()
example(): EvaluatorModelResult[] {
	return dag
		.evaluator()
		.evalsAcrossModels()
		.modelResults()
}

check() 🔗

Return Type
Void !
Example
dagger -m github.com/dagger/dagger/modules/evaluator@89166d06f037ebdf273caaba4ca2976f86d4e9c7 call \
 evals-across-models \
 check
func (m *MyModule) Example(ctx context.Context) error {
	return dag.
			Evaluator().
			EvalsAcrossModels().
			Check(ctx)
}
@function
async def example() -> None:
	return await (
		dag.evaluator()
		.evals_across_models()
		.check()
	)
@func()
async example(): Promise<void> {
	return dag
		.evaluator()
		.evalsAcrossModels()
		.check()
}

csv() 🔗

Return Type
String !
Arguments
Name | Type | Default Value | Description
noHeader | Boolean ! | false | Don't include a header.
Example
dagger -m github.com/dagger/dagger/modules/evaluator@89166d06f037ebdf273caaba4ca2976f86d4e9c7 call \
 evals-across-models \
 csv --no-header boolean
func (m *MyModule) Example(ctx context.Context, noHeader bool) string  {
	return dag.
			Evaluator().
			EvalsAcrossModels().
			Csv(ctx, noHeader)
}
@function
async def example(no_header: bool) -> str:
	return await (
		dag.evaluator()
		.evals_across_models()
		.csv(no_header)
	)
@func()
async example(noHeader: boolean): Promise<string> {
	return dag
		.evaluator()
		.evalsAcrossModels()
		.csv(noHeader)
}

ModelResult 🔗

modelName() 🔗

Return Type
String !
Example
Function EvaluatorModelResult.modelName is not accessible from the evaluator module
Function EvaluatorModelResult.modelName is not accessible from the evaluator module
Function EvaluatorModelResult.modelName is not accessible from the evaluator module
Function EvaluatorModelResult.modelName is not accessible from the evaluator module

spanId() 🔗

Return Type
String !
Example
Function EvaluatorModelResult.spanId is not accessible from the evaluator module
Function EvaluatorModelResult.spanId is not accessible from the evaluator module
Function EvaluatorModelResult.spanId is not accessible from the evaluator module
Function EvaluatorModelResult.spanId is not accessible from the evaluator module

evalReports() 🔗

Return Type
[EvalResult ! ] !
Example
Function EvaluatorModelResult.evalReports is not accessible from the evaluator module
Function EvaluatorModelResult.evalReports is not accessible from the evaluator module
Function EvaluatorModelResult.evalReports is not accessible from the evaluator module
Function EvaluatorModelResult.evalReports is not accessible from the evaluator module

check() 🔗

Return Type
Void !
Example
Function EvaluatorModelResult.check is not accessible from the evaluator module
Function EvaluatorModelResult.check is not accessible from the evaluator module
Function EvaluatorModelResult.check is not accessible from the evaluator module
Function EvaluatorModelResult.check is not accessible from the evaluator module

EvalResult 🔗

name() 🔗

Return Type
String !
Example
Function EvaluatorEvalResult.name is not accessible from the evaluator module
Function EvaluatorEvalResult.name is not accessible from the evaluator module
Function EvaluatorEvalResult.name is not accessible from the evaluator module
Function EvaluatorEvalResult.name is not accessible from the evaluator module

spanId() 🔗

Return Type
String !
Example
Function EvaluatorEvalResult.spanId is not accessible from the evaluator module
Function EvaluatorEvalResult.spanId is not accessible from the evaluator module
Function EvaluatorEvalResult.spanId is not accessible from the evaluator module
Function EvaluatorEvalResult.spanId is not accessible from the evaluator module

error() 🔗

Return Type
String !
Example
Function EvaluatorEvalResult.error is not accessible from the evaluator module
Function EvaluatorEvalResult.error is not accessible from the evaluator module
Function EvaluatorEvalResult.error is not accessible from the evaluator module
Function EvaluatorEvalResult.error is not accessible from the evaluator module

report() 🔗

Return Type
String !
Example
Function EvaluatorEvalResult.report is not accessible from the evaluator module
Function EvaluatorEvalResult.report is not accessible from the evaluator module
Function EvaluatorEvalResult.report is not accessible from the evaluator module
Function EvaluatorEvalResult.report is not accessible from the evaluator module

successRate() 🔗

Return Type
Float !
Example
Function EvaluatorEvalResult.successRate is not accessible from the evaluator module
Function EvaluatorEvalResult.successRate is not accessible from the evaluator module
Function EvaluatorEvalResult.successRate is not accessible from the evaluator module
Function EvaluatorEvalResult.successRate is not accessible from the evaluator module

totalAttempts() 🔗

Return Type
Integer !
Example
Function EvaluatorEvalResult.totalAttempts is not accessible from the evaluator module
Function EvaluatorEvalResult.totalAttempts is not accessible from the evaluator module
Function EvaluatorEvalResult.totalAttempts is not accessible from the evaluator module
Function EvaluatorEvalResult.totalAttempts is not accessible from the evaluator module

inputTokens() 🔗

Return Type
Integer !
Example
Function EvaluatorEvalResult.inputTokens is not accessible from the evaluator module
Function EvaluatorEvalResult.inputTokens is not accessible from the evaluator module
Function EvaluatorEvalResult.inputTokens is not accessible from the evaluator module
Function EvaluatorEvalResult.inputTokens is not accessible from the evaluator module

outputTokens() 🔗

Return Type
Integer !
Example
Function EvaluatorEvalResult.outputTokens is not accessible from the evaluator module
Function EvaluatorEvalResult.outputTokens is not accessible from the evaluator module
Function EvaluatorEvalResult.outputTokens is not accessible from the evaluator module
Function EvaluatorEvalResult.outputTokens is not accessible from the evaluator module

check() 🔗

Return Type
Void !
Example
Function EvaluatorEvalResult.check is not accessible from the evaluator module
Function EvaluatorEvalResult.check is not accessible from the evaluator module
Function EvaluatorEvalResult.check is not accessible from the evaluator module
Function EvaluatorEvalResult.check is not accessible from the evaluator module