evals
No long description provided.
Installation
dagger install github.com/AmirulAndalib/dagger/modules/evals@751ff5db8813c9c9bd746933f81a5fe3c6d2ee48

Entrypoint
Return Type
Evals Example
dagger -m github.com/AmirulAndalib/dagger/modules/evals@751ff5db8813c9c9bd746933f81a5fe3c6d2ee48 call \

func (m *MyModule) Example() *dagger.Evals {
	return dag.
		Evals()
}

@function
def example() -> dagger.Evals:
    return (
        dag.evals()
    )

@func()
example(): Evals {
  return dag
    .evals()
}

Types
Evals 🔗
Dagger's eval suite.
workspacePattern() 🔗
Test the common workspace pattern.
Return Type
WorkspacePattern !

Example

dagger -m github.com/AmirulAndalib/dagger/modules/evals@751ff5db8813c9c9bd746933f81a5fe3c6d2ee48 call \
 workspace-pattern

func (m *MyModule) Example() *dagger.EvalsWorkspacePattern {
	return dag.
		Evals().
		WorkspacePattern()
}

@function
def example() -> dagger.EvalsWorkspacePattern:
    return (
        dag.evals()
        .workspace_pattern()
    )

@func()
example(): EvalsWorkspacePattern {
  return dag
    .evals()
    .workspacePattern()
}

readImplicitVars() 🔗
Test that the LLM is able to access the content of variables without the user having to expand them in the prompt.
Return Type
ReadImplicitVars !
Example
dagger -m github.com/AmirulAndalib/dagger/modules/evals@751ff5db8813c9c9bd746933f81a5fe3c6d2ee48 call \
read-implicit-varsfunc (m *MyModule) Example() *dagger.EvalsReadImplicitVars {
return dag.
Evals().
ReadImplicitVars()
}@function
def example() -> dagger.EvalsReadImplicitVars:
return (
dag.evals()
.read_implicit_vars()
)@func()
example(): EvalsReadImplicitVars {
return dag
.evals()
.readImplicitVars()
}

basic() 🔗
Test basic prompting.
Return Type
Basic !
Example
dagger -m github.com/AmirulAndalib/dagger/modules/evals@751ff5db8813c9c9bd746933f81a5fe3c6d2ee48 call \
basicfunc (m *MyModule) Example() *dagger.EvalsBasic {
return dag.
Evals().
Basic()
}@function
def example() -> dagger.EvalsBasic:
return (
dag.evals()
.basic()
)@func()
example(): EvalsBasic {
return dag
.evals()
.basic()
}

lifeAlert() 🔗
Test manual intervention allowing the prompt to succeed.
Return Type
LifeAlert !
Example
dagger -m github.com/AmirulAndalib/dagger/modules/evals@751ff5db8813c9c9bd746933f81a5fe3c6d2ee48 call \
life-alertfunc (m *MyModule) Example() *dagger.EvalsLifeAlert {
return dag.
Evals().
LifeAlert()
}@function
def example() -> dagger.EvalsLifeAlert:
return (
dag.evals()
.life_alert()
)@func()
example(): EvalsLifeAlert {
return dag
.evals()
.lifeAlert()
}

buildMulti() 🔗
Test the model’s ability to pass objects around to one another and execute a series of operations given at once.
Return Type
BuildMulti !
Example
dagger -m github.com/AmirulAndalib/dagger/modules/evals@751ff5db8813c9c9bd746933f81a5fe3c6d2ee48 call \
build-multifunc (m *MyModule) Example() *dagger.EvalsBuildMulti {
return dag.
Evals().
BuildMulti()
}@function
def example() -> dagger.EvalsBuildMulti:
return (
dag.evals()
.build_multi()
)@func()
example(): EvalsBuildMulti {
return dag
.evals()
.buildMulti()
}

responses() 🔗
Test various response types.
Return Type
Responses !
Example
dagger -m github.com/AmirulAndalib/dagger/modules/evals@751ff5db8813c9c9bd746933f81a5fe3c6d2ee48 call \
responsesfunc (m *MyModule) Example() *dagger.EvalsResponses {
return dag.
Evals().
Responses()
}@function
def example() -> dagger.EvalsResponses:
return (
dag.evals()
.responses()
)@func()
example(): EvalsResponses {
return dag
.evals()
.responses()
}

undoChanges() 🔗
Test the model’s eagerness to switch to prior states instead of mutating the current state to undo past actions.
Return Type
UndoChanges !
Example
dagger -m github.com/AmirulAndalib/dagger/modules/evals@751ff5db8813c9c9bd746933f81a5fe3c6d2ee48 call \
undo-changesfunc (m *MyModule) Example() *dagger.EvalsUndoChanges {
return dag.
Evals().
UndoChanges()
}@function
def example() -> dagger.EvalsUndoChanges:
return (
dag.evals()
.undo_changes()
)@func()
example(): EvalsUndoChanges {
return dag
.evals()
.undoChanges()
}

coreApi() 🔗
Test that the model is conscious of a “current state” without needing explicit prompting.
Return Type
CoreApi !
Example
dagger -m github.com/AmirulAndalib/dagger/modules/evals@751ff5db8813c9c9bd746933f81a5fe3c6d2ee48 call \
core-apifunc (m *MyModule) Example() *dagger.EvalsCoreApi {
return dag.
Evals().
CoreApi()
}@function
def example() -> dagger.EvalsCoreApi:
return (
dag.evals()
.core_api()
)@func()
example(): EvalsCoreApi {
return dag
.evals()
.coreApi()
}

moduleDependencies() 🔗
Test that the model is conscious of a “current state” without needing explicit prompting.
Return Type
ModuleDependencies !
Example
dagger -m github.com/AmirulAndalib/dagger/modules/evals@751ff5db8813c9c9bd746933f81a5fe3c6d2ee48 call \
module-dependenciesfunc (m *MyModule) Example() *dagger.EvalsModuleDependencies {
return dag.
Evals().
ModuleDependencies()
}@function
def example() -> dagger.EvalsModuleDependencies:
return (
dag.evals()
.module_dependencies()
)@func()
example(): EvalsModuleDependencies {
return dag
.evals()
.moduleDependencies()
}

buildMultiNoVar() 🔗
BuildMultiNoVar is like BuildMulti but without explicitly referencing the relevant objects, leaving the LLM to figure it out.
Return Type
BuildMultiNoVar !
Example
dagger -m github.com/AmirulAndalib/dagger/modules/evals@751ff5db8813c9c9bd746933f81a5fe3c6d2ee48 call \
build-multi-no-varfunc (m *MyModule) Example() *dagger.EvalsBuildMultiNoVar {
return dag.
Evals().
BuildMultiNoVar()
}@function
def example() -> dagger.EvalsBuildMultiNoVar:
return (
dag.evals()
.build_multi_no_var()
)@func()
example(): EvalsBuildMultiNoVar {
return dag
.evals()
.buildMultiNoVar()
}

WorkspacePattern 🔗
name() 🔗
Return Type
String !
Example
dagger -m github.com/AmirulAndalib/dagger/modules/evals@751ff5db8813c9c9bd746933f81a5fe3c6d2ee48 call \
workspace-pattern \
namefunc (m *MyModule) Example(ctx context.Context) string {
return dag.
Evals().
WorkspacePattern().
Name(ctx)
}@function
async def example() -> str:
return await (
dag.evals()
.workspace_pattern()
.name()
)@func()
async example(): Promise<string> {
return dag
.evals()
.workspacePattern()
.name()
}

prompt() 🔗
Return Type
LLM !
Arguments
| Name | Type | Default Value | Description |
|---|---|---|---|
| base | LLM ! | - | No description provided |
Example
echo 'Custom types are not supported in shell examples'func (m *MyModule) Example(base *dagger.LLM) *dagger.LLM {
return dag.
Evals().
WorkspacePattern().
Prompt(base)
}@function
def example(base: dagger.LLM) -> dagger.LLM:
return (
dag.evals()
.workspace_pattern()
.prompt(base)
)@func()
example(base: LLM): LLM {
return dag
.evals()
.workspacePattern()
.prompt(base)
}

check() 🔗
Return Type
Void !
Arguments
| Name | Type | Default Value | Description |
|---|---|---|---|
| prompt | LLM ! | - | No description provided |
Example
echo 'Custom types are not supported in shell examples'func (m *MyModule) Example(ctx context.Context, prompt *dagger.LLM) {
return dag.
Evals().
WorkspacePattern().
Check(ctx, prompt)
}@function
async def example(prompt: dagger.LLM) -> None:
return await (
dag.evals()
.workspace_pattern()
.check(prompt)
)@func()
async example(prompt: LLM): Promise<void> {
return dag
.evals()
.workspacePattern()
.check(prompt)
}

ReadImplicitVars 🔗
weirdText() 🔗
Return Type
String !
Example
dagger -m github.com/AmirulAndalib/dagger/modules/evals@751ff5db8813c9c9bd746933f81a5fe3c6d2ee48 call \
read-implicit-vars \
weird-textfunc (m *MyModule) Example(ctx context.Context) string {
return dag.
Evals().
ReadImplicitVars().
WeirdText(ctx)
}@function
async def example() -> str:
return await (
dag.evals()
.read_implicit_vars()
.weird_text()
)@func()
async example(): Promise<string> {
return dag
.evals()
.readImplicitVars()
.weirdText()
}

name() 🔗
Return Type
String !
Example
dagger -m github.com/AmirulAndalib/dagger/modules/evals@751ff5db8813c9c9bd746933f81a5fe3c6d2ee48 call \
read-implicit-vars \
namefunc (m *MyModule) Example(ctx context.Context) string {
return dag.
Evals().
ReadImplicitVars().
Name(ctx)
}@function
async def example() -> str:
return await (
dag.evals()
.read_implicit_vars()
.name()
)@func()
async example(): Promise<string> {
return dag
.evals()
.readImplicitVars()
.name()
}

prompt() 🔗
Return Type
LLM !
Arguments
| Name | Type | Default Value | Description |
|---|---|---|---|
| base | LLM ! | - | No description provided |
Example
echo 'Custom types are not supported in shell examples'func (m *MyModule) Example(base *dagger.LLM) *dagger.LLM {
return dag.
Evals().
ReadImplicitVars().
Prompt(base)
}@function
def example(base: dagger.LLM) -> dagger.LLM:
return (
dag.evals()
.read_implicit_vars()
.prompt(base)
)@func()
example(base: LLM): LLM {
return dag
.evals()
.readImplicitVars()
.prompt(base)
}

check() 🔗
Return Type
Void !
Arguments
| Name | Type | Default Value | Description |
|---|---|---|---|
| prompt | LLM ! | - | No description provided |
Example
echo 'Custom types are not supported in shell examples'func (m *MyModule) Example(ctx context.Context, prompt *dagger.LLM) {
return dag.
Evals().
ReadImplicitVars().
Check(ctx, prompt)
}@function
async def example(prompt: dagger.LLM) -> None:
return await (
dag.evals()
.read_implicit_vars()
.check(prompt)
)@func()
async example(prompt: LLM): Promise<void> {
return dag
.evals()
.readImplicitVars()
.check(prompt)
}

Basic 🔗
name() 🔗
Return Type
String !
Example
dagger -m github.com/AmirulAndalib/dagger/modules/evals@751ff5db8813c9c9bd746933f81a5fe3c6d2ee48 call \
basic \
namefunc (m *MyModule) Example(ctx context.Context) string {
return dag.
Evals().
Basic().
Name(ctx)
}@function
async def example() -> str:
return await (
dag.evals()
.basic()
.name()
)@func()
async example(): Promise<string> {
return dag
.evals()
.basic()
.name()
}

prompt() 🔗
Return Type
LLM !
Arguments
| Name | Type | Default Value | Description |
|---|---|---|---|
| base | LLM ! | - | No description provided |
Example
echo 'Custom types are not supported in shell examples'func (m *MyModule) Example(base *dagger.LLM) *dagger.LLM {
return dag.
Evals().
Basic().
Prompt(base)
}@function
def example(base: dagger.LLM) -> dagger.LLM:
return (
dag.evals()
.basic()
.prompt(base)
)@func()
example(base: LLM): LLM {
return dag
.evals()
.basic()
.prompt(base)
}

check() 🔗
Return Type
Void !
Arguments
| Name | Type | Default Value | Description |
|---|---|---|---|
| prompt | LLM ! | - | No description provided |
Example
echo 'Custom types are not supported in shell examples'func (m *MyModule) Example(ctx context.Context, prompt *dagger.LLM) {
return dag.
Evals().
Basic().
Check(ctx, prompt)
}@function
async def example(prompt: dagger.LLM) -> None:
return await (
dag.evals()
.basic()
.check(prompt)
)@func()
async example(prompt: LLM): Promise<void> {
return dag
.evals()
.basic()
.check(prompt)
}

LifeAlert 🔗
name() 🔗
Return Type
String !
Example
dagger -m github.com/AmirulAndalib/dagger/modules/evals@751ff5db8813c9c9bd746933f81a5fe3c6d2ee48 call \
life-alert \
namefunc (m *MyModule) Example(ctx context.Context) string {
return dag.
Evals().
LifeAlert().
Name(ctx)
}@function
async def example() -> str:
return await (
dag.evals()
.life_alert()
.name()
)@func()
async example(): Promise<string> {
return dag
.evals()
.lifeAlert()
.name()
}

prompt() 🔗
Return Type
LLM !
Arguments
| Name | Type | Default Value | Description |
|---|---|---|---|
| base | LLM ! | - | No description provided |
Example
echo 'Custom types are not supported in shell examples'func (m *MyModule) Example(base *dagger.LLM) *dagger.LLM {
return dag.
Evals().
LifeAlert().
Prompt(base)
}@function
def example(base: dagger.LLM) -> dagger.LLM:
return (
dag.evals()
.life_alert()
.prompt(base)
)@func()
example(base: LLM): LLM {
return dag
.evals()
.lifeAlert()
.prompt(base)
}

check() 🔗
Return Type
Void !
Arguments
| Name | Type | Default Value | Description |
|---|---|---|---|
| prompt | LLM ! | - | No description provided |
Example
echo 'Custom types are not supported in shell examples'func (m *MyModule) Example(ctx context.Context, prompt *dagger.LLM) {
return dag.
Evals().
LifeAlert().
Check(ctx, prompt)
}@function
async def example(prompt: dagger.LLM) -> None:
return await (
dag.evals()
.life_alert()
.check(prompt)
)@func()
async example(prompt: LLM): Promise<void> {
return dag
.evals()
.lifeAlert()
.check(prompt)
}

BuildMulti 🔗
name() 🔗
Return Type
String !
Example
dagger -m github.com/AmirulAndalib/dagger/modules/evals@751ff5db8813c9c9bd746933f81a5fe3c6d2ee48 call \
build-multi \
namefunc (m *MyModule) Example(ctx context.Context) string {
return dag.
Evals().
BuildMulti().
Name(ctx)
}@function
async def example() -> str:
return await (
dag.evals()
.build_multi()
.name()
)@func()
async example(): Promise<string> {
return dag
.evals()
.buildMulti()
.name()
}

prompt() 🔗
Return Type
LLM !
Arguments
| Name | Type | Default Value | Description |
|---|---|---|---|
| base | LLM ! | - | No description provided |
Example
echo 'Custom types are not supported in shell examples'func (m *MyModule) Example(base *dagger.LLM) *dagger.LLM {
return dag.
Evals().
BuildMulti().
Prompt(base)
}@function
def example(base: dagger.LLM) -> dagger.LLM:
return (
dag.evals()
.build_multi()
.prompt(base)
)@func()
example(base: LLM): LLM {
return dag
.evals()
.buildMulti()
.prompt(base)
}

check() 🔗
Return Type
Void !
Arguments
| Name | Type | Default Value | Description |
|---|---|---|---|
| prompt | LLM ! | - | No description provided |
Example
echo 'Custom types are not supported in shell examples'func (m *MyModule) Example(ctx context.Context, prompt *dagger.LLM) {
return dag.
Evals().
BuildMulti().
Check(ctx, prompt)
}@function
async def example(prompt: dagger.LLM) -> None:
return await (
dag.evals()
.build_multi()
.check(prompt)
)@func()
async example(prompt: LLM): Promise<void> {
return dag
.evals()
.buildMulti()
.check(prompt)
}

Responses 🔗
name() 🔗
Return Type
String !
Example
dagger -m github.com/AmirulAndalib/dagger/modules/evals@751ff5db8813c9c9bd746933f81a5fe3c6d2ee48 call \
responses \
namefunc (m *MyModule) Example(ctx context.Context) string {
return dag.
Evals().
Responses().
Name(ctx)
}@function
async def example() -> str:
return await (
dag.evals()
.responses()
.name()
)@func()
async example(): Promise<string> {
return dag
.evals()
.responses()
.name()
}

prompt() 🔗
Return Type
LLM !
Arguments
| Name | Type | Default Value | Description |
|---|---|---|---|
| base | LLM ! | - | No description provided |
Example
echo 'Custom types are not supported in shell examples'func (m *MyModule) Example(base *dagger.LLM) *dagger.LLM {
return dag.
Evals().
Responses().
Prompt(base)
}@function
def example(base: dagger.LLM) -> dagger.LLM:
return (
dag.evals()
.responses()
.prompt(base)
)@func()
example(base: LLM): LLM {
return dag
.evals()
.responses()
.prompt(base)
}

check() 🔗
Return Type
Void !
Arguments
| Name | Type | Default Value | Description |
|---|---|---|---|
| prompt | LLM ! | - | No description provided |
Example
echo 'Custom types are not supported in shell examples'func (m *MyModule) Example(ctx context.Context, prompt *dagger.LLM) {
return dag.
Evals().
Responses().
Check(ctx, prompt)
}@function
async def example(prompt: dagger.LLM) -> None:
return await (
dag.evals()
.responses()
.check(prompt)
)@func()
async example(prompt: LLM): Promise<void> {
return dag
.evals()
.responses()
.check(prompt)
}

UndoChanges 🔗
name() 🔗
Return Type
String !
Example
dagger -m github.com/AmirulAndalib/dagger/modules/evals@751ff5db8813c9c9bd746933f81a5fe3c6d2ee48 call \
undo-changes \
namefunc (m *MyModule) Example(ctx context.Context) string {
return dag.
Evals().
UndoChanges().
Name(ctx)
}@function
async def example() -> str:
return await (
dag.evals()
.undo_changes()
.name()
)@func()
async example(): Promise<string> {
return dag
.evals()
.undoChanges()
.name()
}

prompt() 🔗
Return Type
LLM !
Arguments
| Name | Type | Default Value | Description |
|---|---|---|---|
| base | LLM ! | - | No description provided |
Example
echo 'Custom types are not supported in shell examples'func (m *MyModule) Example(base *dagger.LLM) *dagger.LLM {
return dag.
Evals().
UndoChanges().
Prompt(base)
}@function
def example(base: dagger.LLM) -> dagger.LLM:
return (
dag.evals()
.undo_changes()
.prompt(base)
)@func()
example(base: LLM): LLM {
return dag
.evals()
.undoChanges()
.prompt(base)
}

check() 🔗
Return Type
Void !
Arguments
| Name | Type | Default Value | Description |
|---|---|---|---|
| prompt | LLM ! | - | No description provided |
Example
echo 'Custom types are not supported in shell examples'func (m *MyModule) Example(ctx context.Context, prompt *dagger.LLM) {
return dag.
Evals().
UndoChanges().
Check(ctx, prompt)
}@function
async def example(prompt: dagger.LLM) -> None:
return await (
dag.evals()
.undo_changes()
.check(prompt)
)@func()
async example(prompt: LLM): Promise<void> {
return dag
.evals()
.undoChanges()
.check(prompt)
}

CoreApi 🔗
name() 🔗
Return Type
String !
Example
dagger -m github.com/AmirulAndalib/dagger/modules/evals@751ff5db8813c9c9bd746933f81a5fe3c6d2ee48 call \
core-api \
namefunc (m *MyModule) Example(ctx context.Context) string {
return dag.
Evals().
CoreApi().
Name(ctx)
}@function
async def example() -> str:
return await (
dag.evals()
.core_api()
.name()
)@func()
async example(): Promise<string> {
return dag
.evals()
.coreApi()
.name()
}

prompt() 🔗
Return Type
LLM !
Arguments
| Name | Type | Default Value | Description |
|---|---|---|---|
| base | LLM ! | - | No description provided |
Example
echo 'Custom types are not supported in shell examples'func (m *MyModule) Example(base *dagger.LLM) *dagger.LLM {
return dag.
Evals().
CoreApi().
Prompt(base)
}@function
def example(base: dagger.LLM) -> dagger.LLM:
return (
dag.evals()
.core_api()
.prompt(base)
)@func()
example(base: LLM): LLM {
return dag
.evals()
.coreApi()
.prompt(base)
}

check() 🔗
Return Type
Void !
Arguments
| Name | Type | Default Value | Description |
|---|---|---|---|
| prompt | LLM ! | - | No description provided |
Example
echo 'Custom types are not supported in shell examples'func (m *MyModule) Example(ctx context.Context, prompt *dagger.LLM) {
return dag.
Evals().
CoreApi().
Check(ctx, prompt)
}@function
async def example(prompt: dagger.LLM) -> None:
return await (
dag.evals()
.core_api()
.check(prompt)
)@func()
async example(prompt: LLM): Promise<void> {
return dag
.evals()
.coreApi()
.check(prompt)
}

ModuleDependencies 🔗
name() 🔗
Return Type
String !
Example
dagger -m github.com/AmirulAndalib/dagger/modules/evals@751ff5db8813c9c9bd746933f81a5fe3c6d2ee48 call \
module-dependencies \
namefunc (m *MyModule) Example(ctx context.Context) string {
return dag.
Evals().
ModuleDependencies().
Name(ctx)
}@function
async def example() -> str:
return await (
dag.evals()
.module_dependencies()
.name()
)@func()
async example(): Promise<string> {
return dag
.evals()
.moduleDependencies()
.name()
}

prompt() 🔗
Return Type
LLM !
Arguments
| Name | Type | Default Value | Description |
|---|---|---|---|
| base | LLM ! | - | No description provided |
Example
echo 'Custom types are not supported in shell examples'func (m *MyModule) Example(base *dagger.LLM) *dagger.LLM {
return dag.
Evals().
ModuleDependencies().
Prompt(base)
}@function
def example(base: dagger.LLM) -> dagger.LLM:
return (
dag.evals()
.module_dependencies()
.prompt(base)
)@func()
example(base: LLM): LLM {
return dag
.evals()
.moduleDependencies()
.prompt(base)
}

check() 🔗
Return Type
Void !
Arguments
| Name | Type | Default Value | Description |
|---|---|---|---|
| prompt | LLM ! | - | No description provided |
Example
echo 'Custom types are not supported in shell examples'func (m *MyModule) Example(ctx context.Context, prompt *dagger.LLM) {
return dag.
Evals().
ModuleDependencies().
Check(ctx, prompt)
}@function
async def example(prompt: dagger.LLM) -> None:
return await (
dag.evals()
.module_dependencies()
.check(prompt)
)@func()
async example(prompt: LLM): Promise<void> {
return dag
.evals()
.moduleDependencies()
.check(prompt)
}

BuildMultiNoVar 🔗
name() 🔗
Return Type
String !
Example
dagger -m github.com/AmirulAndalib/dagger/modules/evals@751ff5db8813c9c9bd746933f81a5fe3c6d2ee48 call \
build-multi-no-var \
namefunc (m *MyModule) Example(ctx context.Context) string {
return dag.
Evals().
BuildMultiNoVar().
Name(ctx)
}@function
async def example() -> str:
return await (
dag.evals()
.build_multi_no_var()
.name()
)@func()
async example(): Promise<string> {
return dag
.evals()
.buildMultiNoVar()
.name()
}

prompt() 🔗
Return Type
LLM !
Arguments
| Name | Type | Default Value | Description |
|---|---|---|---|
| base | LLM ! | - | No description provided |
Example
echo 'Custom types are not supported in shell examples'func (m *MyModule) Example(base *dagger.LLM) *dagger.LLM {
return dag.
Evals().
BuildMultiNoVar().
Prompt(base)
}@function
def example(base: dagger.LLM) -> dagger.LLM:
return (
dag.evals()
.build_multi_no_var()
.prompt(base)
)@func()
example(base: LLM): LLM {
return dag
.evals()
.buildMultiNoVar()
.prompt(base)
}

check() 🔗
Return Type
Void !
Arguments
| Name | Type | Default Value | Description |
|---|---|---|---|
| prompt | LLM ! | - | No description provided |
Example
echo 'Custom types are not supported in shell examples'func (m *MyModule) Example(ctx context.Context, prompt *dagger.LLM) {
return dag.
Evals().
BuildMultiNoVar().
Check(ctx, prompt)
}@function
async def example(prompt: dagger.LLM) -> None:
return await (
dag.evals()
.build_multi_no_var()
.check(prompt)
)@func()
async example(prompt: LLM): Promise<void> {
return dag
.evals()
.buildMultiNoVar()
.check(prompt)
}