@@ -35,6 +35,7 @@ type Runner struct {
3535 envProvider environment.Provider
3636 ttyFd int
3737 only []string
38+ baseImage string
3839}
3940
4041// NewRunner creates a new evaluation runner.
@@ -48,16 +49,17 @@ func NewRunner(agentSource config.Source, runConfig *config.RuntimeConfig, evals
4849 envProvider : runConfig .EnvProvider (),
4950 ttyFd : cfg .TTYFd ,
5051 only : cfg .Only ,
52+ baseImage : cfg .BaseImage ,
5153 }
5254}
5355
5456// Evaluate is the main entry point for running evaluations. It generates a run name with GenerateRunName and delegates to EvaluateWithName, forwarding all of its other arguments unchanged and returning that call's result.
55- func Evaluate (ctx context.Context , out io.Writer , isTTY bool , ttyFd int , agentFilename , evalsDir string , runConfig * config.RuntimeConfig , concurrency int , judgeModel provider.Provider , only []string ) (* EvalRun , error ) {
56- return EvaluateWithName (ctx , out , isTTY , ttyFd , GenerateRunName (), agentFilename , evalsDir , runConfig , concurrency , judgeModel , only )
57+ func Evaluate (ctx context.Context , out io.Writer , isTTY bool , ttyFd int , agentFilename , evalsDir string , runConfig * config.RuntimeConfig , concurrency int , judgeModel provider.Provider , only []string , baseImage string ) (* EvalRun , error ) {
58+ return EvaluateWithName (ctx , out , isTTY , ttyFd , GenerateRunName (), agentFilename , evalsDir , runConfig , concurrency , judgeModel , only , baseImage )
5759}
5860
5961// EvaluateWithName runs evaluations with a specified run name.
60- func EvaluateWithName (ctx context.Context , out io.Writer , isTTY bool , ttyFd int , runName , agentFilename , evalsDir string , runConfig * config.RuntimeConfig , concurrency int , judgeModel provider.Provider , only []string ) (* EvalRun , error ) {
62+ func EvaluateWithName (ctx context.Context , out io.Writer , isTTY bool , ttyFd int , runName , agentFilename , evalsDir string , runConfig * config.RuntimeConfig , concurrency int , judgeModel provider.Provider , only []string , baseImage string ) (* EvalRun , error ) {
6163 agentSource , err := config .Resolve (agentFilename )
6264 if err != nil {
6365 return nil , fmt .Errorf ("resolving agent: %w" , err )
@@ -68,6 +70,7 @@ func EvaluateWithName(ctx context.Context, out io.Writer, isTTY bool, ttyFd int,
6870 JudgeModel : judgeModel ,
6971 TTYFd : ttyFd ,
7072 Only : only ,
73+ BaseImage : baseImage ,
7174 })
7275
7376 fmt .Fprintf (out , "Evaluation run: %s\n " , runName )
0 commit comments