@@ -9,22 +9,10 @@ import { evaluationAgent } from '../agents/evaluationAgent'
99import { imageToCsvAgent } from '../agents/image_to_csv'
1010import { csvToExcalidrawAgent } from '../agents/csv_to_excalidraw'
1111import { weatherAgent } from '../agents/weather-agent'
12- import {
13- structureScorer ,
14- creativityScorer ,
15- sqlValidityScorer ,
16- toneConsistencyScorer ,
17- responseQualityScorer ,
18- scriptFormatScorer ,
19- pacingScorer ,
20- financialDataScorer ,
21- sourceDiversityScorer ,
22- csvValidityScorer ,
23- factualityScorer
24- } from '../scorers'
12+ import { log } from '../config/logger' ;
2513
2614export async function runContentStrategistExperiment ( ) {
27- console . log ( 'Running Content Strategist Experiment...' )
15+ log . info ( 'Running Content Strategist Experiment' , { event : 'Running Content Strategist Experiment' } )
2816 const results = await runEvals ( {
2917 target : contentStrategistAgent ,
3018 data : [
@@ -38,14 +26,14 @@ export async function runContentStrategistExperiment() {
3826 input : 'Plan a blog series for a B2B SaaS accounting tool. Target audience: CFOs. Tone: Professional and authoritative.'
3927 }
4028 ] ,
41- scorers : [ structureScorer , creativityScorer , toneConsistencyScorer ]
29+ scorers : [ ]
4230 } )
43- console . log ( 'Content Strategist Experiment Results: ' , JSON . stringify ( results , null , 2 ) )
31+ log . info ( 'Content Strategist Experiment Results' , { results : JSON . stringify ( results , null , 2 ) } )
4432 return results
4533}
4634
4735export async function runCopywriterExperiment ( ) {
48- console . log ( 'Running Copywriter Experiment...' )
36+ log . info ( 'Running Copywriter Experiment...' )
4937 const results = await runEvals ( {
5038 target : copywriterAgent ,
5139 data : [
@@ -59,14 +47,14 @@ export async function runCopywriterExperiment() {
5947 input : 'Write a product description for a luxury watch. Tone: Sophisticated and elegant.' ,
6048 }
6149 ] ,
62- scorers : [ toneConsistencyScorer , creativityScorer , responseQualityScorer ]
50+ scorers : [ ]
6351 } )
64- console . log ( 'Copywriter Experiment Results:' , JSON . stringify ( results , null , 2 ) )
52+ log . info ( 'Copywriter Experiment Results:' , { results : JSON . stringify ( results , null , 2 ) } )
6553 return results
6654}
6755
6856export async function runScriptWriterExperiment ( ) {
69- console . log ( 'Running Script Writer Experiment...' )
57+ log . info ( 'Running Script Writer Experiment...' )
7058 const results = await runEvals ( {
7159 target : scriptWriterAgent ,
7260 data : [
@@ -77,14 +65,14 @@ export async function runScriptWriterExperiment() {
7765 input : 'Create a YouTube intro for a tech review channel.' ,
7866 }
7967 ] ,
80- scorers : [ scriptFormatScorer , pacingScorer , creativityScorer ]
68+ scorers : [ ]
8169 } )
82- console . log ( 'Script Writer Experiment Results:' , JSON . stringify ( results , null , 2 ) )
70+ log . info ( 'Script Writer Experiment Results:' , { results : JSON . stringify ( results , null , 2 ) } )
8371 return results
8472}
8573
8674export async function runStockAnalysisExperiment ( ) {
87- console . log ( 'Running Stock Analysis Experiment...' )
75+ log . info ( 'Running Stock Analysis Experiment...' )
8876 const results = await runEvals ( {
8977 target : stockAnalysisAgent ,
9078 data : [
@@ -95,14 +83,14 @@ export async function runStockAnalysisExperiment() {
9583 input : 'Should I buy TSLA right now?' ,
9684 }
9785 ] ,
98- scorers : [ financialDataScorer , responseQualityScorer , sourceDiversityScorer ]
86+ scorers : [ ]
9987 } )
100- console . log ( 'Stock Analysis Experiment Results:' , JSON . stringify ( results , null , 2 ) )
88+ log . info ( 'Stock Analysis Experiment Results:' , { results : JSON . stringify ( results , null , 2 ) } )
10189 return results
10290}
10391
10492export async function runReportAgentExperiment ( ) {
105- console . log ( 'Running Report Agent Experiment...' )
93+ log . info ( 'Running Report Agent Experiment...' )
10694 const results = await runEvals ( {
10795 target : reportAgent ,
10896 data : [
@@ -113,74 +101,74 @@ export async function runReportAgentExperiment() {
113101 input : 'Summarize the key findings from the user research interviews.' ,
114102 }
115103 ] ,
116- scorers : [ structureScorer , responseQualityScorer , factualityScorer ]
104+ scorers : [ ]
117105 } )
118- console . log ( 'Report Agent Experiment Results:' , JSON . stringify ( results , null , 2 ) )
106+ log . info ( 'Report Agent Experiment Results:' , { results : JSON . stringify ( results , null , 2 ) } )
119107 return results
120108}
121109
122110export async function runLearningExtractionExperiment ( ) {
123- console . log ( 'Running Learning Extraction Experiment...' )
111+ log . info ( 'Running Learning Extraction Experiment...' )
124112 const results = await runEvals ( {
125113 target : learningExtractionAgent ,
126114 data : [
127115 {
128116 input : 'Extract key learning points from this article about Rust ownership.'
129117 }
130118 ] ,
131- scorers : [ responseQualityScorer , factualityScorer ]
119+ scorers : [ ]
132120 } )
133- console . log ( 'Learning Extraction Experiment Results:' , JSON . stringify ( results , null , 2 ) )
134- return results
121+ log . info ( 'Learning Extraction Experiment Results:' , { results : JSON . stringify ( results , null , 2 ) } )
122+ return results
135123}
136124
137125export async function runEvaluationAgentExperiment ( ) {
138- console . log ( 'Running Evaluation Agent Experiment...' )
126+ log . info ( 'Running Evaluation Agent Experiment...' )
139127 const results = await runEvals ( {
140128 target : evaluationAgent ,
141129 data : [
142130 {
143131 input : 'Evaluate this python code for efficiency: def fib(n): return n if n < 2 else fib(n-1) + fib(n-2)' ,
144132 }
145133 ] ,
146- scorers : [ responseQualityScorer , structureScorer ]
134+ scorers : [ ]
147135 } )
148- console . log ( 'Evaluation Agent Experiment Results:' , JSON . stringify ( results , null , 2 ) )
136+ log . info ( 'Evaluation Agent Experiment Results:' , { results : JSON . stringify ( results , null , 2 ) } )
149137 return results
150138}
151139
152140export async function runImageToCsvExperiment ( ) {
153- console . log ( 'Running Image to CSV Experiment...' )
141+ log . info ( 'Running Image to CSV Experiment...' )
154142 const results = await runEvals ( {
155143 target : imageToCsvAgent ,
156144 data : [
157145 {
158146 input : 'https://raw.githubusercontent.com/datasciencedojo/datasets/master/titanic.csv' ,
159147 }
160148 ] ,
161- scorers : [ csvValidityScorer , structureScorer ]
149+ scorers : [ ]
162150 } )
163- console . log ( 'Image to CSV Experiment Results:' , JSON . stringify ( results , null , 2 ) )
151+ log . info ( 'Image to CSV Experiment Results:' , { results : JSON . stringify ( results , null , 2 ) } )
164152 return results
165153}
166154
167155export async function runCsvToExcalidrawExperiment ( ) {
168- console . log ( 'Running CSV to Excalidraw Experiment...' )
156+ log . info ( 'Running CSV to Excalidraw Experiment...' )
169157 const results = await runEvals ( {
170158 target : csvToExcalidrawAgent ,
171159 data : [
172160 {
173161 input : 'id,label,x,y\n1,Start,0,0\n2,Process,100,0\n3,End,200,0' ,
174162 }
175163 ] ,
176- scorers : [ structureScorer , responseQualityScorer ]
164+ scorers : [ ]
177165 } )
178- console . log ( 'CSV to Excalidraw Experiment Results:' , JSON . stringify ( results , null , 2 ) )
166+ log . info ( 'CSV to Excalidraw Experiment Results:' , { results : JSON . stringify ( results , null , 2 ) } )
179167 return results
180168}
181169
182170export async function runWeatherAgentExperiment ( ) {
183- console . log ( 'Running Weather Agent Experiment...' )
171+ log . info ( 'Running Weather Agent Experiment...' )
184172 const results = await runEvals ( {
185173 target : weatherAgent ,
186174 data : [
@@ -191,9 +179,9 @@ export async function runWeatherAgentExperiment() {
191179 input : 'Forecast for London tomorrow.' ,
192180 }
193181 ] ,
194- scorers : [ factualityScorer , responseQualityScorer ]
182+ scorers : [ ]
195183 } )
196- console . log ( 'Weather Agent Experiment Results:' , JSON . stringify ( results , null , 2 ) )
184+ log . info ( 'Weather Agent Experiment Results:' , { results : JSON . stringify ( results , null , 2 ) } )
197185 return results
198186}
199187
0 commit comments