50
50
from watchdog .observers import Observer
51
51
52
52
from . import agent_graph
53
- from ..agents .base_agent import BaseAgent
54
53
from ..agents .live_request_queue import LiveRequest
55
54
from ..agents .live_request_queue import LiveRequestQueue
56
55
from ..agents .run_config import RunConfig
57
56
from ..agents .run_config import StreamingMode
58
57
from ..artifacts .base_artifact_service import BaseArtifactService
59
58
from ..auth .credential_service .base_credential_service import BaseCredentialService
60
59
from ..errors .not_found_error import NotFoundError
61
- from ..evaluation .base_eval_service import BaseEvalService
62
60
from ..evaluation .base_eval_service import InferenceConfig
63
61
from ..evaluation .base_eval_service import InferenceRequest
64
62
from ..evaluation .constants import MISSING_EVAL_DEPENDENCIES_MESSAGE
@@ -314,17 +312,6 @@ def __init__(
314
312
self .current_app_name_ref : SharedValue [str ] = SharedValue (value = "" )
315
313
self .runner_dict = {}
316
314
317
- def _get_eval_service (self , agent : BaseAgent ):
318
- from ..evaluation .local_eval_service import LocalEvalService # pylint: disable=g-import-not-at-top
319
-
320
- return LocalEvalService (
321
- root_agent = agent ,
322
- eval_sets_manager = self .eval_sets_manager ,
323
- eval_set_results_manager = self .eval_set_results_manager ,
324
- session_service = self .session_service ,
325
- artifact_service = self .artifact_service ,
326
- )
327
-
328
315
async def get_runner_async (self , app_name : str ) -> Runner :
329
316
"""Returns the runner for the given app."""
330
317
if app_name in self .runners_to_clean :
@@ -789,6 +776,7 @@ async def run_eval(
789
776
# Create a mapping from eval set file to all the evals that needed to be
790
777
# run.
791
778
try :
779
+ from ..evaluation .local_eval_service import LocalEvalService
792
780
from .cli_eval import _collect_eval_results
793
781
from .cli_eval import _collect_inferences
794
782
@@ -801,7 +789,15 @@ async def run_eval(
801
789
802
790
root_agent = self .agent_loader .load_agent (app_name )
803
791
804
- eval_service = self ._get_eval_service (root_agent )
792
+ eval_case_results = []
793
+
794
+ eval_service = LocalEvalService (
795
+ root_agent = root_agent ,
796
+ eval_sets_manager = self .eval_sets_manager ,
797
+ eval_set_results_manager = self .eval_set_results_manager ,
798
+ session_service = self .session_service ,
799
+ artifact_service = self .artifact_service ,
800
+ )
805
801
inference_request = InferenceRequest (
806
802
app_name = app_name ,
807
803
eval_set_id = eval_set .eval_set_id ,
0 commit comments