|
22 | 22 | EvaluationThresholdDict, |
23 | 23 | EvaluateResult, |
24 | 24 | Status, |
| 25 | + EPParameters, |
25 | 26 | ) |
26 | 27 | from eval_protocol.pytest.dual_mode_wrapper import create_dual_mode_wrapper |
27 | 28 | from eval_protocol.pytest.evaluation_test_postprocess import postprocess |
@@ -753,13 +754,34 @@ async def _collect_result(config, lst): |
753 | 754 | ) |
754 | 755 | pytest_wrapper = pytest.mark.asyncio(pytest_wrapper) |
755 | 756 |
|
756 | | - ep_params: dict[str, Any] = { |
757 | | - "rollout_processor": rollout_processor, |
758 | | - "server_script_path": server_script_path, |
759 | | - "mcp_config_path": mcp_config_path, |
760 | | - "rollout_processor_kwargs": rollout_processor_kwargs, |
761 | | - "mode": mode, |
762 | | - } |
| 757 | + # Attach full evaluation parameter metadata for training integrations |
| 758 | + ep_params: EPParameters = EPParameters( |
| 759 | + completion_params=completion_params, |
| 760 | + input_messages=input_messages, |
| 761 | + input_dataset=input_dataset, |
| 762 | + input_rows=input_rows, |
| 763 | + data_loaders=data_loaders, |
| 764 | + dataset_adapter=dataset_adapter, |
| 765 | + rollout_processor=rollout_processor, |
| 766 | + rollout_processor_kwargs=rollout_processor_kwargs, |
| 767 | + evaluation_test_kwargs=evaluation_test_kwargs, |
| 768 | + aggregation_method=aggregation_method, |
| 769 | + passed_threshold=passed_threshold, |
| 770 | + disable_browser_open=disable_browser_open, |
| 771 | + num_runs=num_runs, |
| 772 | + filtered_row_ids=filtered_row_ids, |
| 773 | + max_dataset_rows=max_dataset_rows, |
| 774 | + mcp_config_path=mcp_config_path, |
| 775 | + max_concurrent_rollouts=max_concurrent_rollouts, |
| 776 | + max_concurrent_evaluations=max_concurrent_evaluations, |
| 777 | + server_script_path=server_script_path, |
| 778 | + steps=steps, |
| 779 | + mode=mode, |
| 780 | + combine_datasets=combine_datasets, |
| 781 | + preprocess_fn=preprocess_fn, |
| 782 | + logger=logger, |
| 783 | + exception_handler_config=exception_handler_config, |
| 784 | + ) |
763 | 785 |
|
764 | 786 | # Create the dual mode wrapper |
765 | 787 | dual_mode_wrapper = create_dual_mode_wrapper( |
|
0 commit comments