From 00aef39e72345f53375e7ca119870b84f75a1878 Mon Sep 17 00:00:00 2001 From: LearningCircuit <185559241+LearningCircuit@users.noreply.github.com> Date: Thu, 9 Apr 2026 20:36:47 +0200 Subject: [PATCH] fix: relabel qwen3.5:9b 2026-04-07 as xbench_deepsearch (was mislabeled SimpleQA) The LDR YAML exporter hard-coded dataset as "SimpleQA". This run was actually xbench_deepsearch. Move to results/xbench-deepsearch/ and fix the dataset field. LDR exporter fix: LearningCircuit/local-deep-research#3442 --- .../langgraph-agent/serper/qwen3.5-9b_2026-04-07.yaml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) rename results/{simpleqa => xbench-deepsearch}/langgraph-agent/serper/qwen3.5-9b_2026-04-07.yaml (94%) diff --git a/results/simpleqa/langgraph-agent/serper/qwen3.5-9b_2026-04-07.yaml b/results/xbench-deepsearch/langgraph-agent/serper/qwen3.5-9b_2026-04-07.yaml similarity index 94% rename from results/simpleqa/langgraph-agent/serper/qwen3.5-9b_2026-04-07.yaml rename to results/xbench-deepsearch/langgraph-agent/serper/qwen3.5-9b_2026-04-07.yaml index f1576cc..d327ea6 100644 --- a/results/simpleqa/langgraph-agent/serper/qwen3.5-9b_2026-04-07.yaml +++ b/results/xbench-deepsearch/langgraph-agent/serper/qwen3.5-9b_2026-04-07.yaml @@ -2,7 +2,7 @@ model: qwen3.5:9b model_provider: OLLAMA search_engine: serper results: - dataset: SimpleQA + dataset: xbench_deepsearch total_questions: 100 langgraph_agent: accuracy: "59.0% (59/100)"