From c2aa0b46cf278a753edccc7ee1dff638b8abd279 Mon Sep 17 00:00:00 2001
From: LearningCircuit <185559241+LearningCircuit@users.noreply.github.com>
Date: Wed, 15 Apr 2026 01:25:10 +0200
Subject: [PATCH] results: gemma4:26b SimpleQA 73.1% (300q, langgraph_agent)

LDR v1.5.6 exporter had the known strategy-mislabeling bug (fixed in
LearningCircuit/local-deep-research#3442). Relabeled from source_based to
langgraph_agent.
---
 .../serper/gemma4-26b_2026-04-14.yaml         | 22 +++++++++++++++++++
 1 file changed, 22 insertions(+)
 create mode 100644 results/simpleqa/langgraph-agent/serper/gemma4-26b_2026-04-14.yaml

diff --git a/results/simpleqa/langgraph-agent/serper/gemma4-26b_2026-04-14.yaml b/results/simpleqa/langgraph-agent/serper/gemma4-26b_2026-04-14.yaml
new file mode 100644
index 0000000..65ea6bb
--- /dev/null
+++ b/results/simpleqa/langgraph-agent/serper/gemma4-26b_2026-04-14.yaml
@@ -0,0 +1,22 @@
+model: gemma4:26b
+model_provider: OLLAMA
+search_engine: serper
+results:
+  dataset: SimpleQA
+  total_questions: 300
+  langgraph_agent:
+    accuracy: "73.1% (219/300)"  # NOTE(review): 219/300 is 73.0% - confirm which figure is right
+    iterations: 10
+    questions_per_iteration: 1
+    avg_time_per_question: "23.6s"
+configuration:
+  temperature: 0.7
+  context_window: 36352  # captured at benchmark start
+  max_tokens: 30000  # captured at benchmark start
+evaluator:
+  model: gemma4:26b
+  provider: ollama
+  temperature: 0
+versions:
+  ldr_version: 1.5.6
+date_tested: 2026-04-14