From da459521ffdc9ceacc237c6e2fb9db3a59d62681 Mon Sep 17 00:00:00 2001 From: LearningCircuit <185559241+LearningCircuit@users.noreply.github.com> Date: Sat, 16 May 2026 13:36:11 +0200 Subject: [PATCH] Results for 1.6.10 ~2% performance drop within statistical variance --- .../serper/qwen3.6-27b_2026-05-11.yaml | 23 +++++++++++++++++++ 1 file changed, 23 insertions(+) create mode 100644 results/simpleqa/langgraph-agent/serper/qwen3.6-27b_2026-05-11.yaml diff --git a/results/simpleqa/langgraph-agent/serper/qwen3.6-27b_2026-05-11.yaml b/results/simpleqa/langgraph-agent/serper/qwen3.6-27b_2026-05-11.yaml new file mode 100644 index 0000000..d8a7f86 --- /dev/null +++ b/results/simpleqa/langgraph-agent/serper/qwen3.6-27b_2026-05-11.yaml @@ -0,0 +1,23 @@ +model: qwen3.6:27b +model_provider: ollama +search_engine: serper +average_results_per_query: 21 +results: + dataset: SimpleQA + total_questions: 400 + langgraph-agent: + accuracy: "93.5% (374/400)" + iterations: 3 + questions_per_iteration: 1 + avg_time_per_question: "2m 24s" +configuration: + temperature: 0.7 + context_window: 20480 # captured at benchmark start + max_tokens: 30000 # captured at benchmark start +evaluator: + model: qwen3.6:27b + provider: ollama + temperature: 0 +versions: + ldr_version: 1.6.10 +date_tested: 2026-05-11