From fe3766d5f915aa388e9a47d4e1508a5c21208520 Mon Sep 17 00:00:00 2001
From: LearningCircuit <185559241+LearningCircuit@users.noreply.github.com>
Date: Fri, 1 May 2026 20:41:44 +0200
Subject: [PATCH 1/3] Add files via upload

---
Review note (below the cut line, so not part of the commit message):
this patch adds the result file under results/xbench-deepsearch/ although
its payload declares "dataset: SimpleQA". PATCH 3/3 deletes this path again
and PATCH 2/3 adds the same blob (5104764) under results/simpleqa/.

 .../serper/qwen3.6-27b_2026-05-01.yaml        | 23 +++++++++++++++++++
 1 file changed, 23 insertions(+)
 create mode 100644 results/xbench-deepsearch/langgraph-agent/serper/qwen3.6-27b_2026-05-01.yaml

diff --git a/results/xbench-deepsearch/langgraph-agent/serper/qwen3.6-27b_2026-05-01.yaml b/results/xbench-deepsearch/langgraph-agent/serper/qwen3.6-27b_2026-05-01.yaml
new file mode 100644
index 0000000..5104764
--- /dev/null
+++ b/results/xbench-deepsearch/langgraph-agent/serper/qwen3.6-27b_2026-05-01.yaml
@@ -0,0 +1,23 @@
+model: qwen3.6:27b
+model_provider: OLLAMA
+search_engine: serper
+average_results_per_query: 22
+results:
+  dataset: SimpleQA
+  total_questions: 300
+  langgraph-agent:
+    accuracy: "95.7% (287/300)"
+    iterations: 10
+    questions_per_iteration: 1
+    avg_time_per_question: "1m 54s"
+configuration:
+  temperature: 0.7
+  context_window: 20480 # captured at benchmark start
+  max_tokens: 30000 # captured at benchmark start
+evaluator:
+  model: qwen3.6:27b
+  provider: ollama
+  temperature: 0
+versions:
+  ldr_version: 1.6.7
+date_tested: 2026-05-01

From 9aa3603153fec757dc5b9302afdd313e12952ff9 Mon Sep 17 00:00:00 2001
From: LearningCircuit <185559241+LearningCircuit@users.noreply.github.com>
Date: Fri, 1 May 2026 20:47:34 +0200
Subject: [PATCH 2/3] Add configuration for qwen3.6 model evaluation

---
Review note (below the cut line, so not part of the commit message):
adds the result file under results/simpleqa/, matching the payload's
"dataset: SimpleQA". The blob id (5104764) is the same as in PATCH 1/3,
i.e. the file content is identical; only the path differs.

 .../serper/qwen3.6-27b_2026-05-01.yaml        | 23 +++++++++++++++++++
 1 file changed, 23 insertions(+)
 create mode 100644 results/simpleqa/langgraph-agent/serper/qwen3.6-27b_2026-05-01.yaml

diff --git a/results/simpleqa/langgraph-agent/serper/qwen3.6-27b_2026-05-01.yaml b/results/simpleqa/langgraph-agent/serper/qwen3.6-27b_2026-05-01.yaml
new file mode 100644
index 0000000..5104764
--- /dev/null
+++ b/results/simpleqa/langgraph-agent/serper/qwen3.6-27b_2026-05-01.yaml
@@ -0,0 +1,23 @@
+model: qwen3.6:27b
+model_provider: OLLAMA
+search_engine: serper
+average_results_per_query: 22
+results:
+  dataset: SimpleQA
+  total_questions: 300
+  langgraph-agent:
+    accuracy: "95.7% (287/300)"
+    iterations: 10
+    questions_per_iteration: 1
+    avg_time_per_question: "1m 54s"
+configuration:
+  temperature: 0.7
+  context_window: 20480 # captured at benchmark start
+  max_tokens: 30000 # captured at benchmark start
+evaluator:
+  model: qwen3.6:27b
+  provider: ollama
+  temperature: 0
+versions:
+  ldr_version: 1.6.7
+date_tested: 2026-05-01

From b067af7d04582282a9fd82508b86977054b62b94 Mon Sep 17 00:00:00 2001
From: LearningCircuit <185559241+LearningCircuit@users.noreply.github.com>
Date: Fri, 1 May 2026 20:48:01 +0200
Subject: [PATCH 3/3] Delete
 results/xbench-deepsearch/langgraph-agent/serper/qwen3.6-27b_2026-05-01.yaml

---
Review note (below the cut line, so not part of the commit message):
removes the copy that PATCH 1/3 created under results/xbench-deepsearch/.
The removed lines must stay identical to the lines added in PATCH 1/3 for
this hunk to apply.

 .../serper/qwen3.6-27b_2026-05-01.yaml        | 23 -------------------
 1 file changed, 23 deletions(-)
 delete mode 100644 results/xbench-deepsearch/langgraph-agent/serper/qwen3.6-27b_2026-05-01.yaml

diff --git a/results/xbench-deepsearch/langgraph-agent/serper/qwen3.6-27b_2026-05-01.yaml b/results/xbench-deepsearch/langgraph-agent/serper/qwen3.6-27b_2026-05-01.yaml
deleted file mode 100644
index 5104764..0000000
--- a/results/xbench-deepsearch/langgraph-agent/serper/qwen3.6-27b_2026-05-01.yaml
+++ /dev/null
@@ -1,23 +0,0 @@
-model: qwen3.6:27b
-model_provider: OLLAMA
-search_engine: serper
-average_results_per_query: 22
-results:
-  dataset: SimpleQA
-  total_questions: 300
-  langgraph-agent:
-    accuracy: "95.7% (287/300)"
-    iterations: 10
-    questions_per_iteration: 1
-    avg_time_per_question: "1m 54s"
-configuration:
-  temperature: 0.7
-  context_window: 20480 # captured at benchmark start
-  max_tokens: 30000 # captured at benchmark start
-evaluator:
-  model: qwen3.6:27b
-  provider: ollama
-  temperature: 0
-versions:
-  ldr_version: 1.6.7
-date_tested: 2026-05-01