publish: 21 run(s) — 09d8fbde-0008-49bb-99da-03eeaca72be1, 1bf57c9a-fd7a-49aa-90de-cd1907b15ddd, 212d6278-1b9b-45e9-8aae-7eed4d4ec822…
This commit is contained in:
@@ -2,78 +2,17 @@
|
||||
"id": "e08a7051-a856-4053-b34b-561d7ce5e8cf",
|
||||
"title": "predator-a3b-ngl-ctx-2d-1 \u2014 qwen3 on predator",
|
||||
"date": "2026-05-05",
|
||||
"started_at": "2026-05-05T07:43:00Z",
|
||||
"git_sha": "f06800254dfd046e154c94f663fb7f9f66c79ae3",
|
||||
"hardware": "predator",
|
||||
"hardware_label": "Predator \u00b7 gaming laptop \u00b7 GTX 1060 6 GB \u00b7 28 GB RAM",
|
||||
"engine": "llamacpp",
|
||||
"harness": "predator-a3b-ngl-ctx-2d-1",
|
||||
"model_family": "qwen3",
|
||||
"model_sizes": [
|
||||
"qwen3:30b-a3b-iq2m"
|
||||
],
|
||||
"task_kind": null,
|
||||
"headline": "90 calls across 6 cell(s); ~5.9 tok/s mean; p50 73.4s",
|
||||
"summary_md_path": null,
|
||||
"raw_jsonl_path": "runs/e08a7051-a856-4053-b34b-561d7ce5e8cf.jsonl",
|
||||
"log_path": "runs/e08a7051-a856-4053-b34b-561d7ce5e8cf.log",
|
||||
"synthesis_doc": "A3B_AND_CPU_OVERNIGHT_2026-05-05.md",
|
||||
"cells": [
|
||||
{
|
||||
"cell_id": "predator:llamacpp:qwen3:30b-a3b-iq2m-think500-ngl12-ctx64k",
|
||||
"n_calls": 15,
|
||||
"n_errors": 0,
|
||||
"duration_ms_mean": 85573.42,
|
||||
"duration_ms_p50": 78940.0,
|
||||
"tokens_per_sec_mean": 5.48,
|
||||
"tokens_per_sec_max": 6.8
|
||||
},
|
||||
{
|
||||
"cell_id": "predator:llamacpp:qwen3:30b-a3b-iq2m-think500-ngl12-ctx96k",
|
||||
"n_calls": 15,
|
||||
"n_errors": 0,
|
||||
"duration_ms_mean": 71805.83,
|
||||
"duration_ms_p50": 58541.0,
|
||||
"tokens_per_sec_mean": 5.79,
|
||||
"tokens_per_sec_max": 6.7
|
||||
},
|
||||
{
|
||||
"cell_id": "predator:llamacpp:qwen3:30b-a3b-iq2m-think500-ngl12-ctx131k",
|
||||
"n_calls": 15,
|
||||
"n_errors": 0,
|
||||
"duration_ms_mean": 96406.17,
|
||||
"duration_ms_p50": 105842.0,
|
||||
"tokens_per_sec_mean": 5.01,
|
||||
"tokens_per_sec_max": 6.29
|
||||
},
|
||||
{
|
||||
"cell_id": "predator:llamacpp:qwen3:30b-a3b-iq2m-think500-ngl24-ctx48k",
|
||||
"n_calls": 15,
|
||||
"n_errors": 0,
|
||||
"duration_ms_mean": 65539.5,
|
||||
"duration_ms_p50": 64606.5,
|
||||
"tokens_per_sec_mean": 6.6,
|
||||
"tokens_per_sec_max": 6.91
|
||||
},
|
||||
{
|
||||
"cell_id": "predator:llamacpp:qwen3:30b-a3b-iq2m-think500-ngl24-ctx64k",
|
||||
"n_calls": 15,
|
||||
"n_errors": 0,
|
||||
"duration_ms_mean": 71267.58,
|
||||
"duration_ms_p50": 80265.5,
|
||||
"tokens_per_sec_mean": 6.41,
|
||||
"tokens_per_sec_max": 6.9
|
||||
},
|
||||
{
|
||||
"cell_id": "predator:llamacpp:qwen3:30b-a3b-iq2m-think500-ngl24-ctx96k",
|
||||
"n_calls": 15,
|
||||
"n_errors": 0,
|
||||
"duration_ms_mean": 69299.5,
|
||||
"duration_ms_p50": 68355.0,
|
||||
"tokens_per_sec_mean": 6.08,
|
||||
"tokens_per_sec_max": 6.69
|
||||
}
|
||||
],
|
||||
"n_calls_total": 90,
|
||||
"n_errors_total": 0,
|
||||
"started_at": "2026-05-05T07:43:00Z",
|
||||
"task_kind": "param-sweep",
|
||||
"tags": [
|
||||
"a3b",
|
||||
"ctx",
|
||||
@@ -82,6 +21,215 @@
|
||||
"predator",
|
||||
"qwen3"
|
||||
],
|
||||
"headline": "90 calls across 6 cell(s); ~5.9 tok/s mean; p50 73.4s",
|
||||
"janie_blurb_md": null,
|
||||
"janie_blurb_status": "pending",
|
||||
"caveat": null,
|
||||
"caveat_severity": null,
|
||||
"methodology_ref": "A3B_AND_CPU_OVERNIGHT_2026-05-05",
|
||||
"methodology_deviations_md": null,
|
||||
"results_table": [
|
||||
{
|
||||
"label": "qwen3:30b-a3b-iq2m-think500-ngl12-ctx64k",
|
||||
"cell_id": "predator:llamacpp:qwen3:30b-a3b-iq2m-think500-ngl12-ctx64k",
|
||||
"n_calls": 15,
|
||||
"n_errors": 0,
|
||||
"duration_ms_mean": 85573.42,
|
||||
"duration_ms_p50": 78940.0,
|
||||
"duration_ms_p95": 159864.3,
|
||||
"tokens_per_sec_mean": 5.48,
|
||||
"tokens_per_sec_p50": 5.31,
|
||||
"tokens_per_sec_p95": 6.79,
|
||||
"tokens_per_sec_max": 6.8,
|
||||
"memory_mb": null,
|
||||
"watts_avg": null,
|
||||
"notes": null
|
||||
},
|
||||
{
|
||||
"label": "qwen3:30b-a3b-iq2m-think500-ngl12-ctx96k",
|
||||
"cell_id": "predator:llamacpp:qwen3:30b-a3b-iq2m-think500-ngl12-ctx96k",
|
||||
"n_calls": 15,
|
||||
"n_errors": 0,
|
||||
"duration_ms_mean": 71805.83,
|
||||
"duration_ms_p50": 58541.0,
|
||||
"duration_ms_p95": 140580.5,
|
||||
"tokens_per_sec_mean": 5.79,
|
||||
"tokens_per_sec_p50": 5.75,
|
||||
"tokens_per_sec_p95": 6.47,
|
||||
"tokens_per_sec_max": 6.7,
|
||||
"memory_mb": null,
|
||||
"watts_avg": null,
|
||||
"notes": null
|
||||
},
|
||||
{
|
||||
"label": "qwen3:30b-a3b-iq2m-think500-ngl12-ctx131k",
|
||||
"cell_id": "predator:llamacpp:qwen3:30b-a3b-iq2m-think500-ngl12-ctx131k",
|
||||
"n_calls": 15,
|
||||
"n_errors": 0,
|
||||
"duration_ms_mean": 96406.17,
|
||||
"duration_ms_p50": 105842.0,
|
||||
"duration_ms_p95": 154492.35,
|
||||
"tokens_per_sec_mean": 5.01,
|
||||
"tokens_per_sec_p50": 5.13,
|
||||
"tokens_per_sec_p95": 5.97,
|
||||
"tokens_per_sec_max": 6.29,
|
||||
"memory_mb": null,
|
||||
"watts_avg": null,
|
||||
"notes": null
|
||||
},
|
||||
{
|
||||
"label": "qwen3:30b-a3b-iq2m-think500-ngl24-ctx48k",
|
||||
"cell_id": "predator:llamacpp:qwen3:30b-a3b-iq2m-think500-ngl24-ctx48k",
|
||||
"n_calls": 15,
|
||||
"n_errors": 0,
|
||||
"duration_ms_mean": 65539.5,
|
||||
"duration_ms_p50": 64606.5,
|
||||
"duration_ms_p95": 118069.75,
|
||||
"tokens_per_sec_mean": 6.6,
|
||||
"tokens_per_sec_p50": 6.59,
|
||||
"tokens_per_sec_p95": 6.89,
|
||||
"tokens_per_sec_max": 6.91,
|
||||
"memory_mb": null,
|
||||
"watts_avg": null,
|
||||
"notes": null
|
||||
},
|
||||
{
|
||||
"label": "qwen3:30b-a3b-iq2m-think500-ngl24-ctx64k",
|
||||
"cell_id": "predator:llamacpp:qwen3:30b-a3b-iq2m-think500-ngl24-ctx64k",
|
||||
"n_calls": 15,
|
||||
"n_errors": 0,
|
||||
"duration_ms_mean": 71267.58,
|
||||
"duration_ms_p50": 80265.5,
|
||||
"duration_ms_p95": 128231.3,
|
||||
"tokens_per_sec_mean": 6.41,
|
||||
"tokens_per_sec_p50": 6.39,
|
||||
"tokens_per_sec_p95": 6.88,
|
||||
"tokens_per_sec_max": 6.9,
|
||||
"memory_mb": null,
|
||||
"watts_avg": null,
|
||||
"notes": null
|
||||
},
|
||||
{
|
||||
"label": "qwen3:30b-a3b-iq2m-think500-ngl24-ctx96k",
|
||||
"cell_id": "predator:llamacpp:qwen3:30b-a3b-iq2m-think500-ngl24-ctx96k",
|
||||
"n_calls": 15,
|
||||
"n_errors": 0,
|
||||
"duration_ms_mean": 69299.5,
|
||||
"duration_ms_p50": 68355.0,
|
||||
"duration_ms_p95": 124990.95,
|
||||
"tokens_per_sec_mean": 6.08,
|
||||
"tokens_per_sec_p50": 6.44,
|
||||
"tokens_per_sec_p95": 6.68,
|
||||
"tokens_per_sec_max": 6.69,
|
||||
"memory_mb": null,
|
||||
"watts_avg": null,
|
||||
"notes": null
|
||||
}
|
||||
],
|
||||
"cells": [
|
||||
{
|
||||
"cell_id": "predator:llamacpp:qwen3:30b-a3b-iq2m-think500-ngl12-ctx64k",
|
||||
"n_calls": 15,
|
||||
"n_errors": 0,
|
||||
"duration_ms_mean": 85573.42,
|
||||
"duration_ms_p50": 78940.0,
|
||||
"duration_ms_p95": 159864.3,
|
||||
"tokens_per_sec_mean": 5.48,
|
||||
"tokens_per_sec_p50": 5.31,
|
||||
"tokens_per_sec_p95": 6.79,
|
||||
"tokens_per_sec_max": 6.8
|
||||
},
|
||||
{
|
||||
"cell_id": "predator:llamacpp:qwen3:30b-a3b-iq2m-think500-ngl12-ctx96k",
|
||||
"n_calls": 15,
|
||||
"n_errors": 0,
|
||||
"duration_ms_mean": 71805.83,
|
||||
"duration_ms_p50": 58541.0,
|
||||
"duration_ms_p95": 140580.5,
|
||||
"tokens_per_sec_mean": 5.79,
|
||||
"tokens_per_sec_p50": 5.75,
|
||||
"tokens_per_sec_p95": 6.47,
|
||||
"tokens_per_sec_max": 6.7
|
||||
},
|
||||
{
|
||||
"cell_id": "predator:llamacpp:qwen3:30b-a3b-iq2m-think500-ngl12-ctx131k",
|
||||
"n_calls": 15,
|
||||
"n_errors": 0,
|
||||
"duration_ms_mean": 96406.17,
|
||||
"duration_ms_p50": 105842.0,
|
||||
"duration_ms_p95": 154492.35,
|
||||
"tokens_per_sec_mean": 5.01,
|
||||
"tokens_per_sec_p50": 5.13,
|
||||
"tokens_per_sec_p95": 5.97,
|
||||
"tokens_per_sec_max": 6.29
|
||||
},
|
||||
{
|
||||
"cell_id": "predator:llamacpp:qwen3:30b-a3b-iq2m-think500-ngl24-ctx48k",
|
||||
"n_calls": 15,
|
||||
"n_errors": 0,
|
||||
"duration_ms_mean": 65539.5,
|
||||
"duration_ms_p50": 64606.5,
|
||||
"duration_ms_p95": 118069.75,
|
||||
"tokens_per_sec_mean": 6.6,
|
||||
"tokens_per_sec_p50": 6.59,
|
||||
"tokens_per_sec_p95": 6.89,
|
||||
"tokens_per_sec_max": 6.91
|
||||
},
|
||||
{
|
||||
"cell_id": "predator:llamacpp:qwen3:30b-a3b-iq2m-think500-ngl24-ctx64k",
|
||||
"n_calls": 15,
|
||||
"n_errors": 0,
|
||||
"duration_ms_mean": 71267.58,
|
||||
"duration_ms_p50": 80265.5,
|
||||
"duration_ms_p95": 128231.3,
|
||||
"tokens_per_sec_mean": 6.41,
|
||||
"tokens_per_sec_p50": 6.39,
|
||||
"tokens_per_sec_p95": 6.88,
|
||||
"tokens_per_sec_max": 6.9
|
||||
},
|
||||
{
|
||||
"cell_id": "predator:llamacpp:qwen3:30b-a3b-iq2m-think500-ngl24-ctx96k",
|
||||
"n_calls": 15,
|
||||
"n_errors": 0,
|
||||
"duration_ms_mean": 69299.5,
|
||||
"duration_ms_p50": 68355.0,
|
||||
"duration_ms_p95": 124990.95,
|
||||
"tokens_per_sec_mean": 6.08,
|
||||
"tokens_per_sec_p50": 6.44,
|
||||
"tokens_per_sec_p95": 6.68,
|
||||
"tokens_per_sec_max": 6.69
|
||||
}
|
||||
],
|
||||
"n_calls_total": 90,
|
||||
"n_errors_total": 0,
|
||||
"chart_spec": {
|
||||
"kind": "line",
|
||||
"x": "param_value",
|
||||
"y": "tokens_per_sec_mean",
|
||||
"series": [
|
||||
"qwen3:30b-a3b-iq2m-think500-ngl12-ctx64k",
|
||||
"qwen3:30b-a3b-iq2m-think500-ngl12-ctx96k",
|
||||
"qwen3:30b-a3b-iq2m-think500-ngl12-ctx131k",
|
||||
"qwen3:30b-a3b-iq2m-think500-ngl24-ctx48k",
|
||||
"qwen3:30b-a3b-iq2m-think500-ngl24-ctx64k",
|
||||
"qwen3:30b-a3b-iq2m-think500-ngl24-ctx96k"
|
||||
],
|
||||
"data_url": "/data/e08a7051-a856-4053-b34b-561d7ce5e8cf/run.jsonl"
|
||||
},
|
||||
"site_grade": "standard",
|
||||
"site_grade_reason": null,
|
||||
"raw_data_urls": {
|
||||
"jsonl": "/data/e08a7051-a856-4053-b34b-561d7ce5e8cf/run.jsonl",
|
||||
"log": "/data/e08a7051-a856-4053-b34b-561d7ce5e8cf/run.log",
|
||||
"md": null,
|
||||
"metadata": "/data/e08a7051-a856-4053-b34b-561d7ce5e8cf/metadata.json",
|
||||
"gitea_dir": "https://git.weeyuga.com/slobodanmargetic988/weeyuga-benchmarks-public/src/branch/main/runs/e08a7051-a856-4053-b34b-561d7ce5e8cf/"
|
||||
},
|
||||
"synthesis_doc": "A3B_AND_CPU_OVERNIGHT_2026-05-05.md",
|
||||
"synthesis_docs_all": [
|
||||
"A3B_AND_CPU_OVERNIGHT_2026-05-05.md"
|
||||
],
|
||||
"related_ids": [],
|
||||
"status": "complete",
|
||||
"visibility": "draft",
|
||||
"cells_full": [
|
||||
@@ -91,7 +239,10 @@
|
||||
"n_errors": 0,
|
||||
"duration_ms_mean": 85573.42,
|
||||
"duration_ms_p50": 78940.0,
|
||||
"duration_ms_p95": 159864.3,
|
||||
"tokens_per_sec_mean": 5.48,
|
||||
"tokens_per_sec_p50": 5.31,
|
||||
"tokens_per_sec_p95": 6.79,
|
||||
"tokens_per_sec_max": 6.8,
|
||||
"calls": [
|
||||
{
|
||||
@@ -342,7 +493,10 @@
|
||||
"n_errors": 0,
|
||||
"duration_ms_mean": 71805.83,
|
||||
"duration_ms_p50": 58541.0,
|
||||
"duration_ms_p95": 140580.5,
|
||||
"tokens_per_sec_mean": 5.79,
|
||||
"tokens_per_sec_p50": 5.75,
|
||||
"tokens_per_sec_p95": 6.47,
|
||||
"tokens_per_sec_max": 6.7,
|
||||
"calls": [
|
||||
{
|
||||
@@ -593,7 +747,10 @@
|
||||
"n_errors": 0,
|
||||
"duration_ms_mean": 96406.17,
|
||||
"duration_ms_p50": 105842.0,
|
||||
"duration_ms_p95": 154492.35,
|
||||
"tokens_per_sec_mean": 5.01,
|
||||
"tokens_per_sec_p50": 5.13,
|
||||
"tokens_per_sec_p95": 5.97,
|
||||
"tokens_per_sec_max": 6.29,
|
||||
"calls": [
|
||||
{
|
||||
@@ -844,7 +1001,10 @@
|
||||
"n_errors": 0,
|
||||
"duration_ms_mean": 65539.5,
|
||||
"duration_ms_p50": 64606.5,
|
||||
"duration_ms_p95": 118069.75,
|
||||
"tokens_per_sec_mean": 6.6,
|
||||
"tokens_per_sec_p50": 6.59,
|
||||
"tokens_per_sec_p95": 6.89,
|
||||
"tokens_per_sec_max": 6.91,
|
||||
"calls": [
|
||||
{
|
||||
@@ -1095,7 +1255,10 @@
|
||||
"n_errors": 0,
|
||||
"duration_ms_mean": 71267.58,
|
||||
"duration_ms_p50": 80265.5,
|
||||
"duration_ms_p95": 128231.3,
|
||||
"tokens_per_sec_mean": 6.41,
|
||||
"tokens_per_sec_p50": 6.39,
|
||||
"tokens_per_sec_p95": 6.88,
|
||||
"tokens_per_sec_max": 6.9,
|
||||
"calls": [
|
||||
{
|
||||
@@ -1346,7 +1509,10 @@
|
||||
"n_errors": 0,
|
||||
"duration_ms_mean": 69299.5,
|
||||
"duration_ms_p50": 68355.0,
|
||||
"duration_ms_p95": 124990.95,
|
||||
"tokens_per_sec_mean": 6.08,
|
||||
"tokens_per_sec_p50": 6.44,
|
||||
"tokens_per_sec_p95": 6.68,
|
||||
"tokens_per_sec_max": 6.69,
|
||||
"calls": [
|
||||
{
|
||||
@@ -1641,5 +1807,5 @@
|
||||
},
|
||||
"methodology_notes": "Sloba 2026-05-05: 'max tokens should be bigger than reasoning budget'. Prior bench had hello max_tokens=256 < reasoning_budget=500 \u2192 content_chars=0. Bumped to 512/1024/2048 so reasoning + answer both fit."
|
||||
},
|
||||
"packaged_at": "2026-05-05T17:43:34Z"
|
||||
"packaged_at": "2026-05-06T08:04:27Z"
|
||||
}
|
||||
|
||||
Reference in New Issue
Block a user