publish: 21 run(s) — 09d8fbde-0008-49bb-99da-03eeaca72be1, 1bf57c9a-fd7a-49aa-90de-cd1907b15ddd, 212d6278-1b9b-45e9-8aae-7eed4d4ec822…

This commit is contained in:
2026-05-06 10:04:27 +02:00
parent a18db6a3da
commit 947c361b9c
22 changed files with 6182 additions and 1423 deletions

View File

@@ -2,51 +2,17 @@
"id": "b37836bf-d1a2-4d6b-a732-aff89da1fa07",
"title": "predator-a3b-ngl-matrix-1 \u2014 qwen3 on predator",
"date": "2026-05-04",
"started_at": "2026-05-04T22:50:47Z",
"git_sha": "f06800254dfd046e154c94f663fb7f9f66c79ae3",
"hardware": "predator",
"hardware_label": "Predator \u00b7 gaming laptop \u00b7 GTX 1060 6 GB \u00b7 28 GB RAM",
"engine": "llamacpp",
"harness": "predator-a3b-ngl-matrix-1",
"model_family": "qwen3",
"model_sizes": [
"qwen3:30b-a3b-iq2m"
],
"task_kind": null,
"headline": "42 calls across 3 cell(s); ~5.7 tok/s mean; p50 71.5s",
"summary_md_path": null,
"raw_jsonl_path": "runs/b37836bf-d1a2-4d6b-a732-aff89da1fa07.jsonl",
"log_path": "runs/b37836bf-d1a2-4d6b-a732-aff89da1fa07.log",
"synthesis_doc": "A3B_NGL_RETUNE_2026-05-05.md",
"cells": [
{
"cell_id": "predator:llamacpp:qwen3:30b-a3b-iq2m-think500-ctx32k-ngl6",
"n_calls": 14,
"n_errors": 0,
"duration_ms_mean": 85436.42,
"duration_ms_p50": 92483.0,
"tokens_per_sec_mean": 4.95,
"tokens_per_sec_max": 5.15
},
{
"cell_id": "predator:llamacpp:qwen3:30b-a3b-iq2m-think500-ctx32k-ngl12",
"n_calls": 14,
"n_errors": 0,
"duration_ms_mean": 75013.58,
"duration_ms_p50": 81347.0,
"tokens_per_sec_mean": 5.59,
"tokens_per_sec_max": 6.63
},
{
"cell_id": "predator:llamacpp:qwen3:30b-a3b-iq2m-think500-ctx32k-ngl24",
"n_calls": 14,
"n_errors": 0,
"duration_ms_mean": 62607.33,
"duration_ms_p50": 67049.0,
"tokens_per_sec_mean": 6.58,
"tokens_per_sec_max": 6.89
}
],
"n_calls_total": 42,
"n_errors_total": 0,
"started_at": "2026-05-04T22:50:47Z",
"task_kind": "param-sweep",
"tags": [
"a3b",
"iq2",
@@ -55,6 +21,129 @@
"predator",
"qwen3"
],
"headline": "42 calls across 3 cell(s); ~5.7 tok/s mean; p50 71.5s",
"janie_blurb_md": null,
"janie_blurb_status": "pending",
"caveat": null,
"caveat_severity": null,
"methodology_ref": "A3B_AND_CPU_OVERNIGHT_2026-05-05",
"methodology_deviations_md": null,
"results_table": [
{
"label": "qwen3:30b-a3b-iq2m-think500-ctx32k-ngl6",
"cell_id": "predator:llamacpp:qwen3:30b-a3b-iq2m-think500-ctx32k-ngl6",
"n_calls": 14,
"n_errors": 0,
"duration_ms_mean": 85436.42,
"duration_ms_p50": 92483.0,
"duration_ms_p95": 154201.8,
"tokens_per_sec_mean": 4.95,
"tokens_per_sec_p50": 4.98,
"tokens_per_sec_p95": 5.15,
"tokens_per_sec_max": 5.15,
"memory_mb": null,
"watts_avg": null,
"notes": null
},
{
"label": "qwen3:30b-a3b-iq2m-think500-ctx32k-ngl12",
"cell_id": "predator:llamacpp:qwen3:30b-a3b-iq2m-think500-ctx32k-ngl12",
"n_calls": 14,
"n_errors": 0,
"duration_ms_mean": 75013.58,
"duration_ms_p50": 81347.0,
"duration_ms_p95": 146474.55,
"tokens_per_sec_mean": 5.59,
"tokens_per_sec_p50": 5.36,
"tokens_per_sec_p95": 6.61,
"tokens_per_sec_max": 6.63,
"memory_mb": null,
"watts_avg": null,
"notes": null
},
{
"label": "qwen3:30b-a3b-iq2m-think500-ctx32k-ngl24",
"cell_id": "predator:llamacpp:qwen3:30b-a3b-iq2m-think500-ctx32k-ngl24",
"n_calls": 14,
"n_errors": 0,
"duration_ms_mean": 62607.33,
"duration_ms_p50": 67049.0,
"duration_ms_p95": 123041.65,
"tokens_per_sec_mean": 6.58,
"tokens_per_sec_p50": 6.68,
"tokens_per_sec_p95": 6.88,
"tokens_per_sec_max": 6.89,
"memory_mb": null,
"watts_avg": null,
"notes": null
}
],
"cells": [
{
"cell_id": "predator:llamacpp:qwen3:30b-a3b-iq2m-think500-ctx32k-ngl6",
"n_calls": 14,
"n_errors": 0,
"duration_ms_mean": 85436.42,
"duration_ms_p50": 92483.0,
"duration_ms_p95": 154201.8,
"tokens_per_sec_mean": 4.95,
"tokens_per_sec_p50": 4.98,
"tokens_per_sec_p95": 5.15,
"tokens_per_sec_max": 5.15
},
{
"cell_id": "predator:llamacpp:qwen3:30b-a3b-iq2m-think500-ctx32k-ngl12",
"n_calls": 14,
"n_errors": 0,
"duration_ms_mean": 75013.58,
"duration_ms_p50": 81347.0,
"duration_ms_p95": 146474.55,
"tokens_per_sec_mean": 5.59,
"tokens_per_sec_p50": 5.36,
"tokens_per_sec_p95": 6.61,
"tokens_per_sec_max": 6.63
},
{
"cell_id": "predator:llamacpp:qwen3:30b-a3b-iq2m-think500-ctx32k-ngl24",
"n_calls": 14,
"n_errors": 0,
"duration_ms_mean": 62607.33,
"duration_ms_p50": 67049.0,
"duration_ms_p95": 123041.65,
"tokens_per_sec_mean": 6.58,
"tokens_per_sec_p50": 6.68,
"tokens_per_sec_p95": 6.88,
"tokens_per_sec_max": 6.89
}
],
"n_calls_total": 42,
"n_errors_total": 0,
"chart_spec": {
"kind": "line",
"x": "param_value",
"y": "tokens_per_sec_mean",
"series": [
"qwen3:30b-a3b-iq2m-think500-ctx32k-ngl6",
"qwen3:30b-a3b-iq2m-think500-ctx32k-ngl12",
"qwen3:30b-a3b-iq2m-think500-ctx32k-ngl24"
],
"data_url": "/data/b37836bf-d1a2-4d6b-a732-aff89da1fa07/run.jsonl"
},
"site_grade": "standard",
"site_grade_reason": null,
"raw_data_urls": {
"jsonl": "/data/b37836bf-d1a2-4d6b-a732-aff89da1fa07/run.jsonl",
"log": "/data/b37836bf-d1a2-4d6b-a732-aff89da1fa07/run.log",
"md": null,
"metadata": "/data/b37836bf-d1a2-4d6b-a732-aff89da1fa07/metadata.json",
"gitea_dir": "https://git.weeyuga.com/slobodanmargetic988/weeyuga-benchmarks-public/src/branch/main/runs/b37836bf-d1a2-4d6b-a732-aff89da1fa07/"
},
"synthesis_doc": "A3B_AND_CPU_OVERNIGHT_2026-05-05.md",
"synthesis_docs_all": [
"A3B_AND_CPU_OVERNIGHT_2026-05-05.md",
"A3B_NGL_RETUNE_2026-05-05.md"
],
"related_ids": [],
"status": "complete",
"visibility": "draft",
"cells_full": [
@@ -64,7 +153,10 @@
"n_errors": 0,
"duration_ms_mean": 85436.42,
"duration_ms_p50": 92483.0,
"duration_ms_p95": 154201.8,
"tokens_per_sec_mean": 4.95,
"tokens_per_sec_p50": 4.98,
"tokens_per_sec_p95": 5.15,
"tokens_per_sec_max": 5.15,
"calls": [
{
@@ -293,7 +385,10 @@
"n_errors": 0,
"duration_ms_mean": 75013.58,
"duration_ms_p50": 81347.0,
"duration_ms_p95": 146474.55,
"tokens_per_sec_mean": 5.59,
"tokens_per_sec_p50": 5.36,
"tokens_per_sec_p95": 6.61,
"tokens_per_sec_max": 6.63,
"calls": [
{
@@ -522,7 +617,10 @@
"n_errors": 0,
"duration_ms_mean": 62607.33,
"duration_ms_p50": 67049.0,
"duration_ms_p95": 123041.65,
"tokens_per_sec_mean": 6.58,
"tokens_per_sec_p50": 6.68,
"tokens_per_sec_p95": 6.88,
"tokens_per_sec_max": 6.89,
"calls": [
{
@@ -766,5 +864,5 @@
"sampling": "T=0.6 top_p=0.95 top_k=20 (Qwen3-A3B README defaults)",
"common_args": "--ctx-size 32768 --temp 0.6 --top-p 0.95 --top-k 20 --min-p 0.0 --reasoning-budget 500 --reasoning-format deepseek --jinja --no-warmup --host 0.0.0.0 --port 11436"
},
"packaged_at": "2026-05-05T17:43:34Z"
"packaged_at": "2026-05-06T08:04:27Z"
}