publish: 21 run(s) — 09d8fbde-0008-49bb-99da-03eeaca72be1, 1bf57c9a-fd7a-49aa-90de-cd1907b15ddd, 212d6278-1b9b-45e9-8aae-7eed4d4ec822…
This commit is contained in:
@@ -1,8 +1,11 @@
|
||||
{
|
||||
"id": "fba9d9b1-cc5d-40bc-9e21-beafbb72c65d",
|
||||
"title": "Predator Qwen rerun \u2014 fba9d9b1-cc5d-40bc-9e21-beafbb72c65d",
|
||||
"title": "Predator Qwen rerun",
|
||||
"date": "2026-05-04",
|
||||
"started_at": "2026-05-04T17:49:07Z",
|
||||
"git_sha": "f06800254dfd046e154c94f663fb7f9f66c79ae3",
|
||||
"hardware": "predator",
|
||||
"hardware_label": "Predator \u00b7 gaming laptop \u00b7 GTX 1060 6 GB \u00b7 28 GB RAM",
|
||||
"engine": "llamacpp",
|
||||
"harness": "predator-qwen-rerun-1",
|
||||
"model_family": "qwen3/qwen3.5",
|
||||
@@ -10,12 +13,70 @@
|
||||
"qwen3.5:9b",
|
||||
"qwen3:14b"
|
||||
],
|
||||
"task_kind": null,
|
||||
"headline": "`Answer chars` is `len(message.content)`. Both averaged over the 3 warm runs.",
|
||||
"summary_md_path": "runs/fba9d9b1-cc5d-40bc-9e21-beafbb72c65d.md",
|
||||
"raw_jsonl_path": "runs/fba9d9b1-cc5d-40bc-9e21-beafbb72c65d.jsonl",
|
||||
"log_path": "runs/fba9d9b1-cc5d-40bc-9e21-beafbb72c65d.log",
|
||||
"synthesis_doc": "A3B_AND_CPU_OVERNIGHT_2026-05-05.md",
|
||||
"task_kind": "chat",
|
||||
"tags": [
|
||||
"predator",
|
||||
"qwen3",
|
||||
"qwen3.5",
|
||||
"rerun"
|
||||
],
|
||||
"headline": "36 calls across 3 cell(s); ~10.9 tok/s mean; p50 24.1s",
|
||||
"janie_blurb_md": null,
|
||||
"janie_blurb_status": "pending",
|
||||
"caveat": null,
|
||||
"caveat_severity": null,
|
||||
"methodology_ref": "A3B_AND_CPU_OVERNIGHT_2026-05-05",
|
||||
"methodology_deviations_md": null,
|
||||
"results_table": [
|
||||
{
|
||||
"label": "qwen3.5:9b-q4km-think500",
|
||||
"cell_id": "predator:llamacpp:qwen3.5:9b-q4km-think500",
|
||||
"n_calls": 14,
|
||||
"n_errors": 0,
|
||||
"duration_ms_mean": 30474.33,
|
||||
"duration_ms_p50": 33717.5,
|
||||
"duration_ms_p95": 52611.55,
|
||||
"tokens_per_sec_mean": 14.25,
|
||||
"tokens_per_sec_p50": 14.91,
|
||||
"tokens_per_sec_p95": 15.3,
|
||||
"tokens_per_sec_max": 15.32,
|
||||
"memory_mb": null,
|
||||
"watts_avg": null,
|
||||
"notes": null
|
||||
},
|
||||
{
|
||||
"label": "qwen3.5:9b-q4km-nothink",
|
||||
"cell_id": "predator:llamacpp:qwen3.5:9b-q4km-nothink",
|
||||
"n_calls": 14,
|
||||
"n_errors": 0,
|
||||
"duration_ms_mean": 10425.75,
|
||||
"duration_ms_p50": 7200.0,
|
||||
"duration_ms_p95": 23998.85,
|
||||
"tokens_per_sec_mean": 12.55,
|
||||
"tokens_per_sec_p50": 14.37,
|
||||
"tokens_per_sec_p95": 14.93,
|
||||
"tokens_per_sec_max": 14.95,
|
||||
"memory_mb": null,
|
||||
"watts_avg": null,
|
||||
"notes": null
|
||||
},
|
||||
{
|
||||
"label": "qwen3:14b-q4km",
|
||||
"cell_id": "predator:llamacpp:qwen3:14b-q4km",
|
||||
"n_calls": 8,
|
||||
"n_errors": 0,
|
||||
"duration_ms_mean": 130876.17,
|
||||
"duration_ms_p50": 78946.0,
|
||||
"duration_ms_p95": 277160.0,
|
||||
"tokens_per_sec_mean": 1.06,
|
||||
"tokens_per_sec_p50": 1.09,
|
||||
"tokens_per_sec_p95": 1.28,
|
||||
"tokens_per_sec_max": 1.33,
|
||||
"memory_mb": null,
|
||||
"watts_avg": null,
|
||||
"notes": null
|
||||
}
|
||||
],
|
||||
"cells": [
|
||||
{
|
||||
"cell_id": "predator:llamacpp:qwen3.5:9b-q4km-think500",
|
||||
@@ -23,7 +84,10 @@
|
||||
"n_errors": 0,
|
||||
"duration_ms_mean": 30474.33,
|
||||
"duration_ms_p50": 33717.5,
|
||||
"duration_ms_p95": 52611.55,
|
||||
"tokens_per_sec_mean": 14.25,
|
||||
"tokens_per_sec_p50": 14.91,
|
||||
"tokens_per_sec_p95": 15.3,
|
||||
"tokens_per_sec_max": 15.32
|
||||
},
|
||||
{
|
||||
@@ -32,7 +96,10 @@
|
||||
"n_errors": 0,
|
||||
"duration_ms_mean": 10425.75,
|
||||
"duration_ms_p50": 7200.0,
|
||||
"duration_ms_p95": 23998.85,
|
||||
"tokens_per_sec_mean": 12.55,
|
||||
"tokens_per_sec_p50": 14.37,
|
||||
"tokens_per_sec_p95": 14.93,
|
||||
"tokens_per_sec_max": 14.95
|
||||
},
|
||||
{
|
||||
@@ -41,19 +108,41 @@
|
||||
"n_errors": 0,
|
||||
"duration_ms_mean": 130876.17,
|
||||
"duration_ms_p50": 78946.0,
|
||||
"duration_ms_p95": 277160.0,
|
||||
"tokens_per_sec_mean": 1.06,
|
||||
"tokens_per_sec_p50": 1.09,
|
||||
"tokens_per_sec_p95": 1.28,
|
||||
"tokens_per_sec_max": 1.33
|
||||
}
|
||||
],
|
||||
"n_calls_total": 36,
|
||||
"n_errors_total": 0,
|
||||
"started_at": "2026-05-04T17:49:07Z",
|
||||
"tags": [
|
||||
"predator",
|
||||
"qwen3",
|
||||
"qwen3.5",
|
||||
"rerun"
|
||||
"chart_spec": {
|
||||
"kind": "bar",
|
||||
"x": "cell",
|
||||
"y": "tokens_per_sec_mean",
|
||||
"series": [
|
||||
"qwen3.5:9b-q4km-think500",
|
||||
"qwen3.5:9b-q4km-nothink",
|
||||
"qwen3:14b-q4km"
|
||||
],
|
||||
"data_url": "/data/fba9d9b1-cc5d-40bc-9e21-beafbb72c65d/run.jsonl"
|
||||
},
|
||||
"site_grade": "flagship",
|
||||
"site_grade_reason": null,
|
||||
"raw_data_urls": {
|
||||
"jsonl": "/data/fba9d9b1-cc5d-40bc-9e21-beafbb72c65d/run.jsonl",
|
||||
"log": "/data/fba9d9b1-cc5d-40bc-9e21-beafbb72c65d/run.log",
|
||||
"md": "/data/fba9d9b1-cc5d-40bc-9e21-beafbb72c65d/run.md",
|
||||
"metadata": "/data/fba9d9b1-cc5d-40bc-9e21-beafbb72c65d/metadata.json",
|
||||
"gitea_dir": "https://git.weeyuga.com/slobodanmargetic988/weeyuga-benchmarks-public/src/branch/main/runs/fba9d9b1-cc5d-40bc-9e21-beafbb72c65d/"
|
||||
},
|
||||
"synthesis_doc": "A3B_AND_CPU_OVERNIGHT_2026-05-05.md",
|
||||
"synthesis_docs_all": [
|
||||
"A3B_AND_CPU_OVERNIGHT_2026-05-05.md",
|
||||
"A3B_CROSS_MACHINE_2026-05-05.md"
|
||||
],
|
||||
"related_ids": [],
|
||||
"status": "complete",
|
||||
"visibility": "draft",
|
||||
"cells_full": [
|
||||
@@ -63,7 +152,10 @@
|
||||
"n_errors": 0,
|
||||
"duration_ms_mean": 30474.33,
|
||||
"duration_ms_p50": 33717.5,
|
||||
"duration_ms_p95": 52611.55,
|
||||
"tokens_per_sec_mean": 14.25,
|
||||
"tokens_per_sec_p50": 14.91,
|
||||
"tokens_per_sec_p95": 15.3,
|
||||
"tokens_per_sec_max": 15.32,
|
||||
"calls": [
|
||||
{
|
||||
@@ -278,7 +370,10 @@
|
||||
"n_errors": 0,
|
||||
"duration_ms_mean": 10425.75,
|
||||
"duration_ms_p50": 7200.0,
|
||||
"duration_ms_p95": 23998.85,
|
||||
"tokens_per_sec_mean": 12.55,
|
||||
"tokens_per_sec_p50": 14.37,
|
||||
"tokens_per_sec_p95": 14.93,
|
||||
"tokens_per_sec_max": 14.95,
|
||||
"calls": [
|
||||
{
|
||||
@@ -493,7 +588,10 @@
|
||||
"n_errors": 0,
|
||||
"duration_ms_mean": 130876.17,
|
||||
"duration_ms_p50": 78946.0,
|
||||
"duration_ms_p95": 277160.0,
|
||||
"tokens_per_sec_mean": 1.06,
|
||||
"tokens_per_sec_p50": 1.09,
|
||||
"tokens_per_sec_p95": 1.28,
|
||||
"tokens_per_sec_max": 1.33,
|
||||
"calls": [
|
||||
{
|
||||
@@ -637,5 +735,5 @@
|
||||
}
|
||||
}
|
||||
},
|
||||
"packaged_at": "2026-05-05T17:43:34Z"
|
||||
"packaged_at": "2026-05-06T08:04:27Z"
|
||||
}
|
||||
|
||||
Reference in New Issue
Block a user