publish: 21 run(s) — 09d8fbde-0008-49bb-99da-03eeaca72be1, 1bf57c9a-fd7a-49aa-90de-cd1907b15ddd, 212d6278-1b9b-45e9-8aae-7eed4d4ec822…

This commit is contained in:
2026-05-06 14:28:25 +02:00
parent 947c361b9c
commit ddc9626136
22 changed files with 24099 additions and 314 deletions

View File

@@ -3,7 +3,7 @@
"title": "vps50-cpu-matrix-1 \u2014 gemma/phi/qwen2.5/qwen3 on vps50",
"date": "2026-05-05",
"started_at": "2026-05-05T10:23:13Z",
"git_sha": "f06800254dfd046e154c94f663fb7f9f66c79ae3",
"git_sha": "3ff8bd1808a1df00426d9b447559c774e4704c39",
"hardware": "vps50",
"hardware_label": "VPS50 \u00b7 cloud \u00b7 16 vCPU AMD EPYC \u00b7 62 GB RAM \u00b7 no GPU",
"engine": "llamacpp",
@@ -126,7 +126,11 @@
"tokens_per_sec_mean": null,
"tokens_per_sec_p50": null,
"tokens_per_sec_p95": null,
"tokens_per_sec_max": null
"tokens_per_sec_max": null,
"cold_warm_split": null,
"per_prompt": null,
"chars_split": null,
"timeline": []
},
{
"cell_id": "vps50:llamacpp:gemma-4-26b-a4b",
@@ -138,7 +142,11 @@
"tokens_per_sec_mean": null,
"tokens_per_sec_p50": null,
"tokens_per_sec_p95": null,
"tokens_per_sec_max": null
"tokens_per_sec_max": null,
"cold_warm_split": null,
"per_prompt": null,
"chars_split": null,
"timeline": []
},
{
"cell_id": "vps50:llamacpp:qwen3-30b-a3b",
@@ -150,7 +158,11 @@
"tokens_per_sec_mean": null,
"tokens_per_sec_p50": null,
"tokens_per_sec_p95": null,
"tokens_per_sec_max": null
"tokens_per_sec_max": null,
"cold_warm_split": null,
"per_prompt": null,
"chars_split": null,
"timeline": []
},
{
"cell_id": "vps50:llamacpp:qwen2.5-72b",
@@ -162,7 +174,11 @@
"tokens_per_sec_mean": null,
"tokens_per_sec_p50": null,
"tokens_per_sec_p95": null,
"tokens_per_sec_max": null
"tokens_per_sec_max": null,
"cold_warm_split": null,
"per_prompt": null,
"chars_split": null,
"timeline": []
},
{
"cell_id": "vps50:llamacpp:gemma-4-26b-a4b-it-q4km-cpu-ctx32k",
@@ -174,7 +190,37 @@
"tokens_per_sec_mean": null,
"tokens_per_sec_p50": null,
"tokens_per_sec_p95": null,
"tokens_per_sec_max": null
"tokens_per_sec_max": null,
"cold_warm_split": null,
"per_prompt": {
"unknown": {
"n_calls": 2,
"n_errors": 0,
"duration_ms_mean": null,
"duration_ms_p50": null,
"tokens_per_sec_mean": null,
"tokens_per_sec_p50": null
}
},
"chars_split": null,
"timeline": [
{
"prompt_id": null,
"run_idx": null,
"phase": null,
"duration_ms": null,
"tokens_per_sec": null,
"error": null
},
{
"prompt_id": null,
"run_idx": null,
"phase": null,
"duration_ms": null,
"tokens_per_sec": null,
"error": null
}
]
}
],
"n_calls_total": 2,
@@ -203,7 +249,8 @@
},
"synthesis_doc": "A3B_AND_CPU_OVERNIGHT_2026-05-05.md",
"synthesis_docs_all": [
"A3B_AND_CPU_OVERNIGHT_2026-05-05.md"
"A3B_AND_CPU_OVERNIGHT_2026-05-05.md",
"SITE_DATA_AUDIT_AND_MIGRATION_PLAN_2026-05-06.md"
],
"related_ids": [],
"status": "complete",
@@ -220,6 +267,10 @@
"tokens_per_sec_p50": null,
"tokens_per_sec_p95": null,
"tokens_per_sec_max": null,
"cold_warm_split": null,
"per_prompt": null,
"chars_split": null,
"timeline": [],
"calls": []
},
{
@@ -233,6 +284,10 @@
"tokens_per_sec_p50": null,
"tokens_per_sec_p95": null,
"tokens_per_sec_max": null,
"cold_warm_split": null,
"per_prompt": null,
"chars_split": null,
"timeline": [],
"calls": []
},
{
@@ -246,6 +301,10 @@
"tokens_per_sec_p50": null,
"tokens_per_sec_p95": null,
"tokens_per_sec_max": null,
"cold_warm_split": null,
"per_prompt": null,
"chars_split": null,
"timeline": [],
"calls": []
},
{
@@ -259,6 +318,10 @@
"tokens_per_sec_p50": null,
"tokens_per_sec_p95": null,
"tokens_per_sec_max": null,
"cold_warm_split": null,
"per_prompt": null,
"chars_split": null,
"timeline": [],
"calls": []
},
{
@@ -272,6 +335,36 @@
"tokens_per_sec_p50": null,
"tokens_per_sec_p95": null,
"tokens_per_sec_max": null,
"cold_warm_split": null,
"per_prompt": {
"unknown": {
"n_calls": 2,
"n_errors": 0,
"duration_ms_mean": null,
"duration_ms_p50": null,
"tokens_per_sec_mean": null,
"tokens_per_sec_p50": null
}
},
"chars_split": null,
"timeline": [
{
"prompt_id": null,
"run_idx": null,
"phase": null,
"duration_ms": null,
"tokens_per_sec": null,
"error": null
},
{
"prompt_id": null,
"run_idx": null,
"phase": null,
"duration_ms": null,
"tokens_per_sec": null,
"error": null
}
],
"calls": [
{
"type": "ram_snapshot",
@@ -311,5 +404,5 @@
"qwen2.5-72b"
]
},
"packaged_at": "2026-05-06T08:04:27Z"
"packaged_at": "2026-05-06T12:28:24Z"
}