publish: 21 run(s) — 09d8fbde-0008-49bb-99da-03eeaca72be1, 1bf57c9a-fd7a-49aa-90de-cd1907b15ddd, 212d6278-1b9b-45e9-8aae-7eed4d4ec822…

This commit is contained in:
2026-05-06 14:28:25 +02:00
parent 947c361b9c
commit ddc9626136
22 changed files with 24099 additions and 314 deletions

View File

@@ -3,7 +3,7 @@
"title": "vps50-cpu-matrix-1 \u2014 gemma/phi/qwen2.5/qwen3 on vps50",
"date": "2026-05-05",
"started_at": "2026-05-05T07:00:10Z",
"git_sha": "f06800254dfd046e154c94f663fb7f9f66c79ae3",
"git_sha": "3ff8bd1808a1df00426d9b447559c774e4704c39",
"hardware": "vps50",
"hardware_label": "VPS50 \u00b7 cloud \u00b7 16 vCPU AMD EPYC \u00b7 62 GB RAM \u00b7 no GPU",
"engine": "llamacpp",
@@ -125,7 +125,11 @@
"tokens_per_sec_mean": null,
"tokens_per_sec_p50": null,
"tokens_per_sec_p95": null,
"tokens_per_sec_max": null
"tokens_per_sec_max": null,
"cold_warm_split": null,
"per_prompt": null,
"chars_split": null,
"timeline": []
},
{
"cell_id": "vps50:llamacpp:gemma-4-26b-a4b",
@@ -137,7 +141,11 @@
"tokens_per_sec_mean": null,
"tokens_per_sec_p50": null,
"tokens_per_sec_p95": null,
"tokens_per_sec_max": null
"tokens_per_sec_max": null,
"cold_warm_split": null,
"per_prompt": null,
"chars_split": null,
"timeline": []
},
{
"cell_id": "vps50:llamacpp:qwen3-30b-a3b",
@@ -149,7 +157,11 @@
"tokens_per_sec_mean": null,
"tokens_per_sec_p50": null,
"tokens_per_sec_p95": null,
"tokens_per_sec_max": null
"tokens_per_sec_max": null,
"cold_warm_split": null,
"per_prompt": null,
"chars_split": null,
"timeline": []
},
{
"cell_id": "vps50:llamacpp:qwen2.5-72b",
@@ -161,7 +173,11 @@
"tokens_per_sec_mean": null,
"tokens_per_sec_p50": null,
"tokens_per_sec_p95": null,
"tokens_per_sec_max": null
"tokens_per_sec_max": null,
"cold_warm_split": null,
"per_prompt": null,
"chars_split": null,
"timeline": []
},
{
"cell_id": "vps50:llamacpp:phi-4-q4km-cpu-ctx32k",
@@ -173,7 +189,94 @@
"tokens_per_sec_mean": 0.02,
"tokens_per_sec_p50": 0.02,
"tokens_per_sec_p95": 0.02,
"tokens_per_sec_max": 0.02
"tokens_per_sec_max": 0.02,
"cold_warm_split": {
"cold": {
"n_calls": 1,
"duration_ms_mean": 540002.0,
"duration_ms_p50": 540002.0,
"tokens_per_sec_mean": 0.02
},
"warm": {
"n_calls": 3,
"duration_ms_mean": 551918.67,
"duration_ms_p50": 515603.0,
"tokens_per_sec_mean": 0.02
}
},
"per_prompt": {
"unknown": {
"n_calls": 2,
"n_errors": 0,
"duration_ms_mean": null,
"duration_ms_p50": null,
"tokens_per_sec_mean": null,
"tokens_per_sec_p50": null
},
"hello": {
"n_calls": 4,
"n_errors": 0,
"duration_ms_mean": 548939.5,
"duration_ms_p50": 527802.5,
"tokens_per_sec_mean": 0.02,
"tokens_per_sec_p50": 0.02
}
},
"chars_split": {
"has_thinking": false,
"reasoning_chars_mean": 0.0,
"answer_chars_mean": 34.0
},
"timeline": [
{
"prompt_id": null,
"run_idx": null,
"phase": null,
"duration_ms": null,
"tokens_per_sec": null,
"error": null
},
{
"prompt_id": null,
"run_idx": null,
"phase": null,
"duration_ms": null,
"tokens_per_sec": null,
"error": null
},
{
"prompt_id": "hello",
"run_idx": 0,
"phase": "cold",
"duration_ms": 540002,
"tokens_per_sec": 0.01851844993166692,
"error": null
},
{
"prompt_id": "hello",
"run_idx": 1,
"phase": "warm",
"duration_ms": 628077,
"tokens_per_sec": 0.015921614706477072,
"error": null
},
{
"prompt_id": "hello",
"run_idx": 2,
"phase": "warm",
"duration_ms": 512076,
"tokens_per_sec": 0.01952835126035979,
"error": null
},
{
"prompt_id": "hello",
"run_idx": 3,
"phase": "warm",
"duration_ms": 515603,
"tokens_per_sec": 0.019394766903993967,
"error": null
}
]
}
],
"n_calls_total": 6,
@@ -202,7 +305,8 @@
},
"synthesis_doc": "A3B_AND_CPU_OVERNIGHT_2026-05-05.md",
"synthesis_docs_all": [
"A3B_AND_CPU_OVERNIGHT_2026-05-05.md"
"A3B_AND_CPU_OVERNIGHT_2026-05-05.md",
"SITE_DATA_AUDIT_AND_MIGRATION_PLAN_2026-05-06.md"
],
"related_ids": [],
"status": "complete",
@@ -219,6 +323,10 @@
"tokens_per_sec_p50": null,
"tokens_per_sec_p95": null,
"tokens_per_sec_max": null,
"cold_warm_split": null,
"per_prompt": null,
"chars_split": null,
"timeline": [],
"calls": []
},
{
@@ -232,6 +340,10 @@
"tokens_per_sec_p50": null,
"tokens_per_sec_p95": null,
"tokens_per_sec_max": null,
"cold_warm_split": null,
"per_prompt": null,
"chars_split": null,
"timeline": [],
"calls": []
},
{
@@ -245,6 +357,10 @@
"tokens_per_sec_p50": null,
"tokens_per_sec_p95": null,
"tokens_per_sec_max": null,
"cold_warm_split": null,
"per_prompt": null,
"chars_split": null,
"timeline": [],
"calls": []
},
{
@@ -258,6 +374,10 @@
"tokens_per_sec_p50": null,
"tokens_per_sec_p95": null,
"tokens_per_sec_max": null,
"cold_warm_split": null,
"per_prompt": null,
"chars_split": null,
"timeline": [],
"calls": []
},
{
@@ -271,6 +391,93 @@
"tokens_per_sec_p50": 0.02,
"tokens_per_sec_p95": 0.02,
"tokens_per_sec_max": 0.02,
"cold_warm_split": {
"cold": {
"n_calls": 1,
"duration_ms_mean": 540002.0,
"duration_ms_p50": 540002.0,
"tokens_per_sec_mean": 0.02
},
"warm": {
"n_calls": 3,
"duration_ms_mean": 551918.67,
"duration_ms_p50": 515603.0,
"tokens_per_sec_mean": 0.02
}
},
"per_prompt": {
"unknown": {
"n_calls": 2,
"n_errors": 0,
"duration_ms_mean": null,
"duration_ms_p50": null,
"tokens_per_sec_mean": null,
"tokens_per_sec_p50": null
},
"hello": {
"n_calls": 4,
"n_errors": 0,
"duration_ms_mean": 548939.5,
"duration_ms_p50": 527802.5,
"tokens_per_sec_mean": 0.02,
"tokens_per_sec_p50": 0.02
}
},
"chars_split": {
"has_thinking": false,
"reasoning_chars_mean": 0.0,
"answer_chars_mean": 34.0
},
"timeline": [
{
"prompt_id": null,
"run_idx": null,
"phase": null,
"duration_ms": null,
"tokens_per_sec": null,
"error": null
},
{
"prompt_id": null,
"run_idx": null,
"phase": null,
"duration_ms": null,
"tokens_per_sec": null,
"error": null
},
{
"prompt_id": "hello",
"run_idx": 0,
"phase": "cold",
"duration_ms": 540002,
"tokens_per_sec": 0.01851844993166692,
"error": null
},
{
"prompt_id": "hello",
"run_idx": 1,
"phase": "warm",
"duration_ms": 628077,
"tokens_per_sec": 0.015921614706477072,
"error": null
},
{
"prompt_id": "hello",
"run_idx": 2,
"phase": "warm",
"duration_ms": 512076,
"tokens_per_sec": 0.01952835126035979,
"error": null
},
{
"prompt_id": "hello",
"run_idx": 3,
"phase": "warm",
"duration_ms": 515603,
"tokens_per_sec": 0.019394766903993967,
"error": null
}
],
"calls": [
{
"type": "ram_snapshot",
@@ -374,5 +581,5 @@
"qwen2.5-72b"
]
},
"packaged_at": "2026-05-06T08:04:27Z"
"packaged_at": "2026-05-06T12:28:24Z"
}