{ "id": "ff1131ca-d021-4e06-8616-4b4cdb54e97e", "title": "pavilion-weeyuga-v1 \u2014 qwen2.5/qwen2.5-coder/qwen3/qwen3.5 on pavilion", "date": "2026-04-28", "started_at": "2026-04-28T21:03:46Z", "git_sha": "9934892784228748586130d8abbacd82a919aee2", "hardware": "pavilion", "hardware_label": "Pavilion \u00b7 HP laptop \u00b7 GTX 1050 4 GB \u00b7 16 GB RAM \u00b7 i7-9750H", "engine": "weeyuga", "harness": "pavilion-weeyuga-v1", "model_family": "qwen2.5/qwen2.5-coder/qwen3/qwen3.5", "model_sizes": [ "qwen3.5:4b", "qwen3.5:35b-a3b-uncensored", "qwen3.5:35b-a3b-iq2s", "qwen3.5:9b-q6k", "qwen3.5:9b", "qwen3.5:2b", "qwen3.5:0.8b", "qwen2.5-coder:14b", "qwen2.5-coder:3b", "qwen3:14b", "qwen3:8b", "qwen3:4b", "qwen2.5:3b", "qwen2.5-coder:1.5b", "qwen2.5-coder:0.5b" ], "task_kind": "chat", "tags": [ "a3b", "iq2", "pavilion", "qwen2.5", "qwen3", "qwen3.5", "weeyuga" ], "headline": "17 calls across 16 cell(s); 3 errors", "janie_blurb_md": null, "janie_blurb_status": "pending", "caveat": null, "caveat_severity": null, "methodology_ref": "PAVILION_WEEYUGA_v1", "methodology_deviations_md": null, "results_table": [ { "label": "qwen3.5:4b", "cell_id": "pavilion:weeyuga:qwen3.5:4b", "n_calls": 2, "n_errors": 0, "duration_ms_mean": null, "duration_ms_p50": null, "duration_ms_p95": null, "tokens_per_sec_mean": null, "tokens_per_sec_p50": null, "tokens_per_sec_p95": null, "tokens_per_sec_max": null, "memory_mb": null, "watts_avg": null, "notes": null }, { "label": "qwen3.5:35b-a3b-uncensored-iq1m", "cell_id": "pavilion:weeyuga:qwen3.5:35b-a3b-uncensored-iq1m", "n_calls": 1, "n_errors": 0, "duration_ms_mean": null, "duration_ms_p50": null, "duration_ms_p95": null, "tokens_per_sec_mean": null, "tokens_per_sec_p50": null, "tokens_per_sec_p95": null, "tokens_per_sec_max": null, "memory_mb": null, "watts_avg": null, "notes": null }, { "label": "qwen3.5:35b-a3b-iq2s", "cell_id": "pavilion:weeyuga:qwen3.5:35b-a3b-iq2s", "n_calls": 1, "n_errors": 0, "duration_ms_mean": null, "duration_ms_p50": null, "duration_ms_p95": null, "tokens_per_sec_mean": null, "tokens_per_sec_p50": null, "tokens_per_sec_p95": null, "tokens_per_sec_max": null, "memory_mb": null, "watts_avg": null, "notes": null }, { "label": "qwen3.5:9b-q6k", "cell_id": "pavilion:weeyuga:qwen3.5:9b-q6k", "n_calls": 1, "n_errors": 0, "duration_ms_mean": null, "duration_ms_p50": null, "duration_ms_p95": null, "tokens_per_sec_mean": null, "tokens_per_sec_p50": null, "tokens_per_sec_p95": null, "tokens_per_sec_max": null, "memory_mb": null, "watts_avg": null, "notes": null }, { "label": "qwen3.5:9b-q4km", "cell_id": "pavilion:weeyuga:qwen3.5:9b-q4km", "n_calls": 1, "n_errors": 0, "duration_ms_mean": null, "duration_ms_p50": null, "duration_ms_p95": null, "tokens_per_sec_mean": null, "tokens_per_sec_p50": null, "tokens_per_sec_p95": null, "tokens_per_sec_max": null, "memory_mb": null, "watts_avg": null, "notes": null }, { "label": "qwen3.5:2b", "cell_id": "pavilion:weeyuga:qwen3.5:2b", "n_calls": 1, "n_errors": 0, "duration_ms_mean": null, "duration_ms_p50": null, "duration_ms_p95": null, "tokens_per_sec_mean": null, "tokens_per_sec_p50": null, "tokens_per_sec_p95": null, "tokens_per_sec_max": null, "memory_mb": null, "watts_avg": null, "notes": null }, { "label": "qwen3.5:0.8b", "cell_id": "pavilion:weeyuga:qwen3.5:0.8b", "n_calls": 1, "n_errors": 0, "duration_ms_mean": null, "duration_ms_p50": null, "duration_ms_p95": null, "tokens_per_sec_mean": null, "tokens_per_sec_p50": null, "tokens_per_sec_p95": null, "tokens_per_sec_max": null, "memory_mb": null, "watts_avg": null, "notes": null }, { "label": "qwen3.5:9b", "cell_id": "pavilion:weeyuga:qwen3.5:9b", "n_calls": 1, "n_errors": 0, "duration_ms_mean": null, "duration_ms_p50": null, "duration_ms_p95": null, "tokens_per_sec_mean": null, "tokens_per_sec_p50": null, "tokens_per_sec_p95": null, "tokens_per_sec_max": null, "memory_mb": null, "watts_avg": null, "notes": null }, { "label": "qwen2.5-coder:14b", "cell_id": "pavilion:weeyuga:qwen2.5-coder:14b", "n_calls": 1, "n_errors": 1, "duration_ms_mean": null, "duration_ms_p50": null, "duration_ms_p95": null, "tokens_per_sec_mean": null, "tokens_per_sec_p50": null, "tokens_per_sec_p95": null, "tokens_per_sec_max": null, "memory_mb": null, "watts_avg": null, "notes": null }, { "label": "qwen2.5-coder:3b", "cell_id": "pavilion:weeyuga:qwen2.5-coder:3b", "n_calls": 1, "n_errors": 0, "duration_ms_mean": null, "duration_ms_p50": null, "duration_ms_p95": null, "tokens_per_sec_mean": null, "tokens_per_sec_p50": null, "tokens_per_sec_p95": null, "tokens_per_sec_max": null, "memory_mb": null, "watts_avg": null, "notes": null }, { "label": "qwen3:14b", "cell_id": "pavilion:weeyuga:qwen3:14b", "n_calls": 1, "n_errors": 1, "duration_ms_mean": null, "duration_ms_p50": null, "duration_ms_p95": null, "tokens_per_sec_mean": null, "tokens_per_sec_p50": null, "tokens_per_sec_p95": null, "tokens_per_sec_max": null, "memory_mb": null, "watts_avg": null, "notes": null }, { "label": "qwen3:8b", "cell_id": "pavilion:weeyuga:qwen3:8b", "n_calls": 1, "n_errors": 1, "duration_ms_mean": null, "duration_ms_p50": null, "duration_ms_p95": null, "tokens_per_sec_mean": null, "tokens_per_sec_p50": null, "tokens_per_sec_p95": null, "tokens_per_sec_max": null, "memory_mb": null, "watts_avg": null, "notes": null }, { "label": "qwen3:4b", "cell_id": "pavilion:weeyuga:qwen3:4b", "n_calls": 1, "n_errors": 0, "duration_ms_mean": null, "duration_ms_p50": null, "duration_ms_p95": null, "tokens_per_sec_mean": null, "tokens_per_sec_p50": null, "tokens_per_sec_p95": null, "tokens_per_sec_max": null, "memory_mb": null, "watts_avg": null, "notes": null }, { "label": "qwen2.5:3b", "cell_id": "pavilion:weeyuga:qwen2.5:3b", "n_calls": 1, "n_errors": 0, "duration_ms_mean": null, "duration_ms_p50": null, "duration_ms_p95": null, "tokens_per_sec_mean": null, "tokens_per_sec_p50": null, "tokens_per_sec_p95": null, "tokens_per_sec_max": null, "memory_mb": null, "watts_avg": null, "notes": null }, { "label": "qwen2.5-coder:1.5b", "cell_id": "pavilion:weeyuga:qwen2.5-coder:1.5b", "n_calls": 1, "n_errors": 0, "duration_ms_mean": null, "duration_ms_p50": null, "duration_ms_p95": null, "tokens_per_sec_mean": null, "tokens_per_sec_p50": null, "tokens_per_sec_p95": null, "tokens_per_sec_max": null, "memory_mb": null, "watts_avg": null, "notes": null }, { "label": "qwen2.5-coder:0.5b", "cell_id": "pavilion:weeyuga:qwen2.5-coder:0.5b", "n_calls": 1, "n_errors": 0, "duration_ms_mean": null, "duration_ms_p50": null, "duration_ms_p95": null, "tokens_per_sec_mean": null, "tokens_per_sec_p50": null, "tokens_per_sec_p95": null, "tokens_per_sec_max": null, "memory_mb": null, "watts_avg": null, "notes": null } ], "cells": [ { "cell_id": "pavilion:weeyuga:qwen3.5:4b", "n_calls": 2, "n_errors": 0, "duration_ms_mean": null, "duration_ms_p50": null, "duration_ms_p95": null, "tokens_per_sec_mean": null, "tokens_per_sec_p50": null, "tokens_per_sec_p95": null, "tokens_per_sec_max": null }, { "cell_id": "pavilion:weeyuga:qwen3.5:35b-a3b-uncensored-iq1m", "n_calls": 1, "n_errors": 0, "duration_ms_mean": null, "duration_ms_p50": null, "duration_ms_p95": null, "tokens_per_sec_mean": null, "tokens_per_sec_p50": null, "tokens_per_sec_p95": null, "tokens_per_sec_max": null }, { "cell_id": "pavilion:weeyuga:qwen3.5:35b-a3b-iq2s", "n_calls": 1, "n_errors": 0, "duration_ms_mean": null, "duration_ms_p50": null, "duration_ms_p95": null, "tokens_per_sec_mean": null, "tokens_per_sec_p50": null, "tokens_per_sec_p95": null, "tokens_per_sec_max": null }, { "cell_id": "pavilion:weeyuga:qwen3.5:9b-q6k", "n_calls": 1, "n_errors": 0, "duration_ms_mean": null, "duration_ms_p50": null, "duration_ms_p95": null, "tokens_per_sec_mean": null, "tokens_per_sec_p50": null, "tokens_per_sec_p95": null, "tokens_per_sec_max": null }, { "cell_id": "pavilion:weeyuga:qwen3.5:9b-q4km", "n_calls": 1, "n_errors": 0, "duration_ms_mean": null, "duration_ms_p50": null, "duration_ms_p95": null, "tokens_per_sec_mean": null, "tokens_per_sec_p50": null, "tokens_per_sec_p95": null, "tokens_per_sec_max": null }, { "cell_id": "pavilion:weeyuga:qwen3.5:2b", "n_calls": 1, "n_errors": 0, "duration_ms_mean": null, "duration_ms_p50": null, "duration_ms_p95": null, "tokens_per_sec_mean": null, "tokens_per_sec_p50": null, "tokens_per_sec_p95": null, "tokens_per_sec_max": null }, { "cell_id": "pavilion:weeyuga:qwen3.5:0.8b", "n_calls": 1, "n_errors": 0, "duration_ms_mean": null, "duration_ms_p50": null, "duration_ms_p95": null, "tokens_per_sec_mean": null, "tokens_per_sec_p50": null, "tokens_per_sec_p95": null, "tokens_per_sec_max": null }, { "cell_id": "pavilion:weeyuga:qwen3.5:9b", "n_calls": 1, "n_errors": 0, "duration_ms_mean": null, "duration_ms_p50": null, "duration_ms_p95": null, "tokens_per_sec_mean": null, "tokens_per_sec_p50": null, "tokens_per_sec_p95": null, "tokens_per_sec_max": null }, { "cell_id": "pavilion:weeyuga:qwen2.5-coder:14b", "n_calls": 1, "n_errors": 1, "duration_ms_mean": null, "duration_ms_p50": null, "duration_ms_p95": null, "tokens_per_sec_mean": null, "tokens_per_sec_p50": null, "tokens_per_sec_p95": null, "tokens_per_sec_max": null }, { "cell_id": "pavilion:weeyuga:qwen2.5-coder:3b", "n_calls": 1, "n_errors": 0, "duration_ms_mean": null, "duration_ms_p50": null, "duration_ms_p95": null, "tokens_per_sec_mean": null, "tokens_per_sec_p50": null, "tokens_per_sec_p95": null, "tokens_per_sec_max": null }, { "cell_id": "pavilion:weeyuga:qwen3:14b", "n_calls": 1, "n_errors": 1, "duration_ms_mean": null, "duration_ms_p50": null, "duration_ms_p95": null, "tokens_per_sec_mean": null, "tokens_per_sec_p50": null, "tokens_per_sec_p95": null, "tokens_per_sec_max": null }, { "cell_id": "pavilion:weeyuga:qwen3:8b", "n_calls": 1, "n_errors": 1, "duration_ms_mean": null, "duration_ms_p50": null, "duration_ms_p95": null, "tokens_per_sec_mean": null, "tokens_per_sec_p50": null, "tokens_per_sec_p95": null, "tokens_per_sec_max": null }, { "cell_id": "pavilion:weeyuga:qwen3:4b", "n_calls": 1, "n_errors": 0, "duration_ms_mean": null, "duration_ms_p50": null, "duration_ms_p95": null, "tokens_per_sec_mean": null, "tokens_per_sec_p50": null, "tokens_per_sec_p95": null, "tokens_per_sec_max": null }, { "cell_id": "pavilion:weeyuga:qwen2.5:3b", "n_calls": 1, "n_errors": 0, "duration_ms_mean": null, "duration_ms_p50": null, "duration_ms_p95": null, "tokens_per_sec_mean": null, "tokens_per_sec_p50": null, "tokens_per_sec_p95": null, "tokens_per_sec_max": null }, { "cell_id": "pavilion:weeyuga:qwen2.5-coder:1.5b", "n_calls": 1, "n_errors": 0, "duration_ms_mean": null, "duration_ms_p50": null, "duration_ms_p95": null, "tokens_per_sec_mean": null, "tokens_per_sec_p50": null, "tokens_per_sec_p95": null, "tokens_per_sec_max": null }, { "cell_id": "pavilion:weeyuga:qwen2.5-coder:0.5b", "n_calls": 1, "n_errors": 0, "duration_ms_mean": null, "duration_ms_p50": null, "duration_ms_p95": null, "tokens_per_sec_mean": null, "tokens_per_sec_p50": null, "tokens_per_sec_p95": null, "tokens_per_sec_max": null } ], "n_calls_total": 17, "n_errors_total": 3, "chart_spec": { "kind": "bar", "x": "cell", "y": "tokens_per_sec_mean", "series": [ "qwen3.5:4b", "qwen3.5:35b-a3b-uncensored-iq1m", "qwen3.5:35b-a3b-iq2s", "qwen3.5:9b-q6k", "qwen3.5:9b-q4km", "qwen3.5:2b", "qwen3.5:0.8b", "qwen3.5:9b", "qwen2.5-coder:14b", "qwen2.5-coder:3b", "qwen3:14b", "qwen3:8b", "qwen3:4b", "qwen2.5:3b", "qwen2.5-coder:1.5b", "qwen2.5-coder:0.5b" ], "data_url": "/data/ff1131ca-d021-4e06-8616-4b4cdb54e97e/run.jsonl" }, "site_grade": "archive-only", "site_grade_reason": "error rate 3/17", "raw_data_urls": { "jsonl": "/data/ff1131ca-d021-4e06-8616-4b4cdb54e97e/run.jsonl", "log": null, "md": null, "metadata": "/data/ff1131ca-d021-4e06-8616-4b4cdb54e97e/metadata.json", "gitea_dir": "https://git.weeyuga.com/slobodanmargetic988/weeyuga-benchmarks-public/src/branch/main/runs/ff1131ca-d021-4e06-8616-4b4cdb54e97e/" }, "synthesis_doc": "PAVILION_WEEYUGA_v1.md", "synthesis_docs_all": [ "PAVILION_WEEYUGA_v1.md", "PAVILION_LLAMACPP_VS_OLLAMA_v0_INCOMPLETE.md" ], "related_ids": [], "status": "complete", "visibility": "draft", "cells_full": [ { "cell_id": "pavilion:weeyuga:qwen3.5:4b", "n_calls": 2, "n_errors": 0, "duration_ms_mean": null, "duration_ms_p50": null, "duration_ms_p95": null, "tokens_per_sec_mean": null, "tokens_per_sec_p50": null, "tokens_per_sec_p95": null, "tokens_per_sec_max": null, "calls": [ { "type": "call", "ts_utc": "2026-04-28T21:03:50Z", "cell_id": "pavilion:weeyuga:qwen3.5:4b", "model": "qwen3.5:4b", "phase": "hello", "question_id": "hello_check", "run_idx": 0, "duration_seconds": 4.039, "prompt_tokens": 16, "completion_tokens": 128, "tokens_per_second": 31.69, "finish_reason": "stop", "weeyuga_meta": null, "status_code": 200, "response_chars": 57, "response_preview": "Hello! I'm glad to help you. What would you like to do? \ud83d\ude0a", "required_markers": [], "markers_hit": [], "marker_hit_rate": null, "format_rule": "", "format_ok": null, "usable_answer": true, "error": null }, { "type": "call", "ts_utc": "2026-04-28T21:33:26Z", "cell_id": "pavilion:weeyuga:qwen3.5:4b", "model": "qwen3.5:4b", "phase": "5q", "question_id": "disk_guard_bash", "run_idx": 0, "duration_seconds": 32.117, "prompt_tokens": 71, "completion_tokens": 1125, "tokens_per_second": 35.03, "finish_reason": "stop", "weeyuga_meta": null, "status_code": 200, "response_chars": 247, "response_preview": "#!/bin/bash\n\n# Check disk usage for /\nif [ -d \"/\" ]; then\n disk_usage=$(df -P / | awk '{print $5}')\n if [ \"$disk_usage\" -gt 85 ]; then\n echo \"WARNING: Disk usage for / is at ${disk_usage}% (above 85%)\"\n exit 1\n fi\nfi\n", "required_markers": [ "#!/usr/bin/env bash", "df -P /", "85", "exit 1" ], "markers_hit": [ "df -P /", "85", "exit 1" ], "marker_hit_rate": 0.75, "format_rule": "bash_code", "format_ok": false, "usable_answer": true, "error": null } ] }, { "cell_id": "pavilion:weeyuga:qwen3.5:35b-a3b-uncensored-iq1m", "n_calls": 1, "n_errors": 0, "duration_ms_mean": null, "duration_ms_p50": null, "duration_ms_p95": null, "tokens_per_sec_mean": null, "tokens_per_sec_p50": null, "tokens_per_sec_p95": null, "tokens_per_sec_max": null, "calls": [ { "type": "call", "ts_utc": "2026-04-28T21:03:56Z", "cell_id": "pavilion:weeyuga:qwen3.5:35b-a3b-uncensored-iq1m", "model": "qwen3.5:35b-a3b-uncensored-iq1m", "phase": "hello", "question_id": "hello_check", "run_idx": 0, "duration_seconds": 5.989, "prompt_tokens": 16, "completion_tokens": 226, "tokens_per_second": 37.74, "finish_reason": "stop", "weeyuga_meta": null, "status_code": 200, "response_chars": 91, "response_preview": "Hello! I'd be happy to help you with anything you need. What can I assist you with today? \ud83d\ude0a", "required_markers": [], "markers_hit": [], "marker_hit_rate": null, "format_rule": "", "format_ok": null, "usable_answer": true, "error": null } ] }, { "cell_id": "pavilion:weeyuga:qwen3.5:35b-a3b-iq2s", "n_calls": 1, "n_errors": 0, "duration_ms_mean": null, "duration_ms_p50": null, "duration_ms_p95": null, "tokens_per_sec_mean": null, "tokens_per_sec_p50": null, "tokens_per_sec_p95": null, "tokens_per_sec_max": null, "calls": [ { "type": "call", "ts_utc": "2026-04-28T21:04:00Z", "cell_id": "pavilion:weeyuga:qwen3.5:35b-a3b-iq2s", "model": "qwen3.5:35b-a3b-iq2s", "phase": "hello", "question_id": "hello_check", "run_idx": 0, "duration_seconds": 4.033, "prompt_tokens": 16, "completion_tokens": 126, "tokens_per_second": 31.24, "finish_reason": "stop", "weeyuga_meta": null, "status_code": 200, "response_chars": 57, "response_preview": "Hello! I'd love to help you. What would you like to do? \ud83d\ude0a", "required_markers": [], "markers_hit": [], "marker_hit_rate": null, "format_rule": "", "format_ok": null, "usable_answer": true, "error": null } ] }, { "cell_id": "pavilion:weeyuga:qwen3.5:9b-q6k", "n_calls": 1, "n_errors": 0, "duration_ms_mean": null, "duration_ms_p50": null, "duration_ms_p95": null, "tokens_per_sec_mean": null, "tokens_per_sec_p50": null, "tokens_per_sec_p95": null, "tokens_per_sec_max": null, "calls": [ { "type": "call", "ts_utc": "2026-04-28T21:04:03Z", "cell_id": "pavilion:weeyuga:qwen3.5:9b-q6k", "model": "qwen3.5:9b-q6k", "phase": "hello", "question_id": "hello_check", "run_idx": 0, "duration_seconds": 3.754, "prompt_tokens": 16, "completion_tokens": 139, "tokens_per_second": 37.03, "finish_reason": "stop", "weeyuga_meta": null, "status_code": 200, "response_chars": 159, "response_preview": "Hello! I'd love to help you. What would you like to work on today? Whether it's writing, coding, problem-solving, or just chatting, feel free to let me know! \ud83d\ude0a", "required_markers": [], "markers_hit": [], "marker_hit_rate": null, "format_rule": "", "format_ok": null, "usable_answer": true, "error": null } ] }, { "cell_id": "pavilion:weeyuga:qwen3.5:9b-q4km", "n_calls": 1, "n_errors": 0, "duration_ms_mean": null, "duration_ms_p50": null, "duration_ms_p95": null, "tokens_per_sec_mean": null, "tokens_per_sec_p50": null, "tokens_per_sec_p95": null, "tokens_per_sec_max": null, "calls": [ { "type": "call", "ts_utc": "2026-04-28T21:04:07Z", "cell_id": "pavilion:weeyuga:qwen3.5:9b-q4km", "model": "qwen3.5:9b-q4km", "phase": "hello", "question_id": "hello_check", "run_idx": 0, "duration_seconds": 3.684, "prompt_tokens": 16, "completion_tokens": 143, "tokens_per_second": 38.82, "finish_reason": "stop", "weeyuga_meta": null, "status_code": 200, "response_chars": 61, "response_preview": "Hello! I'd be happy to help you. What would you like to do? \ud83d\ude0a", "required_markers": [], "markers_hit": [], "marker_hit_rate": null, "format_rule": "", "format_ok": null, "usable_answer": true, "error": null } ] }, { "cell_id": "pavilion:weeyuga:qwen3.5:2b", "n_calls": 1, "n_errors": 0, "duration_ms_mean": null, "duration_ms_p50": null, "duration_ms_p95": null, "tokens_per_sec_mean": null, "tokens_per_sec_p50": null, "tokens_per_sec_p95": null, "tokens_per_sec_max": null, "calls": [ { "type": "call", "ts_utc": "2026-04-28T21:04:12Z", "cell_id": "pavilion:weeyuga:qwen3.5:2b", "model": "qwen3.5:2b", "phase": "hello", "question_id": "hello_check", "run_idx": 0, "duration_seconds": 4.749, "prompt_tokens": 16, "completion_tokens": 180, "tokens_per_second": 37.9, "finish_reason": "stop", "weeyuga_meta": null, "status_code": 200, "response_chars": 187, "response_preview": "Hello! I'd love to help you. What would you like to work on today? Whether it's learning a new skill, solving a problem, brainstorming ideas, or just chatting, feel free to let me know! \ud83d\ude0a", "required_markers": [], "markers_hit": [], "marker_hit_rate": null, "format_rule": "", "format_ok": null, "usable_answer": true, "error": null } ] }, { "cell_id": "pavilion:weeyuga:qwen3.5:0.8b", "n_calls": 1, "n_errors": 0, "duration_ms_mean": null, "duration_ms_p50": null, "duration_ms_p95": null, "tokens_per_sec_mean": null, "tokens_per_sec_p50": null, "tokens_per_sec_p95": null, "tokens_per_sec_max": null, "calls": [ { "type": "call", "ts_utc": "2026-04-28T21:04:15Z", "cell_id": "pavilion:weeyuga:qwen3.5:0.8b", "model": "qwen3.5:0.8b", "phase": "hello", "question_id": "hello_check", "run_idx": 0, "duration_seconds": 3.479, "prompt_tokens": 16, "completion_tokens": 133, "tokens_per_second": 38.23, "finish_reason": "stop", "weeyuga_meta": null, "status_code": 200, "response_chars": 63, "response_preview": "Hello! I'd love to help you. What would you like to do today? \ud83d\ude0a", "required_markers": [], "markers_hit": [], "marker_hit_rate": null, "format_rule": "", "format_ok": null, "usable_answer": true, "error": null } ] }, { "cell_id": "pavilion:weeyuga:qwen3.5:9b", "n_calls": 1, "n_errors": 0, "duration_ms_mean": null, "duration_ms_p50": null, "duration_ms_p95": null, "tokens_per_sec_mean": null, "tokens_per_sec_p50": null, "tokens_per_sec_p95": null, "tokens_per_sec_max": null, "calls": [ { "type": "call", "ts_utc": "2026-04-28T21:04:42Z", "cell_id": "pavilion:weeyuga:qwen3.5:9b", "model": "qwen3.5:9b", "phase": "hello", "question_id": "hello_check", "run_idx": 0, "duration_seconds": 26.517, "prompt_tokens": 16, "completion_tokens": 1081, "tokens_per_second": 40.77, "finish_reason": "stop", "weeyuga_meta": null, "status_code": 200, "response_chars": 179, "response_preview": "Hi! I'd be happy to help you. What would you like to do today? I can assist with a wide range of tasks, from writing code to answering questions. Please let me know what you need.", "required_markers": [], "markers_hit": [], "marker_hit_rate": null, "format_rule": "", "format_ok": null, "usable_answer": true, "error": null } ] }, { "cell_id": "pavilion:weeyuga:qwen2.5-coder:14b", "n_calls": 1, "n_errors": 1, "duration_ms_mean": null, "duration_ms_p50": null, "duration_ms_p95": null, "tokens_per_sec_mean": null, "tokens_per_sec_p50": null, "tokens_per_sec_p95": null, "tokens_per_sec_max": null, "calls": [ { "type": "call", "ts_utc": "2026-04-28T21:10:42Z", "cell_id": "pavilion:weeyuga:qwen2.5-coder:14b", "model": "qwen2.5-coder:14b", "phase": "hello", "question_id": "hello_check", "run_idx": 0, "duration_seconds": 360.061, "prompt_tokens": null, "completion_tokens": null, "tokens_per_second": null, "finish_reason": null, "weeyuga_meta": null, "status_code": null, "response_chars": 0, "response_preview": "", "required_markers": [], "markers_hit": [], "marker_hit_rate": null, "format_rule": "", "format_ok": null, "usable_answer": false, "error": "TimeoutError('timed out')" } ] }, { "cell_id": "pavilion:weeyuga:qwen2.5-coder:3b", "n_calls": 1, "n_errors": 0, "duration_ms_mean": null, "duration_ms_p50": null, "duration_ms_p95": null, "tokens_per_sec_mean": null, "tokens_per_sec_p50": null, "tokens_per_sec_p95": null, "tokens_per_sec_max": null, "calls": [ { "type": "call", "ts_utc": "2026-04-28T21:15:12Z", "cell_id": "pavilion:weeyuga:qwen2.5-coder:3b", "model": "qwen2.5-coder:3b", "phase": "hello", "question_id": "hello_check", "run_idx": 0, "duration_seconds": 269.603, "prompt_tokens": 35, "completion_tokens": 17, "tokens_per_second": 0.06, "finish_reason": "stop", "weeyuga_meta": null, "status_code": 200, "response_chars": 62, "response_preview": "Of course! I'm here to help. What do you need assistance with?", "required_markers": [], "markers_hit": [], "marker_hit_rate": null, "format_rule": "", "format_ok": null, "usable_answer": true, "error": null } ] }, { "cell_id": "pavilion:weeyuga:qwen3:14b", "n_calls": 1, "n_errors": 1, "duration_ms_mean": null, "duration_ms_p50": null, "duration_ms_p95": null, "tokens_per_sec_mean": null, "tokens_per_sec_p50": null, "tokens_per_sec_p95": null, "tokens_per_sec_max": null, "calls": [ { "type": "call", "ts_utc": "2026-04-28T21:21:12Z", "cell_id": "pavilion:weeyuga:qwen3:14b", "model": "qwen3:14b", "phase": "hello", "question_id": "hello_check", "run_idx": 0, "duration_seconds": 360.083, "prompt_tokens": null, "completion_tokens": null, "tokens_per_second": null, "finish_reason": null, "weeyuga_meta": null, "status_code": null, "response_chars": 0, "response_preview": "", "required_markers": [], "markers_hit": [], "marker_hit_rate": null, "format_rule": "", "format_ok": null, "usable_answer": false, "error": "TimeoutError('timed out')" } ] }, { "cell_id": "pavilion:weeyuga:qwen3:8b", "n_calls": 1, "n_errors": 1, "duration_ms_mean": null, "duration_ms_p50": null, "duration_ms_p95": null, "tokens_per_sec_mean": null, "tokens_per_sec_p50": null, "tokens_per_sec_p95": null, "tokens_per_sec_max": null, "calls": [ { "type": "call", "ts_utc": "2026-04-28T21:27:12Z", "cell_id": "pavilion:weeyuga:qwen3:8b", "model": "qwen3:8b", "phase": "hello", "question_id": "hello_check", "run_idx": 0, "duration_seconds": 360.084, "prompt_tokens": null, "completion_tokens": null, "tokens_per_second": null, "finish_reason": null, "weeyuga_meta": null, "status_code": null, "response_chars": 0, "response_preview": "", "required_markers": [], "markers_hit": [], "marker_hit_rate": null, "format_rule": "", "format_ok": null, "usable_answer": false, "error": "TimeoutError('timed out')" } ] }, { "cell_id": "pavilion:weeyuga:qwen3:4b", "n_calls": 1, "n_errors": 0, "duration_ms_mean": null, "duration_ms_p50": null, "duration_ms_p95": null, "tokens_per_sec_mean": null, "tokens_per_sec_p50": null, "tokens_per_sec_p95": null, "tokens_per_sec_max": null, "calls": [ { "type": "call", "ts_utc": "2026-04-28T21:31:48Z", "cell_id": "pavilion:weeyuga:qwen3:4b", "model": "qwen3:4b", "phase": "hello", "question_id": "hello_check", "run_idx": 0, "duration_seconds": 276.449, "prompt_tokens": 16, "completion_tokens": 457, "tokens_per_second": 1.65, "finish_reason": "stop", "weeyuga_meta": null, "status_code": 200, "response_chars": 502, "response_preview": "Of course! \ud83d\ude0a I'm here to help with **anything** you need \u2014 whether it's homework, tech issues, writing, math, science, life advice, or just brainstorming ideas. \n\n**Just tell me:** \n- What\u2019s *specifically* on your mind? \n- What\u2019s stuck? ", "required_markers": [], "markers_hit": [], "marker_hit_rate": null, "format_rule": "", "format_ok": null, "usable_answer": true, "error": null } ] }, { "cell_id": "pavilion:weeyuga:qwen2.5:3b", "n_calls": 1, "n_errors": 0, "duration_ms_mean": null, "duration_ms_p50": null, "duration_ms_p95": null, "tokens_per_sec_mean": null, "tokens_per_sec_p50": null, "tokens_per_sec_p95": null, "tokens_per_sec_max": null, "calls": [ { "type": "call", "ts_utc": "2026-04-28T21:32:19Z", "cell_id": "pavilion:weeyuga:qwen2.5:3b", "model": "qwen2.5:3b", "phase": "hello", "question_id": "hello_check", "run_idx": 0, "duration_seconds": 31.33, "prompt_tokens": 35, "completion_tokens": 50, "tokens_per_second": 1.6, "finish_reason": "stop", "weeyuga_meta": null, "status_code": 200, "response_chars": 208, "response_preview": "Of course! I'd be happy to help. What can I assist you with today? Whether it's information on cloud computing services, general advice, or any other query, feel free to ask and I'll do my best to assist you.", "required_markers": [], "markers_hit": [], "marker_hit_rate": null, "format_rule": "", "format_ok": null, "usable_answer": true, "error": null } ] }, { "cell_id": "pavilion:weeyuga:qwen2.5-coder:1.5b", "n_calls": 1, "n_errors": 0, "duration_ms_mean": null, "duration_ms_p50": null, "duration_ms_p95": null, "tokens_per_sec_mean": null, "tokens_per_sec_p50": null, "tokens_per_sec_p95": null, "tokens_per_sec_max": null, "calls": [ { "type": "call", "ts_utc": "2026-04-28T21:32:40Z", "cell_id": "pavilion:weeyuga:qwen2.5-coder:1.5b", "model": "qwen2.5-coder:1.5b", "phase": "hello", "question_id": "hello_check", "run_idx": 0, "duration_seconds": 20.572, "prompt_tokens": 35, "completion_tokens": 11, "tokens_per_second": 0.53, "finish_reason": "stop", "weeyuga_meta": null, "status_code": 200, "response_chars": 38, "response_preview": "Of course! How may I assist you today?", "required_markers": [], "markers_hit": [], "marker_hit_rate": null, "format_rule": "", "format_ok": null, "usable_answer": true, "error": null } ] }, { "cell_id": "pavilion:weeyuga:qwen2.5-coder:0.5b", "n_calls": 1, "n_errors": 0, "duration_ms_mean": null, "duration_ms_p50": null, "duration_ms_p95": null, "tokens_per_sec_mean": null, "tokens_per_sec_p50": null, "tokens_per_sec_p95": null, "tokens_per_sec_max": null, "calls": [ { "type": "call", "ts_utc": "2026-04-28T21:32:53Z", "cell_id": "pavilion:weeyuga:qwen2.5-coder:0.5b", "model": "qwen2.5-coder:0.5b", "phase": "hello", "question_id": "hello_check", "run_idx": 0, "duration_seconds": 13.367, "prompt_tokens": 35, "completion_tokens": 11, "tokens_per_second": 0.82, "finish_reason": "stop", "weeyuga_meta": null, "status_code": 200, "response_chars": 38, "response_preview": "Of course! How can I assist you today?", "required_markers": [], "markers_hit": [], "marker_hit_rate": null, "format_rule": "", "format_ok": null, "usable_answer": true, "error": null } ] } ], "meta_record": { "type": "meta", "benchmark_run_id": "ff1131ca-d021-4e06-8616-4b4cdb54e97e", "harness_version": "1", "harness_path": "scripts/benchmarks/run_pavilion_weeyuga.py", "git_sha": "9934892784228748586130d8abbacd82a919aee2", "git_dirty": true, "started_at_utc": "2026-04-28T21:03:46Z", "host": "Slobodans-MacBook-Air.local", "load_avg_start": [ 2.5576171875, 2.47900390625, 2.16552734375 ], "weeyuga_url": "http://10.8.0.3:11435", "phase_plan": "hello+5q", "models_planned": [ "qwen3.5:4b", "qwen3.5:35b-a3b-uncensored-iq1m", "qwen3.5:35b-a3b-iq2s", "qwen3.5:9b-q6k", "qwen3.5:9b-q4km", "qwen3.5:2b", "qwen3.5:0.8b", "qwen3.5:9b", "qwen2.5-coder:14b", "qwen2.5-coder:3b", "qwen3:14b", "qwen3:8b", "qwen3:4b", "qwen2.5:3b", "qwen2.5-coder:1.5b", "qwen2.5-coder:0.5b" ], "canonical_options": { "temperature": 0.1, "num_ctx": 4096, "num_predict": 2048 }, "timeout_seconds": 360, "suite_5q_path": "/Users/slobodan/Documents/MyServers/instances/vps-81-17-99-14/telemetry/small_model_eval_questions.json", "suite_20q_path": "/Users/slobodan/Documents/MyServers/instances/vps-81-17-99-14/telemetry/python_task_suite_questions.json", "env_inference_route": null, "env_llamacpp_url": null }, "packaged_at": "2026-05-06T08:04:27Z" }