{
    "tested_at":  "2026-06-16T15:31:18-05:00",
    "host_cpu":  "AMD Ryzen 7 9800X3D 8-Core Processor",
    "host_logical_processors":  16,
    "host_physical_memory_gb":  31.1,
    "docker_container":  "aijupyter-8gb-cpu-ollama",
    "docker_memory_limit":  "8GiB",
    "docker_gpu_requests":  null,
    "ollama_version":  "ollama version is 0.30.8",
    "prompt":  "Write a concise 6-bullet recommendation for running a private local AI assistant on an 8GB RAM CPU-only laptop. Mention model size, context length, and what to avoid.",
    "options":  {
                    "temperature":  0,
                    "num_predict":  128,
                    "num_ctx":  2048
                },
    "results":  [
                    {
                        "model":  "qwen2.5:0.5b",
                        "status":  "ok",
                        "wall_seconds":  2.47,
                        "eval_count":  128,
                        "eval_duration_ns":  2206121000,
                        "tokens_per_second":  58.02,
                        "prompt_eval_count":  66,
                        "prompt_eval_duration_ns":  37710000,
                        "prompt_tokens_per_second":  1750.2,
                        "load_duration_ns":  158483846,
                        "total_duration_ns":  2413691026,
                        "docker_stats":  "0.01%|1003MiB / 8GiB|12.24%"
                    },
                    {
                        "model":  "gemma3:1b",
                        "status":  "ok",
                        "wall_seconds":  7.32,
                        "eval_count":  128,
                        "eval_duration_ns":  4169152000,
                        "tokens_per_second":  30.7,
                        "prompt_eval_count":  48,
                        "prompt_eval_duration_ns":  167221000,
                        "prompt_tokens_per_second":  287.05,
                        "load_duration_ns":  2971953639,
                        "total_duration_ns":  7314357684,
                        "docker_stats":  "0.00%|2.132GiB / 8GiB|26.65%"
                    },
                    {
                        "model":  "llama3.2:1b",
                        "status":  "ok",
                        "wall_seconds":  7.87,
                        "eval_count":  128,
                        "eval_duration_ns":  4943054000,
                        "tokens_per_second":  25.89,
                        "prompt_eval_count":  62,
                        "prompt_eval_duration_ns":  195995000,
                        "prompt_tokens_per_second":  316.33,
                        "load_duration_ns":  2724832460,
                        "total_duration_ns":  7866306547,
                        "docker_stats":  "0.00%|3.295GiB / 8GiB|41.18%"
                    },
                    {
                        "model":  "qwen2.5:1.5b",
                        "status":  "ok",
                        "wall_seconds":  7.65,
                        "eval_count":  128,
                        "eval_duration_ns":  4989917000,
                        "tokens_per_second":  25.65,
                        "prompt_eval_count":  66,
                        "prompt_eval_duration_ns":  199240000,
                        "prompt_tokens_per_second":  331.26,
                        "load_duration_ns":  2451435000,
                        "total_duration_ns":  7643440955,
                        "docker_stats":  "0.00%|3.88GiB / 8GiB|48.50%"
                    },
                    {
                        "model":  "qwen2.5:3b",
                        "status":  "ok",
                        "wall_seconds":  13.94,
                        "eval_count":  128,
                        "eval_duration_ns":  7631340000,
                        "tokens_per_second":  16.77,
                        "prompt_eval_count":  66,
                        "prompt_eval_duration_ns":  350267000,
                        "prompt_tokens_per_second":  188.43,
                        "load_duration_ns":  5955588356,
                        "total_duration_ns":  13940555830,
                        "docker_stats":  "0.00%|4.45GiB / 8GiB|55.63%"
                    },
                    {
                        "model":  "qwen2.5:7b",
                        "status":  "ok",
                        "wall_seconds":  30.07,
                        "eval_count":  128,
                        "eval_duration_ns":  17913700000,
                        "tokens_per_second":  7.15,
                        "prompt_eval_count":  66,
                        "prompt_eval_duration_ns":  868451000,
                        "prompt_tokens_per_second":  76,
                        "load_duration_ns":  11277969475,
                        "total_duration_ns":  30064768560,
                        "docker_stats":  "0.00%|6.409GiB / 8GiB|80.11%"
                    }
                ]
}
