{
  "evidenceVersion": "local-ollama-speed-v1",
  "capturedAt": "2026-06-01T21:37:47.079Z",
  "hardwareSlug": "rtx-3080-16gb-mobile",
  "modelTag": "gemma4:e2b",
  "catalogSlug": "gemma-4-e2b",
  "quant": "Q4_K_M",
  "contextSize": 4096,
  "numPredict": 256,
  "prompt": "Write a detailed explanation of how transformer attention works.",
  "scenario": "single-stream",
  "runtime": "ollama-api",
  "command": "POST http://localhost:11434/api/generate model=gemma4:e2b temperature=0 top_p=1 seed=42 num_ctx=4096 num_predict=256",
  "env": {
    "os": "Microsoft Windows [Version 10.0.26200.8457]",
    "platform": "win32",
    "arch": "x64",
    "cpu": "AMD Ryzen 9 5900HX with Radeon Graphics        ",
    "cpuThreads": 16,
    "ramGb": 31.9,
    "gpu": {
      "vendor": "nvidia",
      "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
      "driver": "571.96",
      "memoryTotalMb": 16384,
      "memoryUsedMb": 4862,
      "tempC": 68,
      "smClockMhz": 630,
      "powerDrawW": 30.14
    },
    "ollamaVersionCli": "ollama version is 0.24.0",
    "ollamaApiVersion": {
      "version": "0.24.0"
    }
  },
  "ollamaTagDetails": {
    "name": "gemma4:e2b",
    "model": "gemma4:e2b",
    "modified_at": "2026-06-02T00:37:17.8443429+03:00",
    "size": 7162405886,
    "digest": "7fbdbf8f5e45a75bb122155ed546e765b4d9c53a1285f62fd9f506baa1c5a47e",
    "details": {
      "parent_model": "",
      "format": "gguf",
      "family": "gemma4",
      "families": [
        "gemma4"
      ],
      "parameter_size": "5.1B",
      "quantization_level": "Q4_K_M"
    }
  },
  "notes": null,
  "logHashSha256": "02de93d01da2baae179b2ff0259688102a75ad3b3d9e46ded7a1a193c3591fcb",
  "runsCaptured": 5,
  "decodeStatsAllRuns": {
    "min": 98.1199188686252,
    "max": 101.16630123633519,
    "median": 98.5332706825954,
    "p5": 98.13652834976038,
    "p95": 100.92078912407851,
    "mean": 99.19223954738173,
    "n": 5
  },
  "decodeStatsSteadyRuns": {
    "min": 98.1199188686252,
    "max": 101.16630123633519,
    "median": 99.07085347467645,
    "p5": 98.13237597947658,
    "p95": 100.98216715214268,
    "mean": 99.35698176357833,
    "n": 4
  },
  "runs": [
    {
      "runIndex": 1,
      "startedAt": "2026-06-01T21:37:20.302Z",
      "finishedAt": "2026-06-01T21:37:32.041Z",
      "rawPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-01/gemma4-e2b/run1.ollama.json",
      "logPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-01/gemma4-e2b/run1.log",
      "decodeTokPerSec": 98.5332706825954,
      "prefillTokPerSec": 581.3784483009215,
      "totalMs": 11648.9642,
      "loadMs": 8433.8578,
      "promptEvalMs": 44.7213,
      "evalMs": 2598.1072,
      "promptTokens": 26,
      "responseTokens": 256,
      "responseHashSha256": "e3b0c44298fc1c149afbf4c8996fb92427ae41e4649b934ca495991b7852b855",
      "beforeGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 4862,
        "tempC": 68,
        "smClockMhz": 630,
        "powerDrawW": 30.14
      },
      "afterGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 12087,
        "tempC": 74,
        "smClockMhz": 1725,
        "powerDrawW": 110.71
      }
    },
    {
      "runIndex": 2,
      "startedAt": "2026-06-01T21:37:32.130Z",
      "finishedAt": "2026-06-01T21:37:35.859Z",
      "rawPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-01/gemma4-e2b/run2.ollama.json",
      "logPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-01/gemma4-e2b/run2.log",
      "decodeTokPerSec": 98.20296627430106,
      "prefillTokPerSec": 1851.614465381931,
      "totalMs": 3602.1838,
      "loadMs": 801.0859,
      "promptEvalMs": 14.0418,
      "evalMs": 2606.8459,
      "promptTokens": 26,
      "responseTokens": 256,
      "responseHashSha256": "e3b0c44298fc1c149afbf4c8996fb92427ae41e4649b934ca495991b7852b855",
      "beforeGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 12087,
        "tempC": 74,
        "smClockMhz": 1725,
        "powerDrawW": 110.71
      },
      "afterGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 12087,
        "tempC": 75,
        "smClockMhz": 1710,
        "powerDrawW": 109.84
      }
    },
    {
      "runIndex": 3,
      "startedAt": "2026-06-01T21:37:35.952Z",
      "finishedAt": "2026-06-01T21:37:39.624Z",
      "rawPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-01/gemma4-e2b/run3.ollama.json",
      "logPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-01/gemma4-e2b/run3.log",
      "decodeTokPerSec": 98.1199188686252,
      "prefillTokPerSec": 1822.5533973096308,
      "totalMs": 3583.8954,
      "loadMs": 755.1229,
      "promptEvalMs": 14.2657,
      "evalMs": 2609.0523,
      "promptTokens": 26,
      "responseTokens": 256,
      "responseHashSha256": "e3b0c44298fc1c149afbf4c8996fb92427ae41e4649b934ca495991b7852b855",
      "beforeGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 12087,
        "tempC": 75,
        "smClockMhz": 1755,
        "powerDrawW": 104.01
      },
      "afterGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 12088,
        "tempC": 76,
        "smClockMhz": 1695,
        "powerDrawW": 113.46
      }
    },
    {
      "runIndex": 4,
      "startedAt": "2026-06-01T21:37:39.711Z",
      "finishedAt": "2026-06-01T21:37:43.420Z",
      "rawPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-01/gemma4-e2b/run4.ollama.json",
      "logPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-01/gemma4-e2b/run4.log",
      "decodeTokPerSec": 99.93874067505183,
      "prefillTokPerSec": 1509.372623463778,
      "totalMs": 3622.0426,
      "loadMs": 805.5522,
      "promptEvalMs": 17.2257,
      "evalMs": 2561.5692,
      "promptTokens": 26,
      "responseTokens": 256,
      "responseHashSha256": "e3b0c44298fc1c149afbf4c8996fb92427ae41e4649b934ca495991b7852b855",
      "beforeGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 12088,
        "tempC": 76,
        "smClockMhz": 1695,
        "powerDrawW": 109.45
      },
      "afterGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 12088,
        "tempC": 77,
        "smClockMhz": 1710,
        "powerDrawW": 113.47
      }
    },
    {
      "runIndex": 5,
      "startedAt": "2026-06-01T21:37:43.507Z",
      "finishedAt": "2026-06-01T21:37:47.077Z",
      "rawPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-01/gemma4-e2b/run5.ollama.json",
      "logPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-01/gemma4-e2b/run5.log",
      "decodeTokPerSec": 101.16630123633519,
      "prefillTokPerSec": 1750.158187374628,
      "totalMs": 3490.7712,
      "loadMs": 708.2207,
      "promptEvalMs": 14.8558,
      "evalMs": 2530.4869,
      "promptTokens": 26,
      "responseTokens": 256,
      "responseHashSha256": "e3b0c44298fc1c149afbf4c8996fb92427ae41e4649b934ca495991b7852b855",
      "beforeGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 12088,
        "tempC": 77,
        "smClockMhz": 1755,
        "powerDrawW": 109.28
      },
      "afterGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 12087,
        "tempC": 77,
        "smClockMhz": 1710,
        "powerDrawW": 113.8
      }
    }
  ],
  "errors": [],
  "uploadEligible": true
}