{
  "evidenceVersion": "local-ollama-speed-v1",
  "capturedAt": "2026-06-01T21:36:38.744Z",
  "hardwareSlug": "rtx-3080-16gb-mobile",
  "modelTag": "gemma3:1b",
  "catalogSlug": "gemma-3-1b",
  "quant": "Q4_K_M",
  "contextSize": 4096,
  "numPredict": 256,
  "prompt": "Write a detailed explanation of how transformer attention works.",
  "scenario": "single-stream",
  "runtime": "ollama-api",
  "command": "POST http://localhost:11434/api/generate model=gemma3:1b temperature=0 top_p=1 seed=42 num_ctx=4096 num_predict=256",
  "env": {
    "os": "Microsoft Windows [Version 10.0.26200.8457]",
    "platform": "win32",
    "arch": "x64",
    "cpu": "AMD Ryzen 9 5900HX with Radeon Graphics        ",
    "cpuThreads": 16,
    "ramGb": 31.9,
    "gpu": {
      "vendor": "nvidia",
      "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
      "driver": "571.96",
      "memoryTotalMb": 16384,
      "memoryUsedMb": 1889,
      "tempC": 65,
      "smClockMhz": 495,
      "powerDrawW": 29.91
    },
    "ollamaVersionCli": "ollama version is 0.24.0",
    "ollamaApiVersion": {
      "version": "0.24.0"
    }
  },
  "ollamaTagDetails": {
    "name": "gemma3:1b",
    "model": "gemma3:1b",
    "modified_at": "2026-06-02T00:30:36.8238262+03:00",
    "size": 815319791,
    "digest": "8648f39daa8fbf5b18c7b4e6a8fb4990c692751d49917417b8842ca5758e7ffc",
    "details": {
      "parent_model": "",
      "format": "gguf",
      "family": "gemma3",
      "families": [
        "gemma3"
      ],
      "parameter_size": "999.89M",
      "quantization_level": "Q4_K_M"
    }
  },
  "notes": null,
  "logHashSha256": "686a16dfa5f9805daf2179c826767958486b0fa299819350b2f09b33cd30f4b0",
  "runsCaptured": 5,
  "decodeStatsAllRuns": {
    "min": 156.4072759931633,
    "max": 162.17874987044706,
    "median": 160.08196196452582,
    "p5": 157.04777560526276,
    "p95": 161.89323392117637,
    "mean": 159.80578640117807,
    "n": 5
  },
  "decodeStatsSteadyRuns": {
    "min": 159.60977405366054,
    "max": 162.17874987044706,
    "median": 160.41656604430972,
    "p5": 159.68060224029034,
    "p95": 161.96461290849405,
    "mean": 160.65541400318176,
    "n": 4
  },
  "runs": [
    {
      "runIndex": 1,
      "startedAt": "2026-06-01T21:36:22.162Z",
      "finishedAt": "2026-06-01T21:36:27.704Z",
      "rawPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-01/gemma3-1b/run1.ollama.json",
      "logPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-01/gemma3-1b/run1.log",
      "decodeTokPerSec": 156.4072759931633,
      "prefillTokPerSec": 619.8212305082534,
      "totalMs": 5446.0612,
      "loadMs": 3466.5506,
      "promptEvalMs": 30.654,
      "evalMs": 1636.7525,
      "promptTokens": 19,
      "responseTokens": 256,
      "responseHashSha256": "061e3c2e6b8167ede2ef1c1bfa820333ece192407b83848a7d2eaa33bad70425",
      "beforeGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 1889,
        "tempC": 65,
        "smClockMhz": 495,
        "powerDrawW": 29.87
      },
      "afterGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 3005,
        "tempC": 69,
        "smClockMhz": 1770,
        "powerDrawW": 100.42
      }
    },
    {
      "runIndex": 2,
      "startedAt": "2026-06-01T21:36:27.776Z",
      "finishedAt": "2026-06-01T21:36:30.460Z",
      "rawPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-01/gemma3-1b/run2.ollama.json",
      "logPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-01/gemma3-1b/run2.log",
      "decodeTokPerSec": 159.60977405366054,
      "prefillTokPerSec": 2138.026489022922,
      "totalMs": 2599.8083,
      "loadMs": 797.2129,
      "promptEvalMs": 8.8867,
      "evalMs": 1603.9118,
      "promptTokens": 19,
      "responseTokens": 256,
      "responseHashSha256": "2e9817875a48ba45139b7f93502ad28f13e238840a506d1be7d5b8361b344d25",
      "beforeGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 3005,
        "tempC": 69,
        "smClockMhz": 1770,
        "powerDrawW": 95.75
      },
      "afterGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 3005,
        "tempC": 70,
        "smClockMhz": 1770,
        "powerDrawW": 99.56
      }
    },
    {
      "runIndex": 3,
      "startedAt": "2026-06-01T21:36:30.537Z",
      "finishedAt": "2026-06-01T21:36:33.200Z",
      "rawPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-01/gemma3-1b/run3.ollama.json",
      "logPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-01/gemma3-1b/run3.log",
      "decodeTokPerSec": 160.75117012409362,
      "prefillTokPerSec": 2137.7378233328454,
      "totalMs": 2548.7822,
      "loadMs": 745.6233,
      "promptEvalMs": 8.8879,
      "evalMs": 1592.5234,
      "promptTokens": 19,
      "responseTokens": 256,
      "responseHashSha256": "2e9817875a48ba45139b7f93502ad28f13e238840a506d1be7d5b8361b344d25",
      "beforeGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 3005,
        "tempC": 70,
        "smClockMhz": 1770,
        "powerDrawW": 99.56
      },
      "afterGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 3001,
        "tempC": 70,
        "smClockMhz": 1755,
        "powerDrawW": 100.41
      }
    },
    {
      "runIndex": 4,
      "startedAt": "2026-06-01T21:36:33.276Z",
      "finishedAt": "2026-06-01T21:36:35.957Z",
      "rawPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-01/gemma3-1b/run4.ollama.json",
      "logPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-01/gemma3-1b/run4.log",
      "decodeTokPerSec": 162.17874987044706,
      "prefillTokPerSec": 1909.3750314041945,
      "totalMs": 2585.6524,
      "loadMs": 764.0066,
      "promptEvalMs": 9.9509,
      "evalMs": 1578.5052,
      "promptTokens": 19,
      "responseTokens": 256,
      "responseHashSha256": "2e9817875a48ba45139b7f93502ad28f13e238840a506d1be7d5b8361b344d25",
      "beforeGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 3001,
        "tempC": 70,
        "smClockMhz": 1755,
        "powerDrawW": 95.44
      },
      "afterGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 3001,
        "tempC": 72,
        "smClockMhz": 1755,
        "powerDrawW": 98.7
      }
    },
    {
      "runIndex": 5,
      "startedAt": "2026-06-01T21:36:36.032Z",
      "finishedAt": "2026-06-01T21:36:38.742Z",
      "rawPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-01/gemma3-1b/run5.ollama.json",
      "logPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-01/gemma3-1b/run5.log",
      "decodeTokPerSec": 160.08196196452582,
      "prefillTokPerSec": 2176.7772240362033,
      "totalMs": 2629.2376,
      "loadMs": 807.6856,
      "promptEvalMs": 8.7285,
      "evalMs": 1599.1808,
      "promptTokens": 19,
      "responseTokens": 256,
      "responseHashSha256": "2e9817875a48ba45139b7f93502ad28f13e238840a506d1be7d5b8361b344d25",
      "beforeGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 3001,
        "tempC": 72,
        "smClockMhz": 1755,
        "powerDrawW": 98.7
      },
      "afterGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 3001,
        "tempC": 72,
        "smClockMhz": 1755,
        "powerDrawW": 102.92
      }
    }
  ],
  "errors": [],
  "uploadEligible": true
}