{
  "evidenceVersion": "local-ollama-speed-v1",
  "capturedAt": "2026-06-02T01:22:05.349Z",
  "hardwareSlug": "rtx-3080-16gb-mobile",
  "modelTag": "qwen3:14b",
  "catalogSlug": "qwen-3-14b",
  "quant": "Q4_K_M",
  "contextSize": 4096,
  "numPredict": 256,
  "prompt": "Write a detailed explanation of how transformer attention works.",
  "scenario": "single-stream",
  "runtime": "ollama-api",
  "command": "POST http://localhost:11434/api/generate model=qwen3:14b temperature=0 top_p=1 seed=42 num_ctx=4096 num_predict=256",
  "env": {
    "os": "Microsoft Windows [Version 10.0.26200.8457]",
    "platform": "win32",
    "arch": "x64",
    "cpu": "AMD Ryzen 9 5900HX with Radeon Graphics",
    "cpuThreads": 16,
    "ramGb": 31.9,
    "gpu": {
      "vendor": "nvidia",
      "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
      "driver": "571.96",
      "memoryTotalMb": 16384,
      "memoryUsedMb": 1798,
      "tempC": 54,
      "smClockMhz": 420,
      "powerDrawW": 19.49
    },
    "ollamaVersionCli": "ollama version is 0.24.0",
    "ollamaApiVersion": {
      "version": "0.24.0"
    }
  },
  "ollamaTagDetails": {
    "name": "qwen3:14b",
    "model": "qwen3:14b",
    "modified_at": "2026-06-02T04:21:17.9455981+03:00",
    "size": 9276198565,
    "digest": "bdbd181c33f2ed1b31c972991882db3cf4d192569092138a7d29e973cd9debe8",
    "details": {
      "parent_model": "",
      "format": "gguf",
      "family": "qwen3",
      "families": [
        "qwen3"
      ],
      "parameter_size": "14.8B",
      "quantization_level": "Q4_K_M"
    }
  },
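  "notes": "responseHashSha256 is identical for all 5 runs and equals the SHA-256 digest of the empty string, although responseTokens is 256 per run. This suggests the hashed response text was empty (possibly because the generated tokens were emitted outside the response field); verify against the raw run files before relying on the hash as an output-determinism check.",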
  "logHashSha256": "5fbefd9f5b3006ae0a7ea616e35480fdec8723bfe9e37a6f5e0bd5743f13a274",
  "runsCaptured": 5,
  "decodeStatsAllRuns": {
    "min": 38.14841482830673,
    "max": 38.79836904387254,
    "median": 38.28482145462252,
    "p5": 38.16574798799193,
    "p95": 38.73301632870511,
    "mean": 38.38765828431398,
    "n": 5
  },
  "decodeStatsSteadyRuns": {
    "min": 38.14841482830673,
    "max": 38.471605468035406,
    "median": 38.25995104067762,
    "p5": 38.16141469807062,
    "p95": 38.44358786602347,
    "mean": 38.28498059442434,
    "n": 4
  },
  "runs": [
    {
      "runIndex": 1,
      "startedAt": "2026-06-02T01:21:23.207Z",
      "finishedAt": "2026-06-02T01:21:36.020Z",
      "rawPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-02/qwen3-14b/run1.ollama.json",
      "logPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-02/qwen3-14b/run1.log",
      "decodeTokPerSec": 38.79836904387254,
      "prefillTokPerSec": 258.63919573555694,
      "totalMs": 12705.8214,
      "loadMs": 5811.4636,
      "promptEvalMs": 77.3278,
      "evalMs": 6598.2155,
      "promptTokens": 20,
      "responseTokens": 256,
      "responseHashSha256": "e3b0c44298fc1c149afbf4c8996fb92427ae41e4649b934ca495991b7852b855",
      "beforeGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 1798,
        "tempC": 54,
        "smClockMhz": 420,
        "powerDrawW": 14.68
      },
      "afterGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 11289,
        "tempC": 61,
        "smClockMhz": 1110,
        "powerDrawW": 114.42
      }
    },
    {
      "runIndex": 2,
      "startedAt": "2026-06-02T01:21:36.097Z",
      "finishedAt": "2026-06-02T01:21:43.358Z",
      "rawPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-02/qwen3-14b/run2.ollama.json",
      "logPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-02/qwen3-14b/run2.log",
      "decodeTokPerSec": 38.471605468035406,
      "prefillTokPerSec": 706.1997274069051,
      "totalMs": 7147.8916,
      "loadMs": 304.1624,
      "promptEvalMs": 28.3206,
      "evalMs": 6654.2583,
      "promptTokens": 20,
      "responseTokens": 256,
      "responseHashSha256": "e3b0c44298fc1c149afbf4c8996fb92427ae41e4649b934ca495991b7852b855",
      "beforeGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 11289,
        "tempC": 60,
        "smClockMhz": 1110,
        "powerDrawW": 108.32
      },
      "afterGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 11289,
        "tempC": 63,
        "smClockMhz": 1140,
        "powerDrawW": 111.27
      }
    },
    {
      "runIndex": 3,
      "startedAt": "2026-06-02T01:21:43.454Z",
      "finishedAt": "2026-06-02T01:21:50.693Z",
      "rawPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-02/qwen3-14b/run3.ollama.json",
      "logPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-02/qwen3-14b/run3.log",
      "decodeTokPerSec": 38.28482145462252,
      "prefillTokPerSec": 705.6167090036691,
      "totalMs": 7152.0829,
      "loadMs": 279.7678,
      "promptEvalMs": 28.344,
      "evalMs": 6686.7231,
      "promptTokens": 20,
      "responseTokens": 256,
      "responseHashSha256": "e3b0c44298fc1c149afbf4c8996fb92427ae41e4649b934ca495991b7852b855",
      "beforeGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 11289,
        "tempC": 63,
        "smClockMhz": 1140,
        "powerDrawW": 104.49
      },
      "afterGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 11289,
        "tempC": 65,
        "smClockMhz": 1155,
        "powerDrawW": 114.67
      }
    },
    {
      "runIndex": 4,
      "startedAt": "2026-06-02T01:21:50.765Z",
      "finishedAt": "2026-06-02T01:21:58.019Z",
      "rawPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-02/qwen3-14b/run4.ollama.json",
      "logPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-02/qwen3-14b/run4.log",
      "decodeTokPerSec": 38.14841482830673,
      "prefillTokPerSec": 711.4197091716229,
      "totalMs": 7162.9409,
      "loadMs": 283.8441,
      "promptEvalMs": 28.1128,
      "evalMs": 6710.6327,
      "promptTokens": 20,
      "responseTokens": 256,
      "responseHashSha256": "e3b0c44298fc1c149afbf4c8996fb92427ae41e4649b934ca495991b7852b855",
      "beforeGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 11289,
        "tempC": 65,
        "smClockMhz": 1770,
        "powerDrawW": 108.69
      },
      "afterGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 11289,
        "tempC": 67,
        "smClockMhz": 1065,
        "powerDrawW": 114.44
      }
    },
    {
      "runIndex": 5,
      "startedAt": "2026-06-02T01:21:58.110Z",
      "finishedAt": "2026-06-02T01:22:05.348Z",
      "rawPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-02/qwen3-14b/run5.ollama.json",
      "logPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-02/qwen3-14b/run5.log",
      "decodeTokPerSec": 38.23508062673272,
      "prefillTokPerSec": 709.8315214883747,
      "totalMs": 7147.9903,
      "loadMs": 251.4656,
      "promptEvalMs": 28.1757,
      "evalMs": 6695.422,
      "promptTokens": 20,
      "responseTokens": 256,
      "responseHashSha256": "e3b0c44298fc1c149afbf4c8996fb92427ae41e4649b934ca495991b7852b855",
      "beforeGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 11289,
        "tempC": 66,
        "smClockMhz": 1065,
        "powerDrawW": 110.33
      },
      "afterGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 11289,
        "tempC": 69,
        "smClockMhz": 1125,
        "powerDrawW": 112.55
      }
    }
  ],
  "errors": [],
  "uploadEligible": true
}