{
  "evidenceVersion": "local-ollama-speed-v1",
  "capturedAt": "2026-06-02T01:31:47.974Z",
  "hardwareSlug": "rtx-3080-16gb-mobile",
  "modelTag": "deepseek-coder-v2:16b",
  "catalogSlug": "deepseek-coder-v2-lite",
  "quant": "Q4_0",
  "contextSize": 4096,
  "numPredict": 256,
  "prompt": "Write a detailed explanation of how transformer attention works.",
  "scenario": "single-stream",
  "runtime": "ollama-api",
  "command": "POST http://localhost:11434/api/generate model=deepseek-coder-v2:16b temperature=0 top_p=1 seed=42 num_ctx=4096 num_predict=256",
  "env": {
    "os": "Microsoft Windows [Version 10.0.26200.8457]",
    "platform": "win32",
    "arch": "x64",
    "cpu": "AMD Ryzen 9 5900HX with Radeon Graphics        ",
    "cpuThreads": 16,
    "ramGb": 31.9,
    "gpu": {
      "vendor": "nvidia",
      "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
      "driver": "571.96",
      "memoryTotalMb": 16384,
      "memoryUsedMb": 1798,
      "tempC": 57,
      "smClockMhz": 420,
      "powerDrawW": 20.34
    },
    "ollamaVersionCli": "ollama version is 0.24.0",
    "ollamaApiVersion": {
      "version": "0.24.0"
    }
  },
  "ollamaTagDetails": {
    "name": "deepseek-coder-v2:16b",
    "model": "deepseek-coder-v2:16b",
    "modified_at": "2026-06-02T04:31:26.5558339+03:00",
    "size": 8905126121,
    "digest": "63fb193b3a9b4322a18e8c6b250ca2e70a5ff531e962dbf95ba089b2566f2fa5",
    "details": {
      "parent_model": "",
      "format": "gguf",
      "family": "deepseek2",
      "families": [
        "deepseek2"
      ],
      "parameter_size": "15.7B",
      "quantization_level": "Q4_0"
    }
  },
  "notes": null,
  "logHashSha256": "c00ed800cd1ccfe6362c7f119ba4fea42763a45ab89e497f9699febc08e560d0",
  "runsCaptured": 5,
  "decodeStatsAllRuns": {
    "min": 149.63257604052797,
    "max": 152.72729789256613,
    "median": 151.6908672854232,
    "p5": 149.95260621319892,
    "p95": 152.6564597100346,
    "mean": 151.53131502046168,
    "n": 5
  },
  "decodeStatsSteadyRuns": {
    "min": 149.63257604052797,
    "max": 152.72729789256613,
    "median": 152.03198713266585,
    "p5": 149.94131972726225,
    "p95": 152.67416925566746,
    "mean": 151.60596204960643,
    "n": 4
  },
  "runs": [
    {
      "runIndex": 1,
      "startedAt": "2026-06-02T01:31:31.301Z",
      "finishedAt": "2026-06-02T01:31:38.131Z",
      "rawPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-02/deepseek-coder-v2-16b/run1.ollama.json",
      "logPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-02/deepseek-coder-v2-16b/run1.log",
      "decodeTokPerSec": 151.23272690388268,
      "prefillTokPerSec": 266.9007485083214,
      "totalMs": 6737.0783,
      "loadMs": 4589.1177,
      "promptEvalMs": 67.4408,
      "evalMs": 1692.7553,
      "promptTokens": 18,
      "responseTokens": 256,
      "responseHashSha256": "fffa8f3d334ef684e41bc0cf4ece79fad13b6bea679d9db9ea6f75a2c44fb121",
      "beforeGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 1798,
        "tempC": 57,
        "smClockMhz": 420,
        "powerDrawW": 16.57
      },
      "afterGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 11761,
        "tempC": 63,
        "smClockMhz": 1620,
        "powerDrawW": 110.59
      }
    },
    {
      "runIndex": 2,
      "startedAt": "2026-06-02T01:31:38.208Z",
      "finishedAt": "2026-06-02T01:31:40.582Z",
      "rawPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-02/deepseek-coder-v2-16b/run2.ollama.json",
      "logPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-02/deepseek-coder-v2-16b/run2.log",
      "decodeTokPerSec": 149.63257604052797,
      "prefillTokPerSec": 1556.0704035409246,
      "totalMs": 2289.6945,
      "loadMs": 185.6832,
      "promptEvalMs": 11.5676,
      "evalMs": 1710.8574,
      "promptTokens": 18,
      "responseTokens": 256,
      "responseHashSha256": "862271f9476a54f38957c8ff2c37d0218bfc6a24b0e75fdd63245f7d6f8dd259",
      "beforeGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 11761,
        "tempC": 61,
        "smClockMhz": 1620,
        "powerDrawW": 103.94
      },
      "afterGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 11761,
        "tempC": 64,
        "smClockMhz": 1740,
        "powerDrawW": 114.48
      }
    },
    {
      "runIndex": 3,
      "startedAt": "2026-06-02T01:31:40.658Z",
      "finishedAt": "2026-06-02T01:31:43.053Z",
      "rawPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-02/deepseek-coder-v2-16b/run3.ollama.json",
      "logPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-02/deepseek-coder-v2-16b/run3.log",
      "decodeTokPerSec": 152.37310697990847,
      "prefillTokPerSec": 1545.595054095827,
      "totalMs": 2293.9322,
      "loadMs": 204.6297,
      "promptEvalMs": 11.646,
      "evalMs": 1680.0865,
      "promptTokens": 18,
      "responseTokens": 256,
      "responseHashSha256": "862271f9476a54f38957c8ff2c37d0218bfc6a24b0e75fdd63245f7d6f8dd259",
      "beforeGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 11761,
        "tempC": 64,
        "smClockMhz": 1740,
        "powerDrawW": 108.75
      },
      "afterGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 11761,
        "tempC": 65,
        "smClockMhz": 1590,
        "powerDrawW": 112.26
      }
    },
    {
      "runIndex": 4,
      "startedAt": "2026-06-02T01:31:43.128Z",
      "finishedAt": "2026-06-02T01:31:45.519Z",
      "rawPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-02/deepseek-coder-v2-16b/run4.ollama.json",
      "logPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-02/deepseek-coder-v2-16b/run4.log",
      "decodeTokPerSec": 152.72729789256613,
      "prefillTokPerSec": 1523.6805349811657,
      "totalMs": 2301.8085,
      "loadMs": 203.9763,
      "promptEvalMs": 11.8135,
      "evalMs": 1676.1902,
      "promptTokens": 18,
      "responseTokens": 256,
      "responseHashSha256": "862271f9476a54f38957c8ff2c37d0218bfc6a24b0e75fdd63245f7d6f8dd259",
      "beforeGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 11761,
        "tempC": 65,
        "smClockMhz": 1590,
        "powerDrawW": 105.43
      },
      "afterGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 11761,
        "tempC": 65,
        "smClockMhz": 1575,
        "powerDrawW": 111.03
      }
    },
    {
      "runIndex": 5,
      "startedAt": "2026-06-02T01:31:45.597Z",
      "finishedAt": "2026-06-02T01:31:47.972Z",
      "rawPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-02/deepseek-coder-v2-16b/run5.ollama.json",
      "logPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-02/deepseek-coder-v2-16b/run5.log",
      "decodeTokPerSec": 151.6908672854232,
      "prefillTokPerSec": 1579.6956453056712,
      "totalMs": 2289.1281,
      "loadMs": 194.3083,
      "promptEvalMs": 11.3946,
      "evalMs": 1687.6428,
      "promptTokens": 18,
      "responseTokens": 256,
      "responseHashSha256": "862271f9476a54f38957c8ff2c37d0218bfc6a24b0e75fdd63245f7d6f8dd259",
      "beforeGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 11761,
        "tempC": 65,
        "smClockMhz": 1575,
        "powerDrawW": 111.03
      },
      "afterGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 11761,
        "tempC": 66,
        "smClockMhz": 1560,
        "powerDrawW": 114.42
      }
    }
  ],
  "errors": [],
  "uploadEligible": true
}