{
  "evidenceVersion": "local-ollama-speed-v1",
  "capturedAt": "2026-06-01T21:50:31.658Z",
  "hardwareSlug": "rtx-3080-16gb-mobile",
  "modelTag": "deepseek-r1:7b",
  "catalogSlug": "deepseek-r1-distill-qwen-7b",
  "quant": "Q4_K_M",
  "contextSize": 4096,
  "numPredict": 256,
  "prompt": "Write a detailed explanation of how transformer attention works.",
  "scenario": "single-stream",
  "runtime": "ollama-api",
  "command": "POST http://localhost:11434/api/generate model=deepseek-r1:7b temperature=0 top_p=1 seed=42 num_ctx=4096 num_predict=256",
  "env": {
    "os": "Microsoft Windows [Version 10.0.26200.8457]",
    "platform": "win32",
    "arch": "x64",
    "cpu": "AMD Ryzen 9 5900HX with Radeon Graphics        ",
    "cpuThreads": 16,
    "ramGb": 31.9,
    "gpu": {
      "vendor": "nvidia",
      "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
      "driver": "571.96",
      "memoryTotalMb": 16384,
      "memoryUsedMb": 1873,
      "tempC": 61,
      "smClockMhz": 210,
      "powerDrawW": 17.77
    },
    "ollamaVersionCli": "ollama version is 0.24.0",
    "ollamaApiVersion": {
      "version": "0.24.0"
    }
  },
  "ollamaTagDetails": {
    "name": "deepseek-r1:7b",
    "model": "deepseek-r1:7b",
    "modified_at": "2026-06-02T00:50:03.0280671+03:00",
    "size": 4683075440,
    "digest": "755ced02ce7befdb13b7ca74e1e4d08cddba4986afdb63a480f2c93d3140383f",
    "details": {
      "parent_model": "",
      "format": "gguf",
      "family": "qwen2",
      "families": [
        "qwen2"
      ],
      "parameter_size": "7.6B",
      "quantization_level": "Q4_K_M"
    }
  },
  "notes": null,
  "logHashSha256": "edf2129e7a124166b750c14a49300b2cc84f5a02ebaa9821b6efd5cf25caa6ac",
  "runsCaptured": 5,
  "decodeStatsAllRuns": {
    "min": 79.32732903953506,
    "max": 81.76871610051892,
    "median": 80.34115616635478,
    "p5": 79.42809813741619,
    "p95": 81.55575021836023,
    "mean": 80.394452505015,
    "n": 5
  },
  "decodeStatsSteadyRuns": {
    "min": 79.32732903953506,
    "max": 81.76871610051892,
    "median": 80.26753060933311,
    "p5": 79.40290586294591,
    "p95": 81.6089916888999,
    "mean": 80.40777658968005,
    "n": 4
  },
  "runs": [
    {
      "runIndex": 1,
      "startedAt": "2026-06-01T21:50:07.203Z",
      "finishedAt": "2026-06-01T21:50:14.420Z",
      "rawPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-01/deepseek-r1-7b/run1.ollama.json",
      "logPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-01/deepseek-r1-7b/run1.log",
      "decodeTokPerSec": 80.34115616635478,
      "prefillTokPerSec": 468.5832924824822,
      "totalMs": 7142.7146,
      "loadMs": 3302.3779,
      "promptEvalMs": 27.7432,
      "evalMs": 3186.4117,
      "promptTokens": 13,
      "responseTokens": 256,
      "responseHashSha256": "e3b0c44298fc1c149afbf4c8996fb92427ae41e4649b934ca495991b7852b855",
      "beforeGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 1873,
        "tempC": 61,
        "smClockMhz": 210,
        "powerDrawW": 17.77
      },
      "afterGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 6818,
        "tempC": 67,
        "smClockMhz": 1230,
        "powerDrawW": 111.29
      }
    },
    {
      "runIndex": 2,
      "startedAt": "2026-06-01T21:50:14.501Z",
      "finishedAt": "2026-06-01T21:50:18.717Z",
      "rawPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-01/deepseek-r1-7b/run2.ollama.json",
      "logPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-01/deepseek-r1-7b/run2.log",
      "decodeTokPerSec": 81.76871610051892,
      "prefillTokPerSec": 891.8403468572918,
      "totalMs": 4123.9006,
      "loadMs": 285.8791,
      "promptEvalMs": 14.5766,
      "evalMs": 3130.7817,
      "promptTokens": 13,
      "responseTokens": 256,
      "responseHashSha256": "e3b0c44298fc1c149afbf4c8996fb92427ae41e4649b934ca495991b7852b855",
      "beforeGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 6818,
        "tempC": 67,
        "smClockMhz": 1770,
        "powerDrawW": 111.29
      },
      "afterGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 6818,
        "tempC": 68,
        "smClockMhz": 1245,
        "powerDrawW": 110.35
      }
    },
    {
      "runIndex": 3,
      "startedAt": "2026-06-01T21:50:18.796Z",
      "finishedAt": "2026-06-01T21:50:23.032Z",
      "rawPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-01/deepseek-r1-7b/run3.ollama.json",
      "logPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-01/deepseek-r1-7b/run3.log",
      "decodeTokPerSec": 79.32732903953506,
      "prefillTokPerSec": 828.8120573027905,
      "totalMs": 4149.7936,
      "loadMs": 297.7214,
      "promptEvalMs": 15.6851,
      "evalMs": 3227.135,
      "promptTokens": 13,
      "responseTokens": 256,
      "responseHashSha256": "e3b0c44298fc1c149afbf4c8996fb92427ae41e4649b934ca495991b7852b855",
      "beforeGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 6818,
        "tempC": 67,
        "smClockMhz": 1245,
        "powerDrawW": 110.35
      },
      "afterGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 6818,
        "tempC": 69,
        "smClockMhz": 1215,
        "powerDrawW": 111.98
      }
    },
    {
      "runIndex": 4,
      "startedAt": "2026-06-01T21:50:23.109Z",
      "finishedAt": "2026-06-01T21:50:27.345Z",
      "rawPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-01/deepseek-r1-7b/run4.ollama.json",
      "logPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-01/deepseek-r1-7b/run4.log",
      "decodeTokPerSec": 79.83117452894072,
      "prefillTokPerSec": 889.3084600597889,
      "totalMs": 4147.0777,
      "loadMs": 285.3947,
      "promptEvalMs": 14.6181,
      "evalMs": 3206.7673,
      "promptTokens": 13,
      "responseTokens": 256,
      "responseHashSha256": "e3b0c44298fc1c149afbf4c8996fb92427ae41e4649b934ca495991b7852b855",
      "beforeGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 6818,
        "tempC": 69,
        "smClockMhz": 1215,
        "powerDrawW": 105.71
      },
      "afterGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 6818,
        "tempC": 71,
        "smClockMhz": 1245,
        "powerDrawW": 112.58
      }
    },
    {
      "runIndex": 5,
      "startedAt": "2026-06-01T21:50:27.422Z",
      "finishedAt": "2026-06-01T21:50:31.656Z",
      "rawPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-01/deepseek-r1-7b/run5.ollama.json",
      "logPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-01/deepseek-r1-7b/run5.log",
      "decodeTokPerSec": 80.7038866897255,
      "prefillTokPerSec": 894.0114983632712,
      "totalMs": 4149.6044,
      "loadMs": 273.343,
      "promptEvalMs": 14.5412,
      "evalMs": 3172.0901,
      "promptTokens": 13,
      "responseTokens": 256,
      "responseHashSha256": "e3b0c44298fc1c149afbf4c8996fb92427ae41e4649b934ca495991b7852b855",
      "beforeGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 6818,
        "tempC": 71,
        "smClockMhz": 1245,
        "powerDrawW": 106.23
      },
      "afterGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 6818,
        "tempC": 72,
        "smClockMhz": 1200,
        "powerDrawW": 113.6
      }
    }
  ],
  "errors": [],
  "uploadEligible": true
}