{
  "evidenceVersion": "local-ollama-speed-v1",
  "capturedAt": "2026-06-01T23:58:54.524Z",
  "hardwareSlug": "rtx-3080-16gb-mobile",
  "modelTag": "llama3.2-vision:11b",
  "catalogSlug": "llama-3.2-11b-vision-instruct",
  "quant": "Q4_K_M",
  "contextSize": 4096,
  "numPredict": 256,
  "prompt": "Write a detailed explanation of how transformer attention works.",
  "scenario": "single-stream",
  "runtime": "ollama-api",
  "command": "POST http://localhost:11434/api/generate model=llama3.2-vision:11b temperature=0 top_p=1 seed=42 num_ctx=4096 num_predict=256",
  "env": {
    "os": "Microsoft Windows [Version 10.0.26200.8457]",
    "platform": "win32",
    "arch": "x64",
    "cpu": "AMD Ryzen 9 5900HX with Radeon Graphics        ",
    "cpuThreads": 16,
    "ramGb": 31.9,
    "gpu": {
      "vendor": "nvidia",
      "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
      "driver": "571.96",
      "memoryTotalMb": 16384,
      "memoryUsedMb": 1859,
      "tempC": 53,
      "smClockMhz": 210,
      "powerDrawW": 11.68
    },
    "ollamaVersionCli": "ollama version is 0.24.0",
    "ollamaApiVersion": {
      "version": "0.24.0"
    }
  },
  "ollamaTagDetails": {
    "name": "llama3.2-vision:11b",
    "model": "llama3.2-vision:11b",
    "modified_at": "2026-06-02T02:58:21.3317937+03:00",
    "size": 7816589186,
    "digest": "6f2f9757ae97e8a3f8ea33d6adb2b11d93d9a35bef277cd2c0b1b5af8e8d0b1e",
    "details": {
      "parent_model": "",
      "format": "gguf",
      "family": "mllama",
      "families": [
        "mllama"
      ],
      "parameter_size": "10.7B",
      "quantization_level": "Q4_K_M"
    }
  },
  "notes": null,
  "logHashSha256": "11ac2c921fad5de0229df8ce26154a4431aa56ed8c5804a22b525cd4b087141d",
  "runsCaptured": 5,
  "decodeStatsAllRuns": {
    "min": 66.99679862602129,
    "max": 67.2148898624954,
    "median": 67.01161243184775,
    "p5": 66.99730922043142,
    "p95": 67.19415007442888,
    "mean": 67.06676868811985,
    "n": 5
  },
  "decodeStatsSteadyRuns": {
    "min": 66.99679862602129,
    "max": 67.11119092216282,
    "median": 67.00548201495985,
    "p5": 66.99718157182889,
    "p95": 67.09625414861556,
    "mean": 67.02973839452596,
    "n": 4
  },
  "runs": [
    {
      "runIndex": 1,
      "startedAt": "2026-06-01T23:58:25.693Z",
      "finishedAt": "2026-06-01T23:58:36.336Z",
      "rawPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-01/llama3-2-vision-11b/run1.ollama.json",
      "logPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-01/llama3-2-vision-11b/run1.log",
      "decodeTokPerSec": 67.2148898624954,
      "prefillTokPerSec": 92.26696036696998,
      "totalMs": 10505.1345,
      "loadMs": 6304.6103,
      "promptEvalMs": 205.9242,
      "evalMs": 3808.6799,
      "promptTokens": 19,
      "responseTokens": 256,
      "responseHashSha256": "84c2cd8080cd446a30b208663725a948def923e6eed42ffa57c86708d849c643",
      "beforeGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 1859,
        "tempC": 53,
        "smClockMhz": 210,
        "powerDrawW": 11.64
      },
      "afterGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 13148,
        "tempC": 60,
        "smClockMhz": 1245,
        "powerDrawW": 113.96
      }
    },
    {
      "runIndex": 2,
      "startedAt": "2026-06-01T23:58:36.410Z",
      "finishedAt": "2026-06-01T23:58:40.883Z",
      "rawPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-01/llama3-2-vision-11b/run2.ollama.json",
      "logPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-01/llama3-2-vision-11b/run2.log",
      "decodeTokPerSec": 67.11119092216282,
      "prefillTokPerSec": 1027.3546698676876,
      "totalMs": 4376.7393,
      "loadMs": 402.1887,
      "promptEvalMs": 18.4941,
      "evalMs": 3814.565,
      "promptTokens": 19,
      "responseTokens": 256,
      "responseHashSha256": "ebcdf5ce4841c4cff333865f929415e9182e9ac319c031fd0601c79ba548e117",
      "beforeGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 13148,
        "tempC": 60,
        "smClockMhz": 1245,
        "powerDrawW": 107.06
      },
      "afterGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 13148,
        "tempC": 61,
        "smClockMhz": 1320,
        "powerDrawW": 113.43
      }
    },
    {
      "runIndex": 3,
      "startedAt": "2026-06-01T23:58:40.970Z",
      "finishedAt": "2026-06-01T23:58:45.459Z",
      "rawPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-01/llama3-2-vision-11b/run3.ollama.json",
      "logPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-01/llama3-2-vision-11b/run3.log",
      "decodeTokPerSec": 67.01161243184775,
      "prefillTokPerSec": 1067.8056593699946,
      "totalMs": 4380.4932,
      "loadMs": 398.3986,
      "promptEvalMs": 17.7935,
      "evalMs": 3820.2334,
      "promptTokens": 19,
      "responseTokens": 256,
      "responseHashSha256": "ebcdf5ce4841c4cff333865f929415e9182e9ac319c031fd0601c79ba548e117",
      "beforeGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 13148,
        "tempC": 60,
        "smClockMhz": 1320,
        "powerDrawW": 106.58
      },
      "afterGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 13148,
        "tempC": 61,
        "smClockMhz": 1305,
        "powerDrawW": 111.06
      }
    },
    {
      "runIndex": 4,
      "startedAt": "2026-06-01T23:58:45.536Z",
      "finishedAt": "2026-06-01T23:58:49.990Z",
      "rawPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-01/llama3-2-vision-11b/run4.ollama.json",
      "logPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-01/llama3-2-vision-11b/run4.log",
      "decodeTokPerSec": 66.99935159807194,
      "prefillTokPerSec": 1077.1341428846786,
      "totalMs": 4372.7223,
      "loadMs": 387.8882,
      "promptEvalMs": 17.6394,
      "evalMs": 3820.9325,
      "promptTokens": 19,
      "responseTokens": 256,
      "responseHashSha256": "ebcdf5ce4841c4cff333865f929415e9182e9ac319c031fd0601c79ba548e117",
      "beforeGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 13148,
        "tempC": 61,
        "smClockMhz": 1305,
        "powerDrawW": 104.11
      },
      "afterGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 13148,
        "tempC": 64,
        "smClockMhz": 1230,
        "powerDrawW": 114.6
      }
    },
    {
      "runIndex": 5,
      "startedAt": "2026-06-01T23:58:50.070Z",
      "finishedAt": "2026-06-01T23:58:54.522Z",
      "rawPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-01/llama3-2-vision-11b/run5.ollama.json",
      "logPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-01/llama3-2-vision-11b/run5.log",
      "decodeTokPerSec": 66.99679862602129,
      "prefillTokPerSec": 1051.8041208578293,
      "totalMs": 4366.4528,
      "loadMs": 383.4172,
      "promptEvalMs": 18.0642,
      "evalMs": 3821.0781,
      "promptTokens": 19,
      "responseTokens": 256,
      "responseHashSha256": "ebcdf5ce4841c4cff333865f929415e9182e9ac319c031fd0601c79ba548e117",
      "beforeGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 13148,
        "tempC": 64,
        "smClockMhz": 1230,
        "powerDrawW": 108.3
      },
      "afterGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 13148,
        "tempC": 65,
        "smClockMhz": 1305,
        "powerDrawW": 114.53
      }
    }
  ],
  "errors": [],
  "uploadEligible": true
}