{
  "evidenceVersion": "local-ollama-speed-v1",
  "capturedAt": "2026-06-01T22:06:51.356Z",
  "hardwareSlug": "rtx-3080-16gb-mobile",
  "modelTag": "koezgen/malhajar-mistral-tur7b:latest",
  "catalogSlug": "mistral-7b-turkish",
  "quant": "Q4_K_M",
  "contextSize": 4096,
  "numPredict": 256,
  "prompt": "Write a detailed explanation of how transformer attention works.",
  "scenario": "single-stream",
  "runtime": "ollama-api",
  "command": "POST http://localhost:11434/api/generate model=koezgen/malhajar-mistral-tur7b:latest temperature=0 top_p=1 seed=42 num_ctx=4096 num_predict=256",
  "env": {
    "os": "Microsoft Windows [Version 10.0.26200.8457]",
    "platform": "win32",
    "arch": "x64",
    "cpu": "AMD Ryzen 9 5900HX with Radeon Graphics        ",
    "cpuThreads": 16,
    "ramGb": 31.9,
    "gpu": {
      "vendor": "nvidia",
      "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
      "driver": "571.96",
      "memoryTotalMb": 16384,
      "memoryUsedMb": 1881,
      "tempC": 58,
      "smClockMhz": 210,
      "powerDrawW": 17.19
    },
    "ollamaVersionCli": "ollama version is 0.24.0",
    "ollamaApiVersion": {
      "version": "0.24.0"
    }
  },
  "ollamaTagDetails": {
    "name": "koezgen/malhajar-mistral-tur7b:latest",
    "model": "koezgen/malhajar-mistral-tur7b:latest",
    "modified_at": "2026-06-02T01:06:20.6141546+03:00",
    "size": 5131410854,
    "digest": "45c41d844f56b1359a75a03748dee3fc4897398946d31e28d0c4372381193caa",
    "details": {
      "parent_model": "",
      "format": "gguf",
      "family": "llama",
      "families": [
        "llama"
      ],
      "parameter_size": "7.2B",
      "quantization_level": "Q5_K_M"
    }
  },
  "notes": null,
  "logHashSha256": "c1e1f2596f203477d7b29c2a2ac0a78accc62cb736acab90a862a143605f6efc",
  "runsCaptured": 5,
  "decodeStatsAllRuns": {
    "min": 81.9681526831026,
    "max": 89.92529982622989,
    "median": 86.70103933886935,
    "p5": 82.17788955584894,
    "p95": 89.50937319965661,
    "mean": 85.89139911767992,
    "n": 5
  },
  "decodeStatsSteadyRuns": {
    "min": 81.9681526831026,
    "max": 89.92529982622989,
    "median": 87.27335301611643,
    "p5": 82.67808568146762,
    "p95": 89.61335485629994,
    "mean": 86.61003963539133,
    "n": 4
  },
  "runs": [
    {
      "runIndex": 1,
      "startedAt": "2026-06-01T22:06:26.353Z",
      "finishedAt": "2026-06-01T22:06:34.618Z",
      "rawPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-01/koezgen-malhajar-mistral-tur7b-latest/run1.ollama.json",
      "logPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-01/koezgen-malhajar-mistral-tur7b-latest/run1.log",
      "decodeTokPerSec": 83.01683704683427,
      "prefillTokPerSec": 1747.998426801416,
      "totalMs": 8175.9482,
      "loadMs": 4210.0343,
      "promptEvalMs": 43.4783,
      "evalMs": 3083.7118,
      "promptTokens": 76,
      "responseTokens": 256,
      "responseHashSha256": "21ca1499c2b997338c9f0fb403ed5d520348b297e780331d5425657c931a3bd4",
      "beforeGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 1881,
        "tempC": 58,
        "smClockMhz": 210,
        "powerDrawW": 17.13
      },
      "afterGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 7572,
        "tempC": 64,
        "smClockMhz": 1740,
        "powerDrawW": 110.31
      }
    },
    {
      "runIndex": 2,
      "startedAt": "2026-06-01T22:06:34.695Z",
      "finishedAt": "2026-06-01T22:06:38.793Z",
      "rawPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-01/koezgen-malhajar-mistral-tur7b-latest/run2.ollama.json",
      "logPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-01/koezgen-malhajar-mistral-tur7b-latest/run2.log",
      "decodeTokPerSec": 81.9681526831026,
      "prefillTokPerSec": 4876.483798524222,
      "totalMs": 3999.8207,
      "loadMs": 56.3054,
      "promptEvalMs": 15.585,
      "evalMs": 3123.1642,
      "promptTokens": 76,
      "responseTokens": 256,
      "responseHashSha256": "66a41e9f7d92e045be594fb3360f76005ad49b1fea05ca06e4c67ec8e0127dcc",
      "beforeGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 7572,
        "tempC": 64,
        "smClockMhz": 1740,
        "powerDrawW": 110.31
      },
      "afterGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 7572,
        "tempC": 66,
        "smClockMhz": 1155,
        "powerDrawW": 114.47
      }
    },
    {
      "runIndex": 3,
      "startedAt": "2026-06-01T22:06:38.866Z",
      "finishedAt": "2026-06-01T22:06:42.963Z",
      "rawPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-01/koezgen-malhajar-mistral-tur7b-latest/run3.ollama.json",
      "logPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-01/koezgen-malhajar-mistral-tur7b-latest/run3.log",
      "decodeTokPerSec": 86.70103933886935,
      "prefillTokPerSec": 4493.983384087751,
      "totalMs": 4013.7825,
      "loadMs": 59.8711,
      "promptEvalMs": 16.9115,
      "evalMs": 2952.6751,
      "promptTokens": 76,
      "responseTokens": 256,
      "responseHashSha256": "66a41e9f7d92e045be594fb3360f76005ad49b1fea05ca06e4c67ec8e0127dcc",
      "beforeGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 7572,
        "tempC": 66,
        "smClockMhz": 1155,
        "powerDrawW": 108.25
      },
      "afterGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 7572,
        "tempC": 67,
        "smClockMhz": 1110,
        "powerDrawW": 113.91
      }
    },
    {
      "runIndex": 4,
      "startedAt": "2026-06-01T22:06:43.038Z",
      "finishedAt": "2026-06-01T22:06:47.152Z",
      "rawPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-01/koezgen-malhajar-mistral-tur7b-latest/run4.ollama.json",
      "logPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-01/koezgen-malhajar-mistral-tur7b-latest/run4.log",
      "decodeTokPerSec": 87.84566669336351,
      "prefillTokPerSec": 4945.534052604865,
      "totalMs": 4020.1916,
      "loadMs": 53.9704,
      "promptEvalMs": 15.3674,
      "evalMs": 2914.2018,
      "promptTokens": 76,
      "responseTokens": 256,
      "responseHashSha256": "66a41e9f7d92e045be594fb3360f76005ad49b1fea05ca06e4c67ec8e0127dcc",
      "beforeGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 7572,
        "tempC": 67,
        "smClockMhz": 1110,
        "powerDrawW": 107.33
      },
      "afterGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 7572,
        "tempC": 68,
        "smClockMhz": 1560,
        "powerDrawW": 112.48
      }
    },
    {
      "runIndex": 5,
      "startedAt": "2026-06-01T22:06:47.226Z",
      "finishedAt": "2026-06-01T22:06:51.355Z",
      "rawPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-01/koezgen-malhajar-mistral-tur7b-latest/run5.ollama.json",
      "logPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-01/koezgen-malhajar-mistral-tur7b-latest/run5.log",
      "decodeTokPerSec": 89.92529982622989,
      "prefillTokPerSec": 5108.522494303325,
      "totalMs": 4039.8778,
      "loadMs": 66.3774,
      "promptEvalMs": 14.8771,
      "evalMs": 2846.8073,
      "promptTokens": 76,
      "responseTokens": 256,
      "responseHashSha256": "66a41e9f7d92e045be594fb3360f76005ad49b1fea05ca06e4c67ec8e0127dcc",
      "beforeGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 7572,
        "tempC": 68,
        "smClockMhz": 1560,
        "powerDrawW": 106.11
      },
      "afterGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 7572,
        "tempC": 69,
        "smClockMhz": 1080,
        "powerDrawW": 113.27
      }
    }
  ],
  "errors": [],
  "uploadEligible": true
}