{
  "evidenceVersion": "local-ollama-speed-v1",
  "capturedAt": "2026-06-01T23:35:23.957Z",
  "hardwareSlug": "rtx-3080-16gb-mobile",
  "modelTag": "alibayram/turkish-gemma-9b-v0.1:latest",
  "catalogSlug": "ytu-turkish-gemma-9b",
  "quant": "Q4_K_M",
  "contextSize": 4096,
  "numPredict": 256,
  "prompt": "Write a detailed explanation of how transformer attention works.",
  "scenario": "single-stream",
  "runtime": "ollama-api",
  "command": "POST http://localhost:11434/api/generate model=alibayram/turkish-gemma-9b-v0.1:latest temperature=0 top_p=1 seed=42 num_ctx=4096 num_predict=256",
  "env": {
    "os": "Microsoft Windows [Version 10.0.26200.8457]",
    "platform": "win32",
    "arch": "x64",
    "cpu": "AMD Ryzen 9 5900HX with Radeon Graphics        ",
    "cpuThreads": 16,
    "ramGb": 31.9,
    "gpu": {
      "vendor": "nvidia",
      "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
      "driver": "571.96",
      "memoryTotalMb": 16384,
      "memoryUsedMb": 1869,
      "tempC": 54,
      "smClockMhz": 210,
      "powerDrawW": 11.85
    },
    "ollamaVersionCli": "ollama version is 0.24.0",
    "ollamaApiVersion": {
      "version": "0.24.0"
    }
  },
  "ollamaTagDetails": {
    "name": "alibayram/turkish-gemma-9b-v0.1:latest",
    "model": "alibayram/turkish-gemma-9b-v0.1:latest",
    "modified_at": "2026-06-02T02:34:46.5331358+03:00",
    "size": 5761058919,
    "digest": "c51ed67b59a4b44b3dacc0b1a192f35084d677df50694780a9a415c80c13d51b",
    "details": {
      "parent_model": "",
      "format": "gguf",
      "family": "gemma2",
      "families": [
        "gemma2"
      ],
      "parameter_size": "9.2B",
      "quantization_level": "Q4_K_M"
    }
  },
  "notes": null,
  "logHashSha256": "8ac298362c2b588acc5385742377f19b79107e4559c29da03465a044c5ffbe63",
  "runsCaptured": 5,
  "decodeStatsAllRuns": {
    "min": 65.64050724932736,
    "max": 66.91350780891091,
    "median": 66.22710324021536,
    "p5": 65.66584799876675,
    "p95": 66.85336426777963,
    "mean": 66.2322238796465,
    "n": 5
  },
  "decodeStatsSteadyRuns": {
    "min": 65.64050724932736,
    "max": 66.91350780891091,
    "median": 65.99715711836984,
    "p5": 65.6595128114069,
    "p95": 66.81054712360657,
    "mean": 66.1370823237445,
    "n": 4
  },
  "runs": [
    {
      "runIndex": 1,
      "startedAt": "2026-06-01T23:34:50.791Z",
      "finishedAt": "2026-06-01T23:35:00.918Z",
      "rawPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-01/alibayram-turkish-gemma-9b-v0-1-latest/run1.ollama.json",
      "logPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-01/alibayram-turkish-gemma-9b-v0-1-latest/run1.log",
      "decodeTokPerSec": 66.61279010325451,
      "prefillTokPerSec": 354.22780203513196,
      "totalMs": 10030.0612,
      "loadMs": 4764.1451,
      "promptEvalMs": 53.6378,
      "evalMs": 3843.1058,
      "promptTokens": 19,
      "responseTokens": 256,
      "responseHashSha256": "e0676d087f2447dbff667cedc5d52422b012456d07be92e779a5b93c75001830",
      "beforeGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 1869,
        "tempC": 54,
        "smClockMhz": 210,
        "powerDrawW": 11.85
      },
      "afterGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 9456,
        "tempC": 61,
        "smClockMhz": 1350,
        "powerDrawW": 112.02
      }
    },
    {
      "runIndex": 2,
      "startedAt": "2026-06-01T23:35:00.993Z",
      "finishedAt": "2026-06-01T23:35:06.666Z",
      "rawPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-01/alibayram-turkish-gemma-9b-v0-1-latest/run2.ollama.json",
      "logPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-01/alibayram-turkish-gemma-9b-v0-1-latest/run2.log",
      "decodeTokPerSec": 66.22710324021536,
      "prefillTokPerSec": 1134.1929321872014,
      "totalMs": 5572.388,
      "loadMs": 357.5314,
      "promptEvalMs": 16.752,
      "evalMs": 3865.4869,
      "promptTokens": 19,
      "responseTokens": 256,
      "responseHashSha256": "3ed6adf61a1e81dfadab5b65c2fbcf32ac869f6104c44c1a34b5b25fcb134bd6",
      "beforeGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 9456,
        "tempC": 61,
        "smClockMhz": 1350,
        "powerDrawW": 104.86
      },
      "afterGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 9456,
        "tempC": 63,
        "smClockMhz": 1350,
        "powerDrawW": 114.54
      }
    },
    {
      "runIndex": 3,
      "startedAt": "2026-06-01T23:35:06.745Z",
      "finishedAt": "2026-06-01T23:35:12.418Z",
      "rawPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-01/alibayram-turkish-gemma-9b-v0-1-latest/run3.ollama.json",
      "logPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-01/alibayram-turkish-gemma-9b-v0-1-latest/run3.log",
      "decodeTokPerSec": 65.76721099652431,
      "prefillTokPerSec": 1172.4921011058452,
      "totalMs": 5588.7849,
      "loadMs": 331.1946,
      "promptEvalMs": 16.2048,
      "evalMs": 3892.5172,
      "promptTokens": 19,
      "responseTokens": 256,
      "responseHashSha256": "3ed6adf61a1e81dfadab5b65c2fbcf32ac869f6104c44c1a34b5b25fcb134bd6",
      "beforeGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 9456,
        "tempC": 63,
        "smClockMhz": 1350,
        "powerDrawW": 107.87
      },
      "afterGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 9456,
        "tempC": 64,
        "smClockMhz": 1350,
        "powerDrawW": 113.12
      }
    },
    {
      "runIndex": 4,
      "startedAt": "2026-06-01T23:35:12.492Z",
      "finishedAt": "2026-06-01T23:35:18.168Z",
      "rawPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-01/alibayram-turkish-gemma-9b-v0-1-latest/run4.ollama.json",
      "logPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-01/alibayram-turkish-gemma-9b-v0-1-latest/run4.log",
      "decodeTokPerSec": 66.91350780891091,
      "prefillTokPerSec": 1135.9831635337446,
      "totalMs": 5586.9355,
      "loadMs": 347.3633,
      "promptEvalMs": 16.7256,
      "evalMs": 3825.8344,
      "promptTokens": 19,
      "responseTokens": 256,
      "responseHashSha256": "3ed6adf61a1e81dfadab5b65c2fbcf32ac869f6104c44c1a34b5b25fcb134bd6",
      "beforeGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 9456,
        "tempC": 64,
        "smClockMhz": 1350,
        "powerDrawW": 106.28
      },
      "afterGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 9456,
        "tempC": 66,
        "smClockMhz": 1350,
        "powerDrawW": 114.98
      }
    },
    {
      "runIndex": 5,
      "startedAt": "2026-06-01T23:35:18.246Z",
      "finishedAt": "2026-06-01T23:35:23.956Z",
      "rawPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-01/alibayram-turkish-gemma-9b-v0-1-latest/run5.ollama.json",
      "logPath": "public/benchmarks/evidence/local-ollama-rtx-3080-16gb-mobile-2026-06-01/alibayram-turkish-gemma-9b-v0-1-latest/run5.log",
      "decodeTokPerSec": 65.64050724932736,
      "prefillTokPerSec": 1170.592258072466,
      "totalMs": 5606.8539,
      "loadMs": 369.3599,
      "promptEvalMs": 16.2311,
      "evalMs": 3900.0308,
      "promptTokens": 19,
      "responseTokens": 256,
      "responseHashSha256": "3ed6adf61a1e81dfadab5b65c2fbcf32ac869f6104c44c1a34b5b25fcb134bd6",
      "beforeGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 9456,
        "tempC": 66,
        "smClockMhz": 1350,
        "powerDrawW": 109.61
      },
      "afterGpu": {
        "vendor": "nvidia",
        "name": "NVIDIA GeForce RTX 3080 Laptop GPU",
        "driver": "571.96",
        "memoryTotalMb": 16384,
        "memoryUsedMb": 9456,
        "tempC": 67,
        "smClockMhz": 1335,
        "powerDrawW": 114.84
      }
    }
  ],
  "errors": [],
  "uploadEligible": true
}