{
  "evidenceVersion": "local-ollama-tps-sweep-v1",
  "capturedAt": "2026-05-28T05:13:10.545Z",
  "evidenceUrl": "https://www.runlocalai.co/benchmarks/evidence/local-ollama-rtx-5080-2026-05-28-turkish-sweep/kumru-2b/evidence.json",
  "hardwareSlug": "rtx-5080",
  "hardwareLabel": "rtx-5080-16gb",
  "gpu": "NVIDIA GeForce RTX 5080 16GB",
  "runtime": "ollama-local-api",
  "scenario": "single-stream",
  "command": "POST http://localhost:11434/api/generate model=alibayram/kumru:latest temperature=0 seed=42 num_ctx=2048 num_predict=512",
  "contextSize": 2048,
  "numPredict": 512,
  "seed": 42,
  "temperature": 0,
  "promptSha256": "843f1934769f40e6972f520eafd20f336ef4fa86d7f50530aa03477d411084fa",
  "protocolNote": "Batch=1, 2048 context, 512 generated tokens, consecutive warm-model runs. Generation TPS uses Ollama eval_count/eval_duration.",
  "outputHash": "12c8d822940557b9a8381fcd5594d09e62b5ca1bcc036192447ba812eb8d688d",
  "sourceFileSha256": "897d20358d0a41bb640d93209207220980320a91618c1f3a18a382dbbe22e414",
  "sourceResultSha256": "6ffc8a6782bb9e94aa30524c89da9867d4caa5829a043f932e661c2d3b91d037",
  "artifactHashSha256": "a099071b5ad93fb33c56cefdfb50e3e7516800527fa4c3b7ca7c3e14033eaae0",
  "logHashSha256": "a099071b5ad93fb33c56cefdfb50e3e7516800527fa4c3b7ca7c3e14033eaae0",
  "logHashNote": "Structured Ollama API sweep hash. No separate verbose text logs were captured for this sweep.",
  "modelTag": "alibayram/kumru:latest",
  "catalogSlug": "kumru-2b",
  "family": "llama",
  "parameterSize": "2.4B",
  "quantizationLevel": "Q4_K_M",
  "modelSizeBytes": 1458559332,
  "digest": "04f3c85761dd4f928a33a739d47924674f2b034d511664213b3576934c7078e6",
  "isTurkishModel": true,
  "scoresGenerationTps": [
    446,
    397.42,
    443.66,
    406.67,
    454.33
  ],
  "statsGenerationTps": {
    "min": 397.42,
    "max": 454.33,
    "median": 443.66,
    "p5": 399.27000000000004,
    "p95": 452.664,
    "mean": 429.6160000000001,
    "stdev": 22.97630309688658,
    "cvPct": 5.348102281313213,
    "n": 5
  },
  "runsCaptured": 5,
  "runStatsJson": {
    "runs": [
      {
        "runIndex": 1,
        "tokPerSec": 446,
        "totalTokPerSec": 333.04,
        "ttftMs": null,
        "prefillTokPerSec": 6864.9443069306935,
        "promptTokens": 71,
        "responseTokens": 448,
        "promptEvalMs": 10.3424,
        "evalMs": 1004.4829,
        "totalMs": 1345.1708,
        "wallMs": 1351,
        "doneReason": "stop",
        "responseHash": "9c81ca4dbcb99536b8e68d42b6eae56a6c289da1221339bb9a0c9e5b119f147e"
      },
      {
        "runIndex": 2,
        "tokPerSec": 397.42,
        "totalTokPerSec": 322.56,
        "ttftMs": null,
        "prefillTokPerSec": 16443.940060680456,
        "promptTokens": 71,
        "responseTokens": 512,
        "promptEvalMs": 4.3177,
        "evalMs": 1288.2989,
        "totalMs": 1587.3004,
        "wallMs": 1594,
        "doneReason": "length",
        "responseHash": "155f9afef04b13be580019c31e47cd7e8ccf7eca4da219a033c1037301485ac0"
      },
      {
        "runIndex": 3,
        "tokPerSec": 443.66,
        "totalTokPerSec": 335.56,
        "ttftMs": null,
        "prefillTokPerSec": 18191.135024340252,
        "promptTokens": 71,
        "responseTokens": 512,
        "promptEvalMs": 3.903,
        "evalMs": 1154.0344,
        "totalMs": 1525.7866,
        "wallMs": 1531,
        "doneReason": "length",
        "responseHash": "155f9afef04b13be580019c31e47cd7e8ccf7eca4da219a033c1037301485ac0"
      },
      {
        "runIndex": 4,
        "tokPerSec": 406.67,
        "totalTokPerSec": 329.75,
        "ttftMs": null,
        "prefillTokPerSec": 21652.282638528864,
        "promptTokens": 71,
        "responseTokens": 512,
        "promptEvalMs": 3.2791,
        "evalMs": 1259.0028,
        "totalMs": 1552.698,
        "wallMs": 1557,
        "doneReason": "length",
        "responseHash": "155f9afef04b13be580019c31e47cd7e8ccf7eca4da219a033c1037301485ac0"
      },
      {
        "runIndex": 5,
        "tokPerSec": 454.33,
        "totalTokPerSec": 343.2,
        "ttftMs": null,
        "prefillTokPerSec": 22059.280432486175,
        "promptTokens": 71,
        "responseTokens": 512,
        "promptEvalMs": 3.2186,
        "evalMs": 1126.9321,
        "totalMs": 1491.8451,
        "wallMs": 1496,
        "doneReason": "length",
        "responseHash": "155f9afef04b13be580019c31e47cd7e8ccf7eca4da219a033c1037301485ac0"
      }
    ],
    "coldStart": null,
    "steady": {
      "min": 397.42,
      "max": 454.33,
      "median": 443.66,
      "p5": 399.27000000000004,
      "p95": 452.664,
      "mean": 429.6160000000001,
      "stdev": 22.97630309688658,
      "cvPct": 5.348102281313213,
      "n": 5
    },
    "warm": {
      "min": 397.42,
      "max": 454.33,
      "median": 443.66,
      "p5": 399.27000000000004,
      "p95": 452.664,
      "mean": 429.6160000000001,
      "stdev": 22.97630309688658,
      "cvPct": 5.348102281313213,
      "n": 5
    },
    "power": null,
    "accuracy": null,
    "env": {
      "hardware": "rtx-5080-16gb",
      "hardwareSlug": "rtx-5080",
      "gpu": "NVIDIA GeForce RTX 5080 16GB",
      "runtime": "ollama-local-api"
    },
    "protocol": {
      "benchmark": "yerelai-local-ollama-tps-sweep",
      "dimension": "tps",
      "sampleCount": 5,
      "contextLength": 2048,
      "numPredict": 512,
      "seed": 42,
      "temperature": 0,
      "promptSha256": "843f1934769f40e6972f520eafd20f336ef4fa86d7f50530aa03477d411084fa",
      "protocolNote": "Batch=1, 2048 context, 512 generated tokens, consecutive warm-model runs. Generation TPS uses Ollama eval_count/eval_duration.",
      "warmModelRuns": true,
      "batchSize": 1,
      "concurrency": 1
    },
    "model": {
      "tag": "alibayram/kumru:latest",
      "catalogSlug": "kumru-2b",
      "family": "llama",
      "parameterSize": "2.4B",
      "quantizationLevel": "Q4_K_M",
      "sizeBytes": 1458559332,
      "digest": "04f3c85761dd4f928a33a739d47924674f2b034d511664213b3576934c7078e6",
      "isTurkishModel": true
    },
    "evidenceUrl": "https://www.runlocalai.co/benchmarks/evidence/local-ollama-rtx-5080-2026-05-28-turkish-sweep/kumru-2b/evidence.json",
    "command": "POST http://localhost:11434/api/generate model=alibayram/kumru:latest temperature=0 seed=42 num_ctx=2048 num_predict=512",
    "outputHash": "12c8d822940557b9a8381fcd5594d09e62b5ca1bcc036192447ba812eb8d688d",
    "sourceFileSha256": "897d20358d0a41bb640d93209207220980320a91618c1f3a18a382dbbe22e414",
    "sourceResultSha256": "6ffc8a6782bb9e94aa30524c89da9867d4caa5829a043f932e661c2d3b91d037",
    "artifactHashSha256": "a099071b5ad93fb33c56cefdfb50e3e7516800527fa4c3b7ca7c3e14033eaae0",
    "logHashSha256": "a099071b5ad93fb33c56cefdfb50e3e7516800527fa4c3b7ca7c3e14033eaae0",
    "logHashNote": "Structured Ollama API sweep hash. No separate verbose text logs were captured for this sweep.",
    "intakeVersion": "V39.0-ollama-tps-sweep",
    "capturedAt": "2026-05-28T05:13:10.545Z"
  },
  "rawResult": {
    "model": "alibayram/kumru:latest",
    "model_slug": "kumru-2b",
    "is_turkish_model": true,
    "family": "llama",
    "parameter_size": "2.4B",
    "quantization_level": "Q4_K_M",
    "model_size_bytes": 1458559332,
    "digest": "04f3c85761dd4f928a33a739d47924674f2b034d511664213b3576934c7078e6",
    "scores_generation_tps": [
      446,
      397.42,
      443.66,
      406.67,
      454.33
    ],
    "mean_generation_tps": 429.62,
    "median_generation_tps": 443.66,
    "min_generation_tps": 397.42,
    "max_generation_tps": 454.33,
    "runs": [
      {
        "run": 1,
        "generated_tokens": 448,
        "prompt_tokens": 71,
        "eval_duration_ns": 1004482900,
        "prompt_eval_duration_ns": 10342400,
        "total_duration_ns": 1345170800,
        "wall_ms": 1351,
        "generation_tps": 446,
        "total_tps": 333.04,
        "done_reason": "stop",
        "response_sha256": "9c81ca4dbcb99536b8e68d42b6eae56a6c289da1221339bb9a0c9e5b119f147e"
      },
      {
        "run": 2,
        "generated_tokens": 512,
        "prompt_tokens": 71,
        "eval_duration_ns": 1288298900,
        "prompt_eval_duration_ns": 4317700,
        "total_duration_ns": 1587300400,
        "wall_ms": 1594,
        "generation_tps": 397.42,
        "total_tps": 322.56,
        "done_reason": "length",
        "response_sha256": "155f9afef04b13be580019c31e47cd7e8ccf7eca4da219a033c1037301485ac0"
      },
      {
        "run": 3,
        "generated_tokens": 512,
        "prompt_tokens": 71,
        "eval_duration_ns": 1154034400,
        "prompt_eval_duration_ns": 3903000,
        "total_duration_ns": 1525786600,
        "wall_ms": 1531,
        "generation_tps": 443.66,
        "total_tps": 335.56,
        "done_reason": "length",
        "response_sha256": "155f9afef04b13be580019c31e47cd7e8ccf7eca4da219a033c1037301485ac0"
      },
      {
        "run": 4,
        "generated_tokens": 512,
        "prompt_tokens": 71,
        "eval_duration_ns": 1259002800,
        "prompt_eval_duration_ns": 3279100,
        "total_duration_ns": 1552698000,
        "wall_ms": 1557,
        "generation_tps": 406.67,
        "total_tps": 329.75,
        "done_reason": "length",
        "response_sha256": "155f9afef04b13be580019c31e47cd7e8ccf7eca4da219a033c1037301485ac0"
      },
      {
        "run": 5,
        "generated_tokens": 512,
        "prompt_tokens": 71,
        "eval_duration_ns": 1126932100,
        "prompt_eval_duration_ns": 3218600,
        "total_duration_ns": 1491845100,
        "wall_ms": 1496,
        "generation_tps": 454.33,
        "total_tps": 343.2,
        "done_reason": "length",
        "response_sha256": "155f9afef04b13be580019c31e47cd7e8ccf7eca4da219a033c1037301485ac0"
      }
    ]
  }
}