{ "host": "matt-strix", "gpu": "AMD Strix Halo iGPU", "vram_gb": null, "model_alias": "gemma4:31b", "model_tag": "gemma4:31b", "prompt_key": "long", "prompt_chars": 1614, "num_predict": 256, "num_ctx": 4096, "runs": [ { "prompt_tokens": 319, "prompt_eval_ms": 97.2, "prefill_tok_per_s": 3282.33, "output_tokens": 256, "eval_ms": 24566.1, "decode_tok_per_s": 10.42, "load_ms": 157.2, "total_ms": 24879.5, "harness_wall_s": 24.945, "done_reason": "length" }, { "prompt_tokens": 319, "prompt_eval_ms": 97.3, "prefill_tok_per_s": 3277.8, "output_tokens": 256, "eval_ms": 24560.7, "decode_tok_per_s": 10.42, "load_ms": 162.3, "total_ms": 24880.5, "harness_wall_s": 24.943, "done_reason": "length" }, { "prompt_tokens": 319, "prompt_eval_ms": 97.4, "prefill_tok_per_s": 3274.93, "output_tokens": 256, "eval_ms": 24559.5, "decode_tok_per_s": 10.42, "load_ms": 157.1, "total_ms": 24876.8, "harness_wall_s": 24.94, "done_reason": "length" } ], "warmup": { "prompt_tokens": 319, "prompt_eval_ms": 1052.0, "prefill_tok_per_s": 303.23, "output_tokens": 256, "eval_ms": 24563.0, "decode_tok_per_s": 10.42, "load_ms": 167.6, "total_ms": 25843.0, "harness_wall_s": 25.896, "done_reason": "length" }, "summary": { "prefill_tok_per_s": { "min": 3274.93, "median": 3277.8, "max": 3282.33, "n": 3 }, "decode_tok_per_s": { "min": 10.42, "median": 10.42, "max": 10.42, "n": 3 }, "total_ms": { "min": 24876.8, "median": 24879.5, "max": 24880.5, "n": 3 } } }