{ "runId": "run_9f13babf-cd2c-421e-a19e-829f2c059a63", "bundleId": "llamacpp-gemma-4-e4b-it-q8_0.gguf-712cd1", "status": "verified", "promptTokens": 40960, "completionTokens": 10240, "contextLength": 5120, "harness": { "version": "0.1.21", "gitSha": "unknown" }, "runtime": { "name": "llama.cpp", "version": "b8680", "buildFlags": "metal" }, "model": { "displayName": "Gemma 4 E4B IT", "format": "gguf", "quant": "q8_0", "architecture": "gemma4", "source": "unsloth/gemma-4-E4B-it-GGUF:gemma-4-E4B-it-Q8_0.gguf", "fileSizeBytes": 8192950976, "lab": { "name": "Google", "slug": "google" }, "quantizedBy": { "name": "Unsloth", "slug": "unsloth" } }, "device": { "cpu": "12th Gen Intel(R) Core(TM) i7-12700F", "cpuCores": 20, "gpu": "NVIDIA GeForce RTX 3060", "gpuCores": 0, "gpuCount": 1, "ramGb": 16, "osName": "Ubuntu 22.04.2 LTS", "osVersion": "22.04" }, "decodeTpsMean": 7.8, "prefillTpsMean": 38.4, "ttftP50Ms": 108851.64, "idleTpsMean": 7160.1, "peakRssMb": 7408.6, "trialsPassed": 10, "trialsTotal": 10, "runnabilityScore": 0.25620640345982143, "bundleSha256": "68d443a8d07790eceea1f656c23b4efbd3a515a0f529ef915115be0376774889", "createdAt": "2026-04-14T15:16:46.739Z"}