{ "runId": "run_ab0f70bd-9ccf-4b30-b253-f808d8d1201d", "bundleId": "llamacpp-gemma-4-e4b-it-q8_0.gguf-d8c24c", "status": "verified", "promptTokens": 40960, "completionTokens": 10240, "contextLength": 5120, "harness": { "version": "0.1.21", "gitSha": "unknown" }, "runtime": { "name": "llama.cpp", "version": "b8796", "buildFlags": "metal" }, "model": { "displayName": "Gemma 4 E4B IT", "format": "gguf", "quant": "q8_0", "architecture": "gemma4", "source": "unsloth/gemma-4-E4B-it-GGUF:gemma-4-E4B-it-Q8_0.gguf", "fileSizeBytes": 8192950976, "lab": { "name": "Google", "slug": "google" }, "quantizedBy": { "name": "Unsloth", "slug": "unsloth" } }, "device": { "cpu": "12th Gen Intel(R) Core(TM) i7-12700F", "cpuCores": 20, "gpu": "NVIDIA GeForce RTX 3060", "gpuCores": 0, "gpuCount": 1, "ramGb": 16, "osName": "Ubuntu 22.04.2 LTS", "osVersion": "22.04" }, "decodeTpsMean": 50.2, "prefillTpsMean": 2608.7, "ttftP50Ms": 1571.46, "idleTpsMean": 4197.3, "peakRssMb": 8142.1, "trialsPassed": 10, "trialsTotal": 10, "runnabilityScore": 0.6775370661272322, "bundleSha256": "eb17e1d389acf7de5abdb91024aa5bf9d156fd25c6b07da19c9ca2cb1847a5a1", "createdAt": "2026-04-14T16:28:07.389Z"}