{
"benchmark": "responses_stream_ttft",
"generatedAt": "2026-03-31T23:34:32.387Z",
"config": {
"baseUrl": "https://apigw.mka1.com/api/v1/llm",
"model": "gpt-5",
"apiKey": "OMITTED",
"onBehalfOf": "ttft-benchmark-user",
"prompt": "Reply with exactly the text OK and nothing else.",
"samples": 100,
"warmupSamples": 5,
"concurrency": 1,
"timeoutMs": 45000,
"thresholdMs": 1000,
"maxOutputTokens": 64,
"outputJson": "stream-ttft-report.json"
},
"verdict": {
"passed": true,
"thresholdMs": 1000,
"measuredP95Ms": 608.4879000000001
},
"samples": {
"warmup": 5,
"measured": 100,
"success": 100,
"failed": 0
},
"stats": {
"headersMs": {
"count": 100,
"min": 63.00436899999477,
"avg": 67.39161819000238,
"p50": 67.0498840000073,
"p95": 70.41907800000627,
"p99": 72.71200100000715,
"max": 107.99611500000174
},
"firstEventMs": {
"count": 100,
"min": 63.306459000014,
"avg": 67.66752371000103,
"p50": 67.35425400000531,
"p95": 70.69219799997518,
"p99": 73.02295199999935,
"max": 108.39853500000027
},
"firstTokenMs": {
"count": 100,
"min": 293.89441600002465,
"avg": 389.9065817800009,
"p50": 311.1333589999995,
"p95": 608.4879000000001,
"p99": 681.2876299999916,
"max": 695.8577790000054
},
"totalDurationMs": {
"count": 100,
"min": 3047.5074070000264,
"avg": 3146.770197100002,
"p50": 3097.0465299999996,
"p95": 3374.5328960000006,
"p99": 3435.1036190000013,
"max": 3453.2585250000047
}
},
"measurements": [
{
"sampleIndex": 1,
"ok": true,
"httpStatus": 200,
"responseId": "resp_c38d48bebeb74c54b740e627a541cad6",
"headersMs": 66.99634399999923,
"firstEventMs": 67.28057400000034,
"firstTokenMs": 423.95566899999903,
"totalDurationMs": 3195.7519509999984,
"eventCount": 137,
"textDeltaCount": 62,
"outputTextDeltaCount": 0,
"reasoningTextDeltaCount": 62,
"text": "Okay o usuário pediu para responder exatamente com \"OK\" e nada mais. Vou verificar se entendi corretamente. Ele quer que eu ignore qualquer outra coisa e só envie \"OK\". Não há necessidade de usar nenhuma ferramenta aqui, já que a resposta é"
},
...
]
}