|
106 | 106 | "type": "prometheus", |
107 | 107 | "uid": "prometheus" |
108 | 108 | }, |
109 | | - "expr": "histogram_quantile(0.50, sum(rate(llm_latency_ms_milliseconds_bucket[5m])) by (le, llm_class))", |
| 109 | + "expr": "histogram_quantile(0.50, sum(rate(llm_latency_ms_bucket[5m])) by (le, llm_class))", |
110 | 110 | "legendFormat": "p50 - {{llm_class}}", |
111 | 111 | "refId": "A" |
112 | 112 | }, |
|
115 | 115 | "type": "prometheus", |
116 | 116 | "uid": "prometheus" |
117 | 117 | }, |
118 | | - "expr": "histogram_quantile(0.95, sum(rate(llm_latency_ms_milliseconds_bucket[5m])) by (le, llm_class))", |
| 118 | + "expr": "histogram_quantile(0.95, sum(rate(llm_latency_ms_bucket[5m])) by (le, llm_class))", |
119 | 119 | "legendFormat": "p95 - {{llm_class}}", |
120 | 120 | "refId": "B" |
121 | 121 | }, |
|
124 | 124 | "type": "prometheus", |
125 | 125 | "uid": "prometheus" |
126 | 126 | }, |
127 | | - "expr": "histogram_quantile(0.99, sum(rate(llm_latency_ms_milliseconds_bucket[5m])) by (le, llm_class))", |
| 127 | + "expr": "histogram_quantile(0.99, sum(rate(llm_latency_ms_bucket[5m])) by (le, llm_class))", |
128 | 128 | "legendFormat": "p99 - {{llm_class}}", |
129 | 129 | "refId": "C" |
130 | 130 | } |
|
216 | 216 | "type": "prometheus", |
217 | 217 | "uid": "prometheus" |
218 | 218 | }, |
219 | | - "expr": "histogram_quantile(0.50, sum(rate(stt_latency_ms_milliseconds_bucket[5m])) by (le, stt_class))", |
| 219 | + "expr": "histogram_quantile(0.50, sum(rate(stt_latency_ms_bucket[5m])) by (le, stt_class))", |
220 | 220 | "legendFormat": "p50 - {{stt_class}}", |
221 | 221 | "refId": "A" |
222 | 222 | }, |
|
225 | 225 | "type": "prometheus", |
226 | 226 | "uid": "prometheus" |
227 | 227 | }, |
228 | | - "expr": "histogram_quantile(0.95, sum(rate(stt_latency_ms_milliseconds_bucket[5m])) by (le, stt_class))", |
| 228 | + "expr": "histogram_quantile(0.95, sum(rate(stt_latency_ms_bucket[5m])) by (le, stt_class))", |
229 | 229 | "legendFormat": "p95 - {{stt_class}}", |
230 | 230 | "refId": "B" |
231 | 231 | }, |
|
234 | 234 | "type": "prometheus", |
235 | 235 | "uid": "prometheus" |
236 | 236 | }, |
237 | | - "expr": "histogram_quantile(0.99, sum(rate(stt_latency_ms_milliseconds_bucket[5m])) by (le, stt_class))", |
| 237 | + "expr": "histogram_quantile(0.99, sum(rate(stt_latency_ms_bucket[5m])) by (le, stt_class))", |
238 | 238 | "legendFormat": "p99 - {{stt_class}}", |
239 | 239 | "refId": "C" |
240 | 240 | } |
|
326 | 326 | "type": "prometheus", |
327 | 327 | "uid": "prometheus" |
328 | 328 | }, |
329 | | - "expr": "histogram_quantile(0.50, sum(rate(tts_latency_ms_milliseconds_bucket[5m])) by (le, tts_class))", |
| 329 | + "expr": "histogram_quantile(0.50, sum(rate(tts_latency_ms_bucket[5m])) by (le, tts_class))", |
330 | 330 | "legendFormat": "p50 - {{tts_class}}", |
331 | 331 | "refId": "A" |
332 | 332 | }, |
|
335 | 335 | "type": "prometheus", |
336 | 336 | "uid": "prometheus" |
337 | 337 | }, |
338 | | - "expr": "histogram_quantile(0.95, sum(rate(tts_latency_ms_milliseconds_bucket[5m])) by (le, tts_class))", |
| 338 | + "expr": "histogram_quantile(0.95, sum(rate(tts_latency_ms_bucket[5m])) by (le, tts_class))", |
339 | 339 | "legendFormat": "p95 - {{tts_class}}", |
340 | 340 | "refId": "B" |
341 | 341 | }, |
|
344 | 344 | "type": "prometheus", |
345 | 345 | "uid": "prometheus" |
346 | 346 | }, |
347 | | - "expr": "histogram_quantile(0.99, sum(rate(tts_latency_ms_milliseconds_bucket[5m])) by (le, tts_class))", |
| 347 | + "expr": "histogram_quantile(0.99, sum(rate(tts_latency_ms_bucket[5m])) by (le, tts_class))", |
348 | 348 | "legendFormat": "p99 - {{tts_class}}", |
349 | 349 | "refId": "C" |
350 | 350 | } |
|
436 | 436 | "type": "prometheus", |
437 | 437 | "uid": "prometheus" |
438 | 438 | }, |
439 | | - "expr": "histogram_quantile(0.50, sum(rate(turn_detection_latency_ms_milliseconds_bucket[5m])) by (le, provider))", |
| 439 | + "expr": "histogram_quantile(0.50, sum(rate(turn_detection_latency_ms_bucket[5m])) by (le, provider))", |
440 | 440 | "legendFormat": "p50 - {{provider}}", |
441 | 441 | "refId": "A" |
442 | 442 | }, |
|
445 | 445 | "type": "prometheus", |
446 | 446 | "uid": "prometheus" |
447 | 447 | }, |
448 | | - "expr": "histogram_quantile(0.95, sum(rate(turn_detection_latency_ms_milliseconds_bucket[5m])) by (le, provider))", |
| 448 | + "expr": "histogram_quantile(0.95, sum(rate(turn_detection_latency_ms_bucket[5m])) by (le, provider))", |
449 | 449 | "legendFormat": "p95 - {{provider}}", |
450 | 450 | "refId": "B" |
451 | 451 | }, |
|
454 | 454 | "type": "prometheus", |
455 | 455 | "uid": "prometheus" |
456 | 456 | }, |
457 | | - "expr": "histogram_quantile(0.99, sum(rate(turn_detection_latency_ms_milliseconds_bucket[5m])) by (le, provider))", |
| 457 | + "expr": "histogram_quantile(0.99, sum(rate(turn_detection_latency_ms_bucket[5m])) by (le, provider))", |
458 | 458 | "legendFormat": "p99 - {{provider}}", |
459 | 459 | "refId": "C" |
460 | 460 | } |
|
546 | 546 | "type": "prometheus", |
547 | 547 | "uid": "prometheus" |
548 | 548 | }, |
549 | | - "expr": "histogram_quantile(0.50, sum(rate(turn_vad_latency_ms_milliseconds_bucket[5m])) by (le, implementation))", |
| 549 | + "expr": "histogram_quantile(0.50, sum(rate(turn_vad_latency_ms_bucket[5m])) by (le, implementation))", |
550 | 550 | "legendFormat": "p50 - {{implementation}}", |
551 | 551 | "refId": "A" |
552 | 552 | }, |
|
555 | 555 | "type": "prometheus", |
556 | 556 | "uid": "prometheus" |
557 | 557 | }, |
558 | | - "expr": "histogram_quantile(0.95, sum(rate(turn_vad_latency_ms_milliseconds_bucket[5m])) by (le, implementation))", |
| 558 | + "expr": "histogram_quantile(0.95, sum(rate(turn_vad_latency_ms_bucket[5m])) by (le, implementation))", |
559 | 559 | "legendFormat": "p95 - {{implementation}}", |
560 | 560 | "refId": "B" |
561 | 561 | }, |
|
564 | 564 | "type": "prometheus", |
565 | 565 | "uid": "prometheus" |
566 | 566 | }, |
567 | | - "expr": "histogram_quantile(0.99, sum(rate(turn_vad_latency_ms_milliseconds_bucket[5m])) by (le, implementation))", |
| 567 | + "expr": "histogram_quantile(0.99, sum(rate(turn_vad_latency_ms_bucket[5m])) by (le, implementation))", |
568 | 568 | "legendFormat": "p99 - {{implementation}}", |
569 | 569 | "refId": "C" |
570 | 570 | } |
|
656 | 656 | "type": "prometheus", |
657 | 657 | "uid": "prometheus" |
658 | 658 | }, |
659 | | - "expr": "histogram_quantile(0.50, sum(rate(turn_end_detection_latency_ms_milliseconds_bucket[5m])) by (le, implementation))", |
| 659 | + "expr": "histogram_quantile(0.50, sum(rate(turn_end_detection_latency_ms_bucket[5m])) by (le, implementation))", |
660 | 660 | "legendFormat": "p50 - {{implementation}}", |
661 | 661 | "refId": "A" |
662 | 662 | }, |
|
665 | 665 | "type": "prometheus", |
666 | 666 | "uid": "prometheus" |
667 | 667 | }, |
668 | | - "expr": "histogram_quantile(0.95, sum(rate(turn_end_detection_latency_ms_milliseconds_bucket[5m])) by (le, implementation))", |
| 668 | + "expr": "histogram_quantile(0.95, sum(rate(turn_end_detection_latency_ms_bucket[5m])) by (le, implementation))", |
669 | 669 | "legendFormat": "p95 - {{implementation}}", |
670 | 670 | "refId": "B" |
671 | 671 | }, |
|
674 | 674 | "type": "prometheus", |
675 | 675 | "uid": "prometheus" |
676 | 676 | }, |
677 | | - "expr": "histogram_quantile(0.99, sum(rate(turn_end_detection_latency_ms_milliseconds_bucket[5m])) by (le, implementation))", |
| 677 | + "expr": "histogram_quantile(0.99, sum(rate(turn_end_detection_latency_ms_bucket[5m])) by (le, implementation))", |
678 | 678 | "legendFormat": "p99 - {{implementation}}", |
679 | 679 | "refId": "C" |
680 | 680 | } |
|
0 commit comments