|
| 1 | +# HELP llmservice_model_request_duration_seconds [ALPHA] LLM service response latency distribution in seconds for each model and target model. |
| 2 | +# TYPE llmservice_model_request_duration_seconds histogram |
| 3 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10", model_name="m10", target_model_name="t10", le="0.005"} 0 |
| 4 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10", model_name="m10", target_model_name="t10", le="0.025"} 1 |
| 5 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10", model_name="m10", target_model_name="t10", le="0.05"} 1 |
| 6 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10", model_name="m10", target_model_name="t10", le="0.1"} 1 |
| 7 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10", model_name="m10", target_model_name="t10", le="0.2"} 1 |
| 8 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10", model_name="m10", target_model_name="t10", le="0.4"} 1 |
| 9 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10", model_name="m10", target_model_name="t10", le="0.6"} 1 |
| 10 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10", model_name="m10", target_model_name="t10", le="0.8"} 1 |
| 11 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10", model_name="m10", target_model_name="t10", le="1"} 1 |
| 12 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10", model_name="m10", target_model_name="t10", le="1.25"} 1 |
| 13 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10", model_name="m10", target_model_name="t10", le="1.5"} 1 |
| 14 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10", model_name="m10", target_model_name="t10", le="2"} 2 |
| 15 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10", model_name="m10", target_model_name="t10", le="3"} 2 |
| 16 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10", model_name="m10", target_model_name="t10", le="4"} 2 |
| 17 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10", model_name="m10", target_model_name="t10", le="5"} 2 |
| 18 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10", model_name="m10", target_model_name="t10", le="6"} 2 |
| 19 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10", model_name="m10", target_model_name="t10", le="8"} 2 |
| 20 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10", model_name="m10", target_model_name="t10", le="10"} 2 |
| 21 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10", model_name="m10", target_model_name="t10", le="15"} 2 |
| 22 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10", model_name="m10", target_model_name="t10", le="20"} 2 |
| 23 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10", model_name="m10", target_model_name="t10", le="30"} 2 |
| 24 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10", model_name="m10", target_model_name="t10", le="45"} 2 |
| 25 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10", model_name="m10", target_model_name="t10", le="60"} 2 |
| 26 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10", model_name="m10", target_model_name="t10", le="120"} 2 |
| 27 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10", model_name="m10", target_model_name="t10", le="180"} 2 |
| 28 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10", model_name="m10", target_model_name="t10", le="240"} 2 |
| 29 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10", model_name="m10", target_model_name="t10", le="300"} 2 |
| 30 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10", model_name="m10", target_model_name="t10", le="360"} 2 |
| 31 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10", model_name="m10", target_model_name="t10", le="480"} 2 |
| 32 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10", model_name="m10", target_model_name="t10", le="600"} 2 |
| 33 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10", model_name="m10", target_model_name="t10", le="900"} 2 |
| 34 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10", model_name="m10", target_model_name="t10", le="1200"} 2 |
| 35 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10", model_name="m10", target_model_name="t10", le="1800"} 2 |
| 36 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10", model_name="m10", target_model_name="t10", le="2700"} 2 |
| 37 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10", model_name="m10", target_model_name="t10", le="3600"} 2 |
| 38 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10", model_name="m10", target_model_name="t10", le="+Inf"} 2 |
| 39 | +llmservice_model_request_duration_seconds_sum{llmservice_name="s10", model_name="m10", target_model_name="t10"} 1.61 |
| 40 | +llmservice_model_request_duration_seconds_count{llmservice_name="s10", model_name="m10", target_model_name="t10"} 2 |
| 41 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10",model_name="m10",target_model_name="t11",le="0.005"} 0 |
| 42 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10",model_name="m10",target_model_name="t11",le="0.025"} 0 |
| 43 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10",model_name="m10",target_model_name="t11",le="0.05"} 0 |
| 44 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10",model_name="m10",target_model_name="t11",le="0.1"} 1 |
| 45 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10",model_name="m10",target_model_name="t11",le="0.2"} 1 |
| 46 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10",model_name="m10",target_model_name="t11",le="0.4"} 1 |
| 47 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10",model_name="m10",target_model_name="t11",le="0.6"} 1 |
| 48 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10",model_name="m10",target_model_name="t11",le="0.8"} 1 |
| 49 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10",model_name="m10",target_model_name="t11",le="1"} 1 |
| 50 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10",model_name="m10",target_model_name="t11",le="1.25"} 1 |
| 51 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10",model_name="m10",target_model_name="t11",le="1.5"} 1 |
| 52 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10",model_name="m10",target_model_name="t11",le="2"} 1 |
| 53 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10",model_name="m10",target_model_name="t11",le="3"} 1 |
| 54 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10",model_name="m10",target_model_name="t11",le="4"} 1 |
| 55 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10",model_name="m10",target_model_name="t11",le="5"} 1 |
| 56 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10",model_name="m10",target_model_name="t11",le="6"} 1 |
| 57 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10",model_name="m10",target_model_name="t11",le="8"} 1 |
| 58 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10",model_name="m10",target_model_name="t11",le="10"} 1 |
| 59 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10",model_name="m10",target_model_name="t11",le="15"} 1 |
| 60 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10",model_name="m10",target_model_name="t11",le="20"} 1 |
| 61 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10",model_name="m10",target_model_name="t11",le="30"} 1 |
| 62 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10",model_name="m10",target_model_name="t11",le="45"} 1 |
| 63 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10",model_name="m10",target_model_name="t11",le="60"} 1 |
| 64 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10",model_name="m10",target_model_name="t11",le="120"} 1 |
| 65 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10",model_name="m10",target_model_name="t11",le="180"} 1 |
| 66 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10",model_name="m10",target_model_name="t11",le="240"} 1 |
| 67 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10",model_name="m10",target_model_name="t11",le="300"} 1 |
| 68 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10",model_name="m10",target_model_name="t11",le="360"} 1 |
| 69 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10",model_name="m10",target_model_name="t11",le="480"} 1 |
| 70 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10",model_name="m10",target_model_name="t11",le="600"} 1 |
| 71 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10",model_name="m10",target_model_name="t11",le="900"} 1 |
| 72 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10",model_name="m10",target_model_name="t11",le="1200"} 1 |
| 73 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10",model_name="m10",target_model_name="t11",le="1800"} 1 |
| 74 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10",model_name="m10",target_model_name="t11",le="2700"} 1 |
| 75 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10",model_name="m10",target_model_name="t11",le="3600"} 1 |
| 76 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s10",model_name="m10",target_model_name="t11",le="+Inf"} 1 |
| 77 | +llmservice_model_request_duration_seconds_sum{llmservice_name="s10",model_name="m10",target_model_name="t11"} 0.06 |
| 78 | +llmservice_model_request_duration_seconds_count{llmservice_name="s10",model_name="m10",target_model_name="t11"} 1 |
| 79 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s20",model_name="m20",target_model_name="t20",le="0.005"} 0 |
| 80 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s20",model_name="m20",target_model_name="t20",le="0.025"} 0 |
| 81 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s20",model_name="m20",target_model_name="t20",le="0.05"} 0 |
| 82 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s20",model_name="m20",target_model_name="t20",le="0.1"} 0 |
| 83 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s20",model_name="m20",target_model_name="t20",le="0.2"} 1 |
| 84 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s20",model_name="m20",target_model_name="t20",le="0.4"} 1 |
| 85 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s20",model_name="m20",target_model_name="t20",le="0.6"} 1 |
| 86 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s20",model_name="m20",target_model_name="t20",le="0.8"} 1 |
| 87 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s20",model_name="m20",target_model_name="t20",le="1"} 1 |
| 88 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s20",model_name="m20",target_model_name="t20",le="1.25"} 1 |
| 89 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s20",model_name="m20",target_model_name="t20",le="1.5"} 1 |
| 90 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s20",model_name="m20",target_model_name="t20",le="2"} 1 |
| 91 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s20",model_name="m20",target_model_name="t20",le="3"} 1 |
| 92 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s20",model_name="m20",target_model_name="t20",le="4"} 1 |
| 93 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s20",model_name="m20",target_model_name="t20",le="5"} 1 |
| 94 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s20",model_name="m20",target_model_name="t20",le="6"} 1 |
| 95 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s20",model_name="m20",target_model_name="t20",le="8"} 1 |
| 96 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s20",model_name="m20",target_model_name="t20",le="10"} 1 |
| 97 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s20",model_name="m20",target_model_name="t20",le="15"} 1 |
| 98 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s20",model_name="m20",target_model_name="t20",le="20"} 1 |
| 99 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s20",model_name="m20",target_model_name="t20",le="30"} 1 |
| 100 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s20",model_name="m20",target_model_name="t20",le="45"} 1 |
| 101 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s20",model_name="m20",target_model_name="t20",le="60"} 1 |
| 102 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s20",model_name="m20",target_model_name="t20",le="120"} 1 |
| 103 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s20",model_name="m20",target_model_name="t20",le="180"} 1 |
| 104 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s20",model_name="m20",target_model_name="t20",le="240"} 1 |
| 105 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s20",model_name="m20",target_model_name="t20",le="300"} 1 |
| 106 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s20",model_name="m20",target_model_name="t20",le="360"} 1 |
| 107 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s20",model_name="m20",target_model_name="t20",le="480"} 1 |
| 108 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s20",model_name="m20",target_model_name="t20",le="600"} 1 |
| 109 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s20",model_name="m20",target_model_name="t20",le="900"} 1 |
| 110 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s20",model_name="m20",target_model_name="t20",le="1200"} 1 |
| 111 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s20",model_name="m20",target_model_name="t20",le="1800"} 1 |
| 112 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s20",model_name="m20",target_model_name="t20",le="2700"} 1 |
| 113 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s20",model_name="m20",target_model_name="t20",le="3600"} 1 |
| 114 | +llmservice_model_request_duration_seconds_bucket{llmservice_name="s20",model_name="m20",target_model_name="t20",le="+Inf"} 1 |
| 115 | +llmservice_model_request_duration_seconds_sum{llmservice_name="s20",model_name="m20",target_model_name="t20"} 0.12 |
| 116 | +llmservice_model_request_duration_seconds_count{llmservice_name="s20",model_name="m20",target_model_name="t20"} 1 |
0 commit comments