@@ -404,7 +404,8 @@ func TestPromToPodMetrics(t *testing.T) {
404
404
expectedMetrics : & Metrics {
405
405
WaitingQueueSize : 7 ,
406
406
KVCacheUsagePercent : 0.8 ,
407
- ActiveModels : map [string ]int {"lora1" : 0 , "lora2" : 0 , "lora3" : 0 },
407
+ ActiveModels : map [string ]int {"lora1" : 0 , "lora2" : 0 },
408
+ WaitingModels : map [string ]int {"lora3" : 0 },
408
409
MaxActiveModels : 3 ,
409
410
},
410
411
},
@@ -416,8 +417,8 @@ func TestPromToPodMetrics(t *testing.T) {
416
417
KVCacheUtilization : & MetricSpec {MetricName : "vllm_usage" },
417
418
LoraRequestInfo : & MetricSpec {MetricName : "vllm:lora_requests_info" },
418
419
},
419
- existingMetrics : & Metrics {ActiveModels : map [string ]int {}},
420
- expectedMetrics : & Metrics {ActiveModels : map [string ]int {}},
420
+ existingMetrics : & Metrics {ActiveModels : map [string ]int {}, WaitingModels : map [ string ] int {} },
421
+ expectedMetrics : & Metrics {ActiveModels : map [string ]int {}, WaitingModels : map [ string ] int {} },
421
422
expectedErr : multierr .Combine (errors .New ("metric family \" vllm_waiting\" not found" ), errors .New ("metric family \" vllm_usage\" not found" ), errors .New ("metric family \" vllm:lora_requests_info\" not found" )),
422
423
},
423
424
{
@@ -439,7 +440,8 @@ func TestPromToPodMetrics(t *testing.T) {
439
440
expectedMetrics : & Metrics {
440
441
WaitingQueueSize : 0 ,
441
442
KVCacheUsagePercent : 0.8 ,
442
- ActiveModels : map [string ]int {"lora1" : 0 , "lora2" : 0 , "lora3" : 0 },
443
+ ActiveModels : map [string ]int {"lora1" : 0 , "lora2" : 0 },
444
+ WaitingModels : map [string ]int {"lora3" : 0 },
443
445
MaxActiveModels : 3 ,
444
446
},
445
447
expectedErr : errors .New ("metric family \" vllm_waiting\" not found" ),
@@ -457,6 +459,7 @@ func TestPromToPodMetrics(t *testing.T) {
457
459
existingMetrics : & Metrics {},
458
460
expectedMetrics : & Metrics {
459
461
ActiveModels : map [string ]int {"lora1" : 0 },
462
+ WaitingModels : map [string ]int {},
460
463
MaxActiveModels : 0 , // Should still default to 0.
461
464
462
465
},
0 commit comments