We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 4829137, commit e24e0d8 (Copy full SHA for e24e0d8)
deploy/config/epp-precise-prefix-cache-config.yaml
@@ -13,7 +13,7 @@ plugins:
13
hashSeed: "42" # must match vLLM PYTHONHASHSEED env var
14
kvBlockIndexConfig:
15
enableMetrics: true # enable kv-block index metrics (prometheus)
16
- - type: kv-cache-scorer # kv-cache-utilization
+ - type: kv-cache-utilization-scorer
17
- type: queue-scorer
18
- type: max-score-picker
19
schedulingProfiles:
@@ -22,7 +22,7 @@ schedulingProfiles:
22
- pluginRef: decode-filter
23
- pluginRef: precise-prefix-cache-scorer
24
weight: 2.0
25
- - pluginRef: kv-cache-scorer
+ - pluginRef: kv-cache-utilization-scorer
26
weight: 1.0
27
- pluginRef: queue-scorer
28
0 commit comments