Skip to content

Commit 8167f53

Browse files
committed
Fix reshape event sync formatting
1 parent 5100ee1 commit 8167f53

2 files changed

Lines changed: 3 additions & 7 deletions

File tree

examples/ucm_config_example.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -26,7 +26,7 @@ ucm_connectors:
2626

2727
# When you use UcmNfsStore, you should set enable_event_sync to false.
2828
enable_event_sync: true
29-
# Use event from vllm ascend to do D2H immediatly after kv cache dump.
29+
# Use vLLM-Ascend reshape cache events to start D2H immediately after KV cache is ready.
3030
# Enable for better dump performance.
3131
enable_reshape_cache_event_sync: false
3232
# Enable UCM metrics so they can be monitored online via Grafana and Prometheus.

ucm/integration/vllm/ucm_connector.py

Lines changed: 2 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -882,13 +882,9 @@ def _get_dump_event_handle(
882882
event_handle = self.device.get_event_handle()
883883
if event_handle == 0:
884884
self.device.synchronize()
885-
ucmmetrics.update_stats(
886-
"dump_event_sync_fallback_used_total", 1.0
887-
)
885+
ucmmetrics.update_stats("dump_event_sync_fallback_used_total", 1.0)
888886
else:
889-
ucmmetrics.update_stats(
890-
"dump_event_current_stream_used_total", 1.0
891-
)
887+
ucmmetrics.update_stats("dump_event_current_stream_used_total", 1.0)
892888
return event_handle
893889

894890
def save_kv_layer(

0 commit comments

Comments
 (0)