File tree Expand file tree Collapse file tree
Expand file tree Collapse file tree Original file line number Diff line number Diff line change @@ -26,7 +26,7 @@ ucm_connectors:
2626
2727# When you use UcmNfsStore, you should set enable_event_sync to false.
2828enable_event_sync : true
29- # Use event from vllm ascend to do D2H immediatly after kv cache dump .
29+ # Use vLLM-Ascend reshape cache events to start the D2H (device-to-host) transfer immediately after the KV cache is ready.
3030# Enable for better dump performance.
3131enable_reshape_cache_event_sync : false
3232# Enable UCM metrics so they can be monitored online via Grafana and Prometheus.
Original file line number Diff line number Diff line change @@ -882,13 +882,9 @@ def _get_dump_event_handle(
882882 event_handle = self .device .get_event_handle ()
883883 if event_handle == 0 :
884884 self .device .synchronize ()
885- ucmmetrics .update_stats (
886- "dump_event_sync_fallback_used_total" , 1.0
887- )
885+ ucmmetrics .update_stats ("dump_event_sync_fallback_used_total" , 1.0 )
888886 else :
889- ucmmetrics .update_stats (
890- "dump_event_current_stream_used_total" , 1.0
891- )
887+ ucmmetrics .update_stats ("dump_event_current_stream_used_total" , 1.0 )
892888 return event_handle
893889
894890 def save_kv_layer (
You can’t perform that action at this time.
0 commit comments