1 parent a9592ca commit 63fee4f
python/sglang/srt/layers/attention/hip_radix_attention.py
@@ -1,10 +1,8 @@
 from __future__ import annotations
 
 """
-Support different attention backends.
-Now there are two backends: FlashInfer and Triton.
-FlashInfer is faster and Triton is easier to customize.
-Each backend supports two operators: extend (i.e. prefill with cached prefix) and decode.
+HiP Attention Backend for SGLang
+https://arxiv.org/pdf/2406.09827
 """
 
 import logging
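
For context, the docstring being replaced describes the contract every SGLang attention backend follows: an extend operator (prefill with a cached prefix) and a decode operator. A minimal sketch of that shape is given below; the class name, method names, and signatures are illustrative assumptions, not copied from this commit or from SGLang's base class.

import logging

logger = logging.getLogger(__name__)


class ExampleAttentionBackend:
    """Illustrative-only sketch of the two operators named in the old docstring."""

    def forward_extend(self, q, k, v, layer, forward_batch):
        # Extend (prefill with cached prefix): attend over the cached prefix
        # KV plus the newly appended tokens. (Hypothetical signature.)
        raise NotImplementedError

    def forward_decode(self, q, k, v, layer, forward_batch):
        # Decode: single-token step attending over the full cached KV.
        # (Hypothetical signature.)
        raise NotImplementedError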