diff --git a/csrc/cache_kernels.cu b/csrc/cache_kernels.cu index d06eac2b..0b3f6fc8 100644 --- a/csrc/cache_kernels.cu +++ b/csrc/cache_kernels.cu @@ -350,8 +350,8 @@ __global__ void concat_and_cache_mla_kernel( } // namespace vllm -// KV_T is the stored data type of kv-cache. -// CACHE_T is the data type of key and value tensors. +// KV_T is the data type of key and value tensors. +// CACHE_T is the stored data type of kv-cache. // KV_DTYPE is the real data type of kv-cache. #define CALL_RESHAPE_AND_CACHE(KV_T, CACHE_T, KV_DTYPE) \ vllm::reshape_and_cache_kernel \ @@ -393,8 +393,8 @@ void reshape_and_cache( CALL_RESHAPE_AND_CACHE) } -// KV_T is the stored data type of kv-cache. -// CACHE_T is the data type of key and value tensors. +// KV_T is the data type of key and value tensors. +// CACHE_T is the stored data type of kv-cache. // KV_DTYPE is the real data type of kv-cache. #define CALL_RESHAPE_AND_CACHE_FLASH(KV_T, CACHE_T, KV_DTYPE) \ vllm::reshape_and_cache_flash_kernel \ @@ -446,8 +446,8 @@ void reshape_and_cache_flash( CALL_RESHAPE_AND_CACHE_FLASH); } -// KV_T is the stored data type of kv-cache. -// CACHE_T is the data type of key and value tensors. +// KV_T is the data type of key and value tensors. +// CACHE_T is the stored data type of kv-cache. // KV_DTYPE is the real data type of kv-cache. #define CALL_CONCAT_AND_CACHE_MLA(KV_T, CACHE_T, KV_DTYPE) \ vllm::concat_and_cache_mla_kernel \