Skip to content

Commit

Permalink
unconst
Browse files Browse the repository at this point in the history
  • Loading branch information
grimoire committed Dec 9, 2024
1 parent 240f352 commit a65007b
Showing 1 changed file with 2 additions and 2 deletions.
4 changes: 2 additions & 2 deletions lmdeploy/pytorch/kernels/cuda/flatten_kv_cache.py
Original file line number Diff line number Diff line change
Expand Up @@ -31,7 +31,7 @@ def _flatten_kv_cache(
stride_vos: tl.constexpr,
stride_vod: tl.constexpr,
stride_boff,
- OUT_SIZE: tl.constexpr,
+ OUT_SIZE,
HEAD_DIM_K: tl.constexpr,
HEAD_DIM_V: tl.constexpr,
BLOCK_BS: tl.constexpr,
Expand Down Expand Up @@ -124,7 +124,7 @@ def _flatten_kv_cache_quant(
stride_vod: tl.constexpr,
stride_boff,
quant_policy: tl.constexpr,
- OUT_SIZE: tl.constexpr,
+ OUT_SIZE,
HEAD_DIM_K: tl.constexpr,
HEAD_DIM_V: tl.constexpr,
BLOCK_BS: tl.constexpr,
Expand Down

0 comments on commit a65007b

Please sign in to comment.