Skip to content

Commit

Permalink
Merge branch 'main' into Mixtral8x7b_MoE_Config
Browse files Browse the repository at this point in the history
  • Loading branch information
Jacob0226 authored Nov 18, 2024
2 parents e49b6c4 + efb0432 commit f5d34d2
Show file tree
Hide file tree
Showing 3 changed files with 22 additions and 22 deletions.
1 change: 0 additions & 1 deletion benchmarks/P3L.py
Original file line number Diff line number Diff line change
Expand Up @@ -83,7 +83,6 @@ def vllm_init(args):
sampling_params = SamplingParams(n=1,
temperature=0.0,
top_p=1,
- use_beam_search=False,
ignore_eos=True,
ppl_measurement=True,
future_context=[],
Expand Down
3 changes: 2 additions & 1 deletion vllm/attention/backends/rocm_flash_attn.py
Original file line number Diff line number Diff line change
Expand Up @@ -619,7 +619,8 @@ def forward(
# QKV for prefill.
query = query[:num_prefill_tokens]

- if key is not None and value is not None:
+ if key is not None and value is not None \
+ and attn_type != AttentionType.ENCODER_DECODER:
key = key[:num_prefill_tokens]
value = value[:num_prefill_tokens]

Expand Down
40 changes: 20 additions & 20 deletions vllm/attention/ops/triton_flash_attention.py
Original file line number Diff line number Diff line change
Expand Up @@ -314,26 +314,26 @@ def attn_fwd(
sm_scale,
L,
Out,
- stride_qz,
- stride_qh,
- stride_qm,
- stride_qk,
- stride_kz,
- stride_kh,
- stride_kn,
- stride_kk,
- stride_vz,
- stride_vh,
- stride_vk,
- stride_vn,
- stride_oz,
- stride_oh,
- stride_om,
- stride_on,
- stride_bz,
- stride_bh,
- stride_bm,
- stride_bn,
+ stride_qz: tl.int64,
+ stride_qh: tl.int64,
+ stride_qm: tl.int64,
+ stride_qk: tl.int64,
+ stride_kz: tl.int64,
+ stride_kh: tl.int64,
+ stride_kn: tl.int64,
+ stride_kk: tl.int64,
+ stride_vz: tl.int64,
+ stride_vh: tl.int64,
+ stride_vk: tl.int64,
+ stride_vn: tl.int64,
+ stride_oz: tl.int64,
+ stride_oh: tl.int64,
+ stride_om: tl.int64,
+ stride_on: tl.int64,
+ stride_bz: tl.int64,
+ stride_bh: tl.int64,
+ stride_bm: tl.int64,
+ stride_bn: tl.int64,
cu_seqlens_q,
cu_seqlens_k,
dropout_p,
Expand Down

0 comments on commit f5d34d2

Please sign in to comment.