We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent e4c3aca commit 220ceb2 (Copy full SHA for 220ceb2)
lmdeploy/pytorch/engine/devices/ascend.py
@@ -17,7 +17,7 @@ def update_step_context(cls, step_context):
17
single_attention_mask = torch.logical_not(
18
torch.tril(
19
torch.ones(step_context.q_seq_length[i],
20
- (step_context.kv_seq_length[i] + 31) & (~31),
+ step_context.block_offsets.shape[1] * block_size,
21
dtype=torch.bool).cuda(),
22
diagonal=step_context.kv_seq_length[i] -
23
step_context.q_seq_length[i],
0 commit comments