We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent db7fbe6 commit 6e53620 Copy full SHA for 6e53620
vllm_ascend/sample/rejection_sampler.py
@@ -147,8 +147,8 @@ def rejection_sample(
147
assert bonus_token_ids.is_contiguous()
148
assert target_probs.shape == (num_tokens, vocab_size)
149
150
- #Switch of Block Verify: when MTP>=2, using block verify for rejection sampler.
151
- using_block_verify = max_spec_len >= 2
+ # Switch for block verify: when MTP >= 3, use block verify in the rejection sampler.
+ using_block_verify = max_spec_len >= 3
152
153
# Create output buffer.
154
output_token_ids = torch.empty(
0 commit comments