We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 732edd8 · commit b05f5ef · Copy full SHA for b05f5ef
xllm/core/runtime/speculative_worker_impl.cpp
@@ -260,7 +260,7 @@ std::optional<ForwardOutput> SpeculativeWorkerImpl::step_prefill(
260
inputs.micro_inputs[i].input_params.embedding_ids.end());
261
}
262
263
- if (!inputs.concated_sampling_params.selected_token_idxes.defined()) {
+ if (inputs.concated_sampling_params.selected_token_idxes.defined()) {
264
embeddings = embeddings.index_select(
265
/*dim=*/0, inputs.concated_sampling_params.selected_token_idxes);
266
CHECK_EQ(embeddings.size(0), output.sample_output.next_tokens.size(0));
0 commit comments