We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent f92139f, commit 395d3f5. Copy full SHA for 395d3f5
examples/models/llama2/runner/runner.cpp
@@ -126,7 +126,7 @@ Error Runner::load() {
126
tokenizer_.get(),
127
text_decoder_runner_.get(),
128
metadata_.at(kUseKVCache),
129
- enable_parallel_prefill_);
+ metadata_.at(kEnableDynamicShape));
130
131
text_token_generator_ = std::make_unique<TextTokenGenerator>(
132
examples/models/llama2/runner/runner.h
@@ -45,7 +45,6 @@ class Runner {
45
46
private:
47
float temperature_;
48
- bool enable_parallel_prefill_;
49
bool shouldStop_{false};
50
51
// model
0 commit comments