Skip to content

Commit 1f885b9

Browse files
authored
Fix QNN runner failure

Reorder the constructor member initializers in LhdTokenGenerator and TokenGenerator.

Differential Revision: D78290436
Pull Request resolved: #12459
1 parent 7c70403 commit 1f885b9

File tree

2 files changed

+4
-4
lines changed

2 files changed

+4
-4
lines changed

examples/qualcomm/oss_scripts/llama/runner/lhd_token_generator.h

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -51,9 +51,9 @@ class LhdTokenGenerator : public TokenGenerator {
 metadata.use_int64_token},
 stats),
 metadata_(metadata),
-ngrams_pool_(metadata.vocab_size, metadata.ngram, metadata.gcap),
 lhd_branch_(metadata.ngram - 1, std::vector<int32_t>(metadata.window)),
-lhd_branch_prev_(metadata.window) {
+lhd_branch_prev_(metadata.window),
+ngrams_pool_(metadata.vocab_size, metadata.ngram, metadata.gcap) {
 ET_LOG(
 Info,
 "Use Lookahead decoding: ngram=%d, window=%d, gcap=%d",

examples/qualcomm/oss_scripts/llama/runner/token_generator.cpp

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -27,8 +27,8 @@ TokenGenerator::TokenGenerator(
 kv_manager_(kv_manager),
 method_name_(method_name),
 eos_ids_(std::move(eos_ids)),
-metadata_(metadata),
-stats_(stats) {
+stats_(stats),
+metadata_(metadata) {
 k_cache_in_.resize(metadata_.num_layers);
 v_cache_in_.resize(metadata_.num_layers);
 k_cache_out_.resize(metadata_.num_layers);

0 commit comments

Comments
 (0)