Skip to content

Commit 27cf6cc

Browse files
committed
feat: add multi stream concurrent execution for rec_model
1 parent 138caf7 commit 27cf6cc

12 files changed

+1035
-3
lines changed

xllm/core/common/global_flags.cpp

Lines changed: 11 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -478,6 +478,17 @@ DEFINE_bool(enable_constrained_decoding,
478478
"that the output meets specific format or structural requirements "
479479
"through pre-defined rules.");
480480

481+
// --- concurrent llm worker config ---
482+
DEFINE_uint32(llm_worker_max_concurrency,
483+
1,
484+
"Concurrency for llm worker parallel execution. A value less than "
485+
"or equal to 1 disables the concurrent llm worker.");
486+
487+
// --- fixedsteps scheduler config ---
488+
DEFINE_bool(enable_fixedsteps_scheduler,
489+
false,
490+
"Whether to use the fixedsteps scheduler.");
491+
481492
#if defined(USE_NPU)
482493
DEFINE_string(
483494
npu_kernel_backend,

xllm/core/common/global_flags.h

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -235,6 +235,9 @@ DECLARE_double(dit_cache_residual_diff_threshold);
235235

236236
DECLARE_bool(enable_constrained_decoding);
237237

238+
DECLARE_uint32(llm_worker_max_concurrency);
239+
240+
DECLARE_bool(enable_fixedsteps_scheduler);
238241
#if defined(USE_NPU)
239242
DECLARE_string(npu_kernel_backend);
240243
#endif

xllm/core/runtime/CMakeLists.txt

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -18,6 +18,7 @@ cc_library(
1818
worker.h
1919
worker_impl.h
2020
llm_worker_impl.h
21+
concurrent_llm_worker_impl.h
2122
vlm_worker_impl.h
2223
dit_worker.h
2324
embed_worker_impl.h
@@ -34,6 +35,7 @@ cc_library(
3435
worker.cpp
3536
worker_impl.cpp
3637
llm_worker_impl.cpp
38+
concurrent_llm_worker_impl.cpp
3739
vlm_worker_impl.cpp
3840
dit_worker.cpp
3941
embed_worker_impl.cpp

0 commit comments

Comments
 (0)