Skip to content

Commit e63d49d

Browse files
committed
minor changes
Signed-off-by: leslie-fang25 <[email protected]>
1 parent 6d98f0a commit e63d49d

File tree

2 files changed

+1
-21
lines changed

2 files changed

+1
-21
lines changed

tensorrt_llm/executor/worker.py

Lines changed: 0 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -788,7 +788,6 @@ def notify_proxy_threads_to_quit():
788 788   "green")
789 789
790 790   try:
791     - print("---- worker_cls is: {}".format(worker_cls), flush=True)
792 791   worker: GenerationExecutorWorker = worker_cls(
793 792   engine,
794 793   executor_config,

tensorrt_llm/llmapi/llm.py

Lines changed: 1 addition & 20 deletions
Original file line numberDiff line numberDiff line change
@@ -37,7 +37,7 @@
37 37   from .llm_utils import (CachedModelLoader, KvCacheRetentionConfig,
38 38   LlmBuildStats, ModelLoader, _ModelRuntimeContext)
39 39   from .mpi_session import MpiPoolSession, external_mpi_comm_available
40    - from .tokenizer import (TokenizerBase, _xgrammar_tokenizer_info)
   40 + from .tokenizer import TokenizerBase, _xgrammar_tokenizer_info
41 41   # TODO[chunweiy]: move the following symbols back to utils scope, and remove the following import
42 42   from .utils import (append_docstring, exception_handler, get_device_count,
43 43   print_colored_debug, set_api_status)
@@ -959,27 +959,8 @@ def _build_model(self):
959 959
960 960   assert isinstance(self.args, TorchLlmArgs)
961 961
962     - # self._executor_config = tllm.ExecutorConfig(
963     - # max_beam_width=self.args.max_beam_width,
964     - # scheduler_config=PybindMirror.maybe_to_pybind(
965     - # self.args.scheduler_config),
966     - # max_batch_size=self.args.max_batch_size,
967     - # max_num_tokens=self.args.max_num_tokens,
968     - # gather_generation_logits=self.args.gather_generation_logits,
969     - # fail_fast_on_attention_window_too_large=getattr(
970     - # self.args, 'fail_fast_on_attention_window_too_large', False),
971     - # **kwargs)
972     -
973     - # self._executor_config = self.args.get_executor_config(self._hf_model_dir)
974     -
975 962   # TODO: revisit gather_context_logits
976 963   return_logits = self.args.gather_generation_logits
977     -
978     - print("---- self._executor_cls is: {}".format(self._executor_cls),
979     - flush=True)
980     - print("---- self._engine_dir is: {}".format(self._engine_dir),
981     - flush=True)
982     -
983 964   self._executor = self._executor_cls.create(
984 965   self._engine_dir,
985 966   executor_config=None,

0 commit comments

Comments
 (0)