We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 2d98747 commit f7a4465 — Copy full SHA for f7a4465
tests/integration/defs/accuracy/accuracy_core.py
@@ -303,7 +303,8 @@ class GSM8K(AccuracyTask):
303
MAX_OUTPUT_LEN = 256
304
305
EVALUATOR_CLS = tensorrt_llm.evaluate.GSM8K
306
- EVALUATOR_KWARGS = dict(dataset_path=DATASET_DIR, random_seed=0)
+ EVALUATOR_KWARGS = dict(dataset_path=DATASET_DIR, random_seed=0,
307
+ apply_chat_template=False)
308
309
EVALUATE_KWARGS = dict(scores_filter=None)
310
0 commit comments