Exl3: fix add_bos in generator

This commit is contained in:
gakada
2025-05-17 19:10:49 +09:00
committed by GitHub
parent 81170eee00
commit ba6248eec0

View File

@@ -844,7 +844,7 @@ class ExllamaV3Container(BaseModelContainer):
job = AsyncJob(
self.generator,
sampler=sampler,
-input_ids=self.tokenizer.encode(prompt, add_bos=False),
+input_ids=input_ids,
max_new_tokens=max_tokens,
stop_conditions=stop_conditions,
banned_strings=params.banned_strings,