Merge pull request #346 from gakada/main

Exl3: some models aren't functional without add_bos?
This commit is contained in:
Brian 2025-05-17 22:05:15 -04:00 committed by GitHub
commit 729caaeddc
No known key found for this signature in database
GPG key ID: B5690EEEBB952194

View file

@@ -844,7 +844,7 @@ class ExllamaV3Container(BaseModelContainer):
job = AsyncJob(
self.generator,
sampler=sampler,
-input_ids=self.tokenizer.encode(prompt, add_bos=False),
+input_ids=input_ids,
max_new_tokens=max_tokens,
stop_conditions=stop_conditions,
banned_strings=params.banned_strings,