diff --git a/backends/exllamav2/model.py b/backends/exllamav2/model.py index c2a084b..65689f4 100644 --- a/backends/exllamav2/model.py +++ b/backends/exllamav2/model.py @@ -1373,6 +1373,7 @@ class ExllamaV2Container(BaseModelContainer): min_new_tokens=params.min_tokens, gen_settings=gen_settings, stop_conditions=stop_conditions, + decode_special_tokens=True, filters=grammar_handler.filters, filter_prefer_eos=bool(grammar_handler.filters), return_probs=params.logprobs > 0,