Model: Add option to select backend

Changing the backend switches the container that's used.

Signed-off-by: kingbri <8082010+kingbri1@users.noreply.github.com>
This commit is contained in:
kingbri 2025-04-27 22:27:26 -04:00
parent 242f6b7d2a
commit 7c6a053747
4 changed files with 38 additions and 6 deletions

View file

@@ -74,6 +74,10 @@ model:
# Example: ['max_seq_len', 'cache_mode'].
use_as_default: []
# Backend to use for the model (default: exllamav2)
# Options: exllamav2, exllamav3
backend: exllamav2
# Max sequence length (default: Empty).
# Fetched from the model's base sequence length in config.json by default.
max_seq_len: