Model: Fix usage stats in non-streaming gens
The wrong key was being returned from the model to the API.

Signed-off-by: kingbri <bdashore3@proton.me>
This commit is contained in:
parent
213430a122
commit
e4bb709305
1 changed file with 1 addition and 1 deletion
|
|
@@ -656,7 +656,7 @@ class ExllamaV2Container:
|
|||
joined_generation["prompt_tokens"] = unwrap(
|
||||
generations[-1].get("prompt_tokens"), 0
|
||||
)
|
||||
- joined_generation["generation_tokens"] = unwrap(
|
||||
+ joined_generation["generated_tokens"] = unwrap(
|
||||
generations[-1].get("generated_tokens"), 0
|
||||
)
|
||||
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue