Tree: Format

This commit is contained in:
DocShotgun 2024-05-26 15:48:18 -07:00
parent 767e6a798a
commit 7ab7ffd562
2 changed files with 2 additions and 4 deletions

View file

@@ -85,7 +85,7 @@ def add_model_args(parser: argparse.ArgumentParser):
model_group.add_argument(
"--cache-size",
type=int,
- help="The size of the prompt cache (in number of tokens) to allocate"
+ help="The size of the prompt cache (in number of tokens) to allocate",
)
model_group.add_argument(
"--rope-scale", type=float, help="Sets rope_scale or compress_pos_emb"

View file

@@ -74,9 +74,7 @@ class ModelLoadRequest(BaseModel):
examples=[4096],
)
cache_size: Optional[int] = Field(
- description=(
- "Number in tokens, must be greater than or equal to max_seq_len"
- ),
+ description=("Number in tokens, must be greater than or equal to max_seq_len"),
default=None,
examples=[4096],
)