feat: workflows for formatting/linting (#35)
* add github workflows for pylint and yapf
* yapf
* docstrings for auth
* fix auth.py
* fix generators.py
* fix gen_logging.py
* fix main.py
* fix model.py
* fix templating.py
* fix utils.py
* update formatting.sh to include subdirs for pylint
* fix model_test.py
* fix wheel_test.py
* rename utils to utils_oai
* fix OAI/utils_oai.py
* fix completion.py
* fix token.py
* fix lora.py
* fix common.py
* add pylintrc and fix model.py
* finish up pylint
* fix attribute error
* main.py formatting
* add formatting batch script
* Main: Remove unnecessary global
  Linter suggestion.
  Signed-off-by: kingbri <bdashore3@proton.me>
* switch to ruff
* Formatting + Linting: Add ruff.toml
  Signed-off-by: kingbri <bdashore3@proton.me>
* Formatting + Linting: Switch scripts to use ruff
  Also remove the file and recent file change functions from both scripts.
  Signed-off-by: kingbri <bdashore3@proton.me>
* Tree: Format and lint
  Signed-off-by: kingbri <bdashore3@proton.me>
* Scripts + Workflows: Format
  Signed-off-by: kingbri <bdashore3@proton.me>
* Tree: Remove pylint flags
  We use ruff now.
  Signed-off-by: kingbri <bdashore3@proton.me>
* Tree: Format
  Signed-off-by: kingbri <bdashore3@proton.me>
* Formatting: Line length is 88
  Use the same value as Black.
  Signed-off-by: kingbri <bdashore3@proton.me>
* Tree: Format
  Update to new line length rules.
  Signed-off-by: kingbri <bdashore3@proton.me>

---------

Authored-by: AlpinDale <52078762+AlpinDale@users.noreply.github.com>
Co-authored-by: kingbri <bdashore3@proton.me>
This commit is contained in:
parent a14abfe21c
commit fa47f51f85
22 changed files with 1210 additions and 511 deletions
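Note: the rewritten formatting scripts are not part of the excerpt below, which covers only the model types module. As a minimal sketch of the workflow the commit message describes (one ruff pass for linting, one for formatting), assuming a current ruff CLI; the script name and invocation details here are hypothetical, not the repository's actual scripts:

#!/usr/bin/env python3
"""Hypothetical sketch of a ruff-based formatting/linting script."""
import subprocess
import sys


def run(*cmd: str) -> int:
    """Echo a command, run it, and return its exit code."""
    print("+", " ".join(cmd))
    return subprocess.call(cmd)


if __name__ == "__main__":
    # Lint the tree and apply safe autofixes, then format in place.
    # Rule selection and line length come from ruff.toml (line-length = 88).
    status = run("ruff", "check", "--fix", ".")
    status |= run("ruff", "format", ".")
    sys.exit(status)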
@@ -1,19 +1,29 @@
-from pydantic import BaseModel, Field, ConfigDict
+""" Contains model card types. """
+from time import time
+from typing import List, Optional
+
+from pydantic import BaseModel, Field, ConfigDict
+
 from gen_logging import LogConfig
 
 
 class ModelCardParameters(BaseModel):
-    # Safe to do this since it's guaranteed to fetch a max seq len from model_container
+    """Represents model card parameters."""
+
+    # Safe to do this since it's guaranteed to fetch a max seq len
+    # from model_container
     max_seq_len: Optional[int] = None
     rope_scale: Optional[float] = 1.0
     rope_alpha: Optional[float] = 1.0
     cache_mode: Optional[str] = "FP16"
     prompt_template: Optional[str] = None
     num_experts_per_token: Optional[int] = None
-    draft: Optional['ModelCard'] = None
+    draft: Optional["ModelCard"] = None
 
 
 class ModelCard(BaseModel):
+    """Represents a single model card."""
+
     id: str = "test"
     object: str = "model"
     created: int = Field(default_factory=lambda: int(time()))
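One detail worth noting in the hunk above: ModelCardParameters.draft annotates ModelCard as the string "ModelCard" because that class is defined later in the module. A minimal standalone sketch of how such a forward reference behaves under pydantic v2 (the ConfigDict usage later in this diff implies v2); the stand-in classes here are illustrative, not the project's code:

from typing import Optional

from pydantic import BaseModel


class Parameters(BaseModel):
    # Forward reference: Card does not exist yet at class-creation time.
    draft: Optional["Card"] = None


class Card(BaseModel):
    id: str = "test"


# Pydantic v2 resolves the string annotation lazily; calling
# model_rebuild() once both classes exist makes the resolution explicit.
Parameters.model_rebuild()

params = Parameters(draft=Card(id="draft-model"))
print(params.draft.id)  # -> draft-model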
@@ -21,26 +31,47 @@ class ModelCard(BaseModel):
     logging: Optional[LogConfig] = None
     parameters: Optional[ModelCardParameters] = None
 
 
 class ModelList(BaseModel):
+    """Represents a list of model cards."""
+
     object: str = "list"
     data: List[ModelCard] = Field(default_factory=list)
 
 
 class DraftModelLoadRequest(BaseModel):
+    """Represents a draft model load request."""
+
     draft_model_name: str
     draft_rope_scale: Optional[float] = 1.0
-    draft_rope_alpha: Optional[float] = Field(description = "Automatically calculated if not present", default = None)
+    draft_rope_alpha: Optional[float] = Field(
+        description="Automatically calculated if not present", default=None
+    )
 
 
+# TODO: Unify this with ModelCardParams
 class ModelLoadRequest(BaseModel):
+    """Represents a model load request."""
+
     name: str
 
     # Max seq len is fetched from config.json of the model by default
-    max_seq_len: Optional[int] = Field(description = "Leave this blank to use the model's base sequence length", default = None)
-    override_base_seq_len: Optional[int] = Field(description = "Overrides the model's base sequence length. Leave blank if unsure", default = None)
+    max_seq_len: Optional[int] = Field(
+        description="Leave this blank to use the model's base sequence length",
+        default=None,
+    )
+    override_base_seq_len: Optional[int] = Field(
+        description=(
+            "Overrides the model's base sequence length. " "Leave blank if unsure"
+        ),
+        default=None,
+    )
     gpu_split_auto: Optional[bool] = True
     gpu_split: Optional[List[float]] = Field(default_factory=list)
     rope_scale: Optional[float] = 1.0
-    rope_alpha: Optional[float] = Field(description = "Automatically calculated if not present", default = None)
+    rope_alpha: Optional[float] = Field(
+        description="Automatically calculated if not present", default=None
+    )
     no_flash_attention: Optional[bool] = False
     # low_mem: Optional[bool] = False
     cache_mode: Optional[str] = "FP16"
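The Field(description=...) entries above exist so the request schema documents itself, for example in generated API docs. A quick sketch of how a description surfaces, using a standalone stand-in model and pydantic v2's model_json_schema():

from typing import Optional

from pydantic import BaseModel, Field


class LoadRequest(BaseModel):
    name: str
    max_seq_len: Optional[int] = Field(
        description="Leave this blank to use the model's base sequence length",
        default=None,
    )


# The description lands on the property in the generated JSON schema.
schema = LoadRequest.model_json_schema()
print(schema["properties"]["max_seq_len"]["description"])
# -> Leave this blank to use the model's base sequence length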
@@ -48,9 +79,12 @@ class ModelLoadRequest(BaseModel):
     num_experts_per_token: Optional[int] = None
     draft: Optional[DraftModelLoadRequest] = None
 
 
 class ModelLoadResponse(BaseModel):
-    model_config = ConfigDict(protected_namespaces = [])
+    """Represents a model load response."""
+
+    # Avoids pydantic namespace warning
+    model_config = ConfigDict(protected_namespaces=[])
 
     model_type: str = "model"
     module: int
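For context on that protected_namespaces line: pydantic v2 reserves the model_ prefix for its own attributes, so a field named model_type triggers a warning at class definition time unless the check is relaxed. A standalone sketch (the diff passes []; an empty tuple is the equivalent canonical form):

from pydantic import BaseModel, ConfigDict


class Noisy(BaseModel):
    # Defining this class emits a UserWarning: the field name
    # "model_type" collides with pydantic's protected "model_" namespace.
    model_type: str = "model"


class Quiet(BaseModel):
    # Relaxing protected_namespaces silences the warning for this model.
    model_config = ConfigDict(protected_namespaces=())

    model_type: str = "model"


print(Quiet().model_type)  # -> model, with no warning emitted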