Initial

2023-11-09 21:27:45 -06:00 · 2023-11-09 21:27:45 -06:00 · b967e2e604
commit b967e2e604
4 changed files with 80 additions and 0 deletions
--- a/main.py
+++ b/main.py
@ -0,0 +1,39 @@
+# main.py
+
+from fastapi import FastAPI, HTTPException
+from pydantic import BaseModel
+from llm import ModelManager
+from uvicorn import run
+
+app = FastAPI()
+
+# Example: Using a different model directory
+modelManager = ModelManager("/home/david/Models/SynthIA-7B-v2.0-5.0bpw-h6-exl2")
+
+class TextRequest(BaseModel):
+    model: str
+    messages: list[dict]
+    temperature: float
+
+class TextResponse(BaseModel):
+    response: str
+    generation_time: str
+
+@app.post("/generate-text", response_model=TextResponse)
+def generate_text(request: TextRequest):
+    try:
+        #model_path = request.model  # You can use this path to load a specific model if needed
+        messages = request.messages
+        #temperature = request.temperature
+
+        # Assuming you need to extract the user's message from the messages list
+        user_message = next(msg["content"] for msg in messages if msg["role"] == "user")
+
+        # You can then use user_message as the prompt for generation
+        output, generation_time = modelManager.generate_text(user_message)
+        return {"response": output, "generation_time": generation_time}
+    except RuntimeError as e:
+        raise HTTPException(status_code=500, detail=str(e))
+
+if __name__ == "__main__":
+    run(app, host="0.0.0.0", port=8012, reload=True)