API: Format and fix message naming

Signed-off-by: kingbri <8082010+kingbri1@users.noreply.github.com>
This commit is contained in:
kingbri 2025-04-28 22:36:30 -04:00
parent 9157be3e34
commit 3960612d38
3 changed files with 9 additions and 17 deletions

View file

@@ -328,9 +328,7 @@ async def stream_generate_chat_completion(
for idx in range(0, data.n):
task_gen_params = data.model_copy(deep=True)
request_id = _parse_gen_request_id(
data.n, request.state.id, idx
)
request_id = _parse_gen_request_id(data.n, request.state.id, idx)
gen_task = asyncio.create_task(
_stream_collector(
@@ -421,10 +419,10 @@ async def generate_chat_completion(
gen_tasks: List[asyncio.Task] = []
try:
logger.info(f"Received chat completion request {request.state.id}")
for idx in range(0, data.n):
request_id = _parse_gen_request_id(
data.n, request.state.id, idx
)
request_id = _parse_gen_request_id(data.n, request.state.id, idx)
gen_tasks.append(
asyncio.create_task(
@@ -491,9 +489,7 @@ async def generate_tool_calls(
data, current_generations
)
request_id = _parse_gen_request_id(
data.n, request.state.id, idx
)
request_id = _parse_gen_request_id(data.n, request.state.id, idx)
gen_tasks.append(
asyncio.create_task(

View file

@@ -202,9 +202,7 @@ async def stream_generate_completion(
for idx in range(0, data.n):
task_gen_params = data.model_copy(deep=True)
request_id = _parse_gen_request_id(
data.n, request.state.id, idx
)
request_id = _parse_gen_request_id(data.n, request.state.id, idx)
gen_task = asyncio.create_task(
_stream_collector(
@@ -263,13 +261,11 @@ async def generate_completion(
gen_tasks: List[asyncio.Task] = []
try:
logger.info(f"Recieved completion request {request.state.id}")
logger.info(f"Received completion request {request.state.id}")
for idx in range(0, data.n):
task_gen_params = data.model_copy(deep=True)
request_id = _parse_gen_request_id(
data.n, request.state.id, idx
)
request_id = _parse_gen_request_id(data.n, request.state.id, idx)
gen_tasks.append(
asyncio.create_task(

View file

@@ -38,7 +38,7 @@ def float_list_to_base64(float_array: np.ndarray) -> str:
async def get_embeddings(data: EmbeddingsRequest, request: Request) -> dict:
model_path = model.embeddings_container.model_dir
logger.info(f"Recieved embeddings request {request.state.id}")
logger.info(f"Received embeddings request {request.state.id}")
if not isinstance(data.input, list):
data.input = [data.input]