OAI: Keep behavior consistent between chat completion and encode

* When vision is not enabled, only the first text block is kept in message.content if it is a list
2024-11-19 12:40:00 -08:00 · 2024-11-19 12:40:00 -08:00 · 731a345cfc
commit 731a345cfc
parent 27d9af50a8
1 changed files with 14 additions and 0 deletions
--- a/endpoints/core/router.py
+++ b/endpoints/core/router.py
@ -379,6 +379,20 @@ async def encode_tokens(data: TokenEncodeRequest) -> TokenEncodeResponse:
        if model.container.use_vision:
            data.text, embeddings = await preprocess_vision_request(data.text)

+        # Keeping behavior consistent with format_prompt_with_template
+        # Deal with list in messages.content
+        # Just replace the content list with the very first text message
+        for message in data.text:
+            if isinstance(message["content"], list):
+                message["content"] = next(
+                    (
+                        content["text"]
+                        for content in message["content"]
+                        if content["type"] == "text"
+                    ),
+                    "",
+                )
+
        special_tokens_dict = model.container.get_special_tokens(
            unwrap(data.add_bos_token, True)
        )