[Bugfix] Allow prefill of assistant response when using mistral_common (#9446)
This commit is contained in:
parent
9d30a056e7
commit
5e443b594f
@ -166,6 +166,10 @@ class MistralTokenizer:
|
|||||||
tools: Optional[Dict[str, Any]] = None,
|
tools: Optional[Dict[str, Any]] = None,
|
||||||
**kwargs) -> List[int]:
|
**kwargs) -> List[int]:
|
||||||
|
|
||||||
|
last_message = messages[-1]
|
||||||
|
if last_message["role"] == "assistant":
|
||||||
|
last_message["prefix"] = True
|
||||||
|
|
||||||
request = ChatCompletionRequest(messages=messages,
|
request = ChatCompletionRequest(messages=messages,
|
||||||
tools=tools) # type: ignore[type-var]
|
tools=tools) # type: ignore[type-var]
|
||||||
encoded = self.mistral.encode_chat_completion(request)
|
encoded = self.mistral.encode_chat_completion(request)
|
||||||
|
|||||||
Loading…
Reference in New Issue
Block a user