Skip to content

Commit 1677e90

Browse files
authored
Merge pull request #1439 from kvcache-ai/qiyuxinlin-patch-3
Update balance_serve.py
2 parents dc59af6 + a2e95e4 commit 1677e90

File tree

1 file changed

+1
-1
lines changed

1 file changed

+1
-1
lines changed

ktransformers/server/backend/interfaces/balance_serve.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -445,7 +445,7 @@ async def inference(self, local_messages, thread_id: str, temperature: Optional[
445 445
query_add.query_length = query_length
446 446
profiler.set_counter("prefill", query_length)
447 447
#@TODO add server
448-
stop_criteria = [self.tokenizer.encode(self.tokenizer.eos_token, add_special_tokens=False),self.tokenizer.encode("<|im_end|>")]
448+
stop_criteria = [self.tokenizer.encode(self.tokenizer.eos_token, add_special_tokens=False),self.tokenizer.encode("<|im_end|>", add_special_tokens=True)]
449 449
query_add.stop_criteria = stop_criteria
450 450

451 451
temperature, top_p, max_new_tokens = self.get_params(temperature, top_p, max_tokens, max_completion_tokens)

0 commit comments

Comments
 (0)