From d9caf9acce2057297ff56ca564cdb93eb3def2ba Mon Sep 17 00:00:00 2001 From: Tiger Ren Date: Wed, 20 Nov 2024 15:52:38 +0800 Subject: [PATCH] =?UTF-8?q?=E7=9F=A5=E8=AF=86=E5=BA=93retrival=E4=BD=BF?= =?UTF-8?q?=E7=94=A8glm-4-plus,=E5=B9=B6=E4=B8=94=E8=AE=BE=E7=BD=AEmax=5Ft?= =?UTF-8?q?okens=3D4095?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- app/services/zhipu_kb_service.py | 16 +++++++++------- 1 file changed, 9 insertions(+), 7 deletions(-) diff --git a/app/services/zhipu_kb_service.py b/app/services/zhipu_kb_service.py index b0cba2c..b7c8a20 100644 --- a/app/services/zhipu_kb_service.py +++ b/app/services/zhipu_kb_service.py @@ -7,7 +7,7 @@ logger = logging.getLogger(__name__) class ZhipuKbService: def __init__(self): - self.model_name = "glm-4" + self.model_name = "glm-4-plus" self.app_secret_key = "d54f764a1d67c17d857bd3983b772016.GRjowY0fyiMNurLc" logger.info("ZhipuKbService initialized with model: %s", self.model_name) @@ -22,7 +22,7 @@ class ZhipuKbService: prompt_template = default_prompt try: response = client.chat.completions.create( - model="glm-4", + model=self.model_name, messages=[ {"role": "user", "content": message}, ], @@ -36,8 +36,9 @@ class ZhipuKbService: } ], stream=False, - temperature=0.01, - top_p=0.1, + max_tokens=4095, + temperature=0.01, # default=0.01 + top_p=0.1, #default=0.1 ) result = response.choices[0].message.content end_time = time.time() @@ -59,7 +60,7 @@ class ZhipuKbService: prompt_template = default_prompt try: response = client.chat.completions.create( - model="glm-4", + model=self.model_name, messages=messages, tools=[ { @@ -71,8 +72,9 @@ class ZhipuKbService: } ], stream=True, - temperature=0.01, - top_p=0.1, + max_tokens=4095, + temperature=0.01, # default=0.01 + top_p=0.1, #default=0.1 ) for chunk in response: yield chunk.choices[0].delta.content