From 33dcc4c152d580b3e701ef5b345f8813fadb8977 Mon Sep 17 00:00:00 2001 From: Soulter <905617992@qq.com> Date: Sat, 30 Sep 2023 15:06:57 +0800 Subject: [PATCH] =?UTF-8?q?perf:=20openai=E6=A8=A1=E5=9E=8B=E8=B6=85?= =?UTF-8?q?=E9=99=90=E6=97=B6=E6=88=AA=E6=96=AD=E6=B6=88=E6=81=AF=EF=BC=88?= =?UTF-8?q?0.75x=EF=BC=89?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- model/provider/provider_openai_official.py | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/model/provider/provider_openai_official.py b/model/provider/provider_openai_official.py index 978f1f870..2e7e6987e 100644 --- a/model/provider/provider_openai_official.py +++ b/model/provider/provider_openai_official.py @@ -139,9 +139,11 @@ class ProviderOpenAIOfficial(Provider): else: break elif 'maximum context length' in str(e): - gu.log("token超限, 清空对应缓存") + gu.log("token超限, 清空对应缓存,并进行消息0.75倍截断") self.session_dict[session_id] = [] + prompt = prompt[:int(len(prompt)*0.75)] cache_data_list, new_record, req = self.wrap(prompt, session_id) + elif 'Limit: 3 / min. Please try again in 20s.' in str(e) or "OpenAI response error" in str(e): time.sleep(30) else: