增加缓存层提高性能

This commit is contained in:
UnCLAS-Prommer
2025-08-09 11:40:29 +08:00
parent 2ea4c75e9c
commit d65f90ee49
2 changed files with 14 additions and 9 deletions

View File

@@ -1,5 +1,4 @@
import re
import copy
import asyncio
import time
@@ -249,7 +248,7 @@ class LLMRequest:
)
model_info = model_config.get_model_info(least_used_model_name)
api_provider = model_config.get_provider(model_info.api_provider)
client = client_registry.get_client_class(api_provider.client_type)(copy.deepcopy(api_provider))
client = client_registry.get_client_class_instance(api_provider)
logger.debug(f"选择请求模型: {model_info.name}")
total_tokens, penalty, usage_penalty = self.model_usage[model_info.name]
self.model_usage[model_info.name] = (total_tokens, penalty, usage_penalty + 1) # 增加使用惩罚值防止连续使用