修改硅基智能模型推理能力代码

This commit is contained in:
Samon Yu 2025-04-17 22:42:06 +08:00
parent 705064d747
commit 2a5d6e20cf
1 changed file with 15 additions and 32 deletions

View File

@@ -1409,14 +1409,14 @@ for model in [m for m in AVAIL_LLM_MODELS if m.startswith("siliconflow-")]:
try: try:
siliconflow_noui, siliconflow_ui = get_predict_function( siliconflow_noui, siliconflow_ui = get_predict_function(
api_key_conf_name="SILICONFLOW_API_KEY", api_key_conf_name="SILICONFLOW_API_KEY",
max_output_token=8192, # max_tokens 的说明https://docs.siliconflow.cn/cn/faqs/misc
max_output_token=4096,
disable_proxy=False, disable_proxy=False,
# 去除前缀 # 去除前缀
model_remove_prefix = ["siliconflow-"] model_remove_prefix = ["siliconflow-"]
) )
# 判断是否具有推理能力 # 判断是否具有推理能力
enable_reasoning = any(item in model for item in inference_model_series) enable_reasoning = any(item in model for item in inference_model_series)
if enable_reasoning:
model_info.update( model_info.update(
{ {
model: { model: {
@@ -1424,29 +1424,12 @@ for model in [m for m in AVAIL_LLM_MODELS if m.startswith("siliconflow-")]:
"fn_without_ui": siliconflow_noui, "fn_without_ui": siliconflow_noui,
"endpoint": siliconflow_endpoint, "endpoint": siliconflow_endpoint,
"can_multi_thread": True, "can_multi_thread": True,
"max_token": 32000, "enable_reasoning": enable_reasoning,
"tokenizer": tokenizer_gpt35,
"token_cnt": get_token_num_gpt35,
"enable_reasoning": True,
}, },
} }
) )
logger.info(f" siliconflow模型 {model} 已加载") logger.info(f" siliconflow 模型 {model} 已加载")
else:
model_info.update(
{
model: {
"fn_with_ui": siliconflow_ui,
"fn_without_ui": siliconflow_noui,
"endpoint": siliconflow_endpoint,
"can_multi_thread": True,
"max_token": 32000,
"tokenizer": tokenizer_gpt35,
"token_cnt": get_token_num_gpt35,
},
}
)
logger.info(f" siliconflow模型 {model} 已加载")
except: except:
logger.error(trimmed_format_exc()) logger.error(trimmed_format_exc())