修改硅基智能模型推理能力代码

This commit is contained in:
Samon Yu 2025-04-17 22:42:06 +08:00
parent 705064d747
commit 2a5d6e20cf
1 changed file with 15 additions and 32 deletions

View File

@@ -1409,44 +1409,27 @@ for model in [m for m in AVAIL_LLM_MODELS if m.startswith("siliconflow-")]:
try: try:
siliconflow_noui, siliconflow_ui = get_predict_function( siliconflow_noui, siliconflow_ui = get_predict_function(
api_key_conf_name="SILICONFLOW_API_KEY", api_key_conf_name="SILICONFLOW_API_KEY",
max_output_token=8192, # max_tokens 的说明https://docs.siliconflow.cn/cn/faqs/misc
max_output_token=4096,
disable_proxy=False, disable_proxy=False,
# 去除前缀 # 去除前缀
model_remove_prefix = ["siliconflow-"] model_remove_prefix = ["siliconflow-"]
) )
# 判断是否具有推理能力 # 判断是否具有推理能力
enable_reasoning = any(item in model for item in inference_model_series) enable_reasoning = any(item in model for item in inference_model_series)
if enable_reasoning: model_info.update(
model_info.update( {
{ model: {
model: { "fn_with_ui": siliconflow_ui,
"fn_with_ui": siliconflow_ui, "fn_without_ui": siliconflow_noui,
"fn_without_ui": siliconflow_noui, "endpoint": siliconflow_endpoint,
"endpoint": siliconflow_endpoint, "can_multi_thread": True,
"can_multi_thread": True, "enable_reasoning": enable_reasoning,
"max_token": 32000, },
"tokenizer": tokenizer_gpt35, }
"token_cnt": get_token_num_gpt35, )
"enable_reasoning": True, logger.info(f" siliconflow 模型 {model} 已加载")
},
}
)
logger.info(f" siliconflow模型 {model} 已加载")
else:
model_info.update(
{
model: {
"fn_with_ui": siliconflow_ui,
"fn_without_ui": siliconflow_noui,
"endpoint": siliconflow_endpoint,
"can_multi_thread": True,
"max_token": 32000,
"tokenizer": tokenizer_gpt35,
"token_cnt": get_token_num_gpt35,
},
}
)
logger.info(f" siliconflow模型 {model} 已加载")
except: except:
logger.error(trimmed_format_exc()) logger.error(trimmed_format_exc())