Skip to content

Commit 5e9e1a4

Browse files
taoruicheng and taoruicheng authored
fix: 修复使用中遇到的bug (#45)
* fix: 修复推理服务分页查询时的参数顺序异常问题,并增加根据状态过滤的逻辑
* fix: 修复大模型优化提示词的bug

---------

Co-authored-by: taoruicheng <taoruicheng@sensetime>
1 parent 1ad9ead commit 5e9e1a4

3 files changed

Lines changed: 23 additions & 15 deletions

File tree

back/src/parts/app/workflow_api.py

Lines changed: 13 additions & 12 deletions
Original file line numberDiff line numberDiff line change
@@ -772,26 +772,26 @@ def post(self):
772772
我需要你帮过滤用户的请求,判断请求是否和大模型提示语(prompt)有关
773773
774774
## 技能
775-
精准判断用户输入是否与生成大模型提示语(prompt)有关,若有关回复1,若无关恢复2
775+
精准判断用户输入是否与生成大模型提示语(prompt)有关,若有关回复:和prompt有关,若无关回复:和prompt无关
776776
777777
## 回复格式要求
778-
- 仅回复1或2
778+
- 仅回复"和prompt有关"或"和prompt无关"
779779
780780
### 示例
781781
#### 示例 1
782782
输入: 我感觉好无聊呀
783-
输出: 2
783+
输出: 和prompt无关
784784
785785
#### 示例 2
786786
输入: 帮我写个提示语,与医学科普相关
787-
输出: 1
787+
输出: 和prompt有关
788788
789789
#### 示例 3
790790
输入: 你是谁
791-
输出: 2
791+
输出: 和prompt无关
792792
793793
### 限制
794-
- 若遇到难以理解或把握不准的,统一回复2
794+
- 若遇到难以理解或把握不准的,统一回复: 和prompt无关
795795
"""
796796
prompt = """
797797
## 任务
@@ -830,10 +830,11 @@ def post(self):
830830
}, 400
831831
filter = llm.share(filter_prompt)
832832
filte_res = filter(query)
833-
if "2" in filte_res:
834-
ret = "输入与生成提示语无关,请重新组织语言"
835-
else:
833+
if "和prompt有关" in filte_res:
836834
ret = llm(query)
835+
else:
836+
ret = "输入与生成提示语无关,请重新组织语言。示例:帮我写个提示语,与医学科普相关。"
837+
837838
else:
838839
model = LazymodelOnlineModels.query.filter_by(
839840
model_key=model_name
@@ -855,10 +856,10 @@ def post(self):
855856
).prompt(prompt)
856857
filter = llm.share(filter_prompt)
857858
filte_res = filter(query)
858-
if "2" in filte_res:
859-
ret = "输入与生成提示语无关,请重新组织语言"
860-
else:
859+
if "和prompt有关" in filte_res:
861860
ret = llm(query)
861+
else:
862+
ret = "输入与生成提示语无关,请重新组织语言。示例:帮我写个提示语,与医学科普相关。"
862863
except Exception as e:
863864
msg = f"发生错误:{e}"
864865
msg = msg.replace("400 Bad Request:", "")

back/src/parts/inferservice/controller.py

Lines changed: 3 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -95,8 +95,9 @@ def post(self):
9595
status = data.get("status", [])
9696
user_id = data.get("user_id", [])
9797
tenant = data.get("tenant", "")
98+
# 调用InferService获取服务列表和分页信息
9899
result, pagination_info = self.infer_service.list_infer_model_service(
99-
page, per_page, qtype, search_name, status, user_id, tenant
100+
page=page, per_page=per_page, qtype=qtype, search_name=search_name, status=status, user_id=user_id, tenant=tenant
100101
)
101102

102103
return build_response(
@@ -221,7 +222,7 @@ def post(self):
221222
return jsonify({"error": "Model not found"})
222223
# 将新建的服务信息以JSON格式返回
223224
self.infer_service.create_infer_model_service(
224-
data.get("group_id"), group_info.model_id, data.get("services"),model_num_gpus
225+
data.get("group_id"), group_info.model_id, data.get("services")
225226
)
226227
return build_response(message="Service created successfully")
227228

back/src/parts/inferservice/service.py

Lines changed: 7 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -392,7 +392,13 @@ def _build_service_info(
392392
service_info_temp["deploy_method"] = get_service_info_map.get(
393393
"framework", ""
394394
)
395-
395+
# 根据status参数过滤服务信息
396+
if status:
397+
service_info = [
398+
info for info in service_info
399+
if info.get("status") in status
400+
]
401+
396402
return service_info
397403

398404
def list_infer_model_service(

0 commit comments

Comments
 (0)