fix(llm): 修复模型部署失败时的状态更新问题
- 在 AsyncModelServiceService 和 BaseModelTaskService 中添加对部署失败的处理逻辑
- 修改 TrainHttpService 中的 modelDeploy 方法,增加错误处理和状态码检查
- 优化日志记录,便于排查问题
This commit is contained in:
parent
4b6fa46354
commit
0a1b8dcf0a
@ -84,9 +84,14 @@ public class AsyncModelServiceService {
|
||||
AigcModelDeploySaveReq aigcModelDeploySaveReq = new AigcModelDeploySaveReq(modelServiceDO.getBaseModelName(),
|
||||
"gpu");
|
||||
ModelDeployRespVO modelDeployRespVO = trainHttpService.modelDeploy(new HashMap<>(), aigcModelDeploySaveReq);
|
||||
updateObj.setStatus(1);
|
||||
updateObj.setJobId(modelDeployRespVO.getId());
|
||||
updateObj.setModelUrl(modelDeployRespVO.getPort()+DEFAULT_MODEL_URL_SUFFIX);
|
||||
if (modelDeployRespVO.getMessage().equals("error")){
|
||||
updateObj.setStatus(3);
|
||||
}else {
|
||||
updateObj.setStatus(1);
|
||||
updateObj.setJobId(modelDeployRespVO.getId());
|
||||
updateObj.setModelUrl(modelDeployRespVO.getPort()+DEFAULT_MODEL_URL_SUFFIX);
|
||||
}
|
||||
|
||||
modelServiceMapper.updateById(updateObj);
|
||||
}catch(Exception e){
|
||||
// updateObj.setStatus(3);
|
||||
|
@ -60,11 +60,13 @@ public class BaseModelTaskService {
|
||||
AigcModelDeploySaveReq aigcModelDeploySaveReq = new AigcModelDeploySaveReq(baseModelDO.getAigcModelName(),
|
||||
"gpu");
|
||||
ModelDeployRespVO modelDeployRespVO = trainHttpService.modelDeploy(new HashMap<>(), aigcModelDeploySaveReq);
|
||||
BaseModelSaveReqVO baseModelSaveReqVO = new BaseModelSaveReqVO();
|
||||
baseModelSaveReqVO.setId(baseModelDO.getId());
|
||||
baseModelSaveReqVO.setModelId(modelDeployRespVO.getId());
|
||||
baseModelSaveReqVO.setChatUrl(modelDeployRespVO.getPort() + DEFAULT_MODEL_URL_SUFFIX);
|
||||
baseModelService.updateBaseModel(new BaseModelSaveReqVO());
|
||||
if (!modelDeployRespVO.getMessage().equals("error")) {
|
||||
BaseModelSaveReqVO baseModelSaveReqVO = new BaseModelSaveReqVO();
|
||||
baseModelSaveReqVO.setId(baseModelDO.getId());
|
||||
baseModelSaveReqVO.setModelId(modelDeployRespVO.getId());
|
||||
baseModelSaveReqVO.setChatUrl(modelDeployRespVO.getPort() + DEFAULT_MODEL_URL_SUFFIX);
|
||||
baseModelService.updateBaseModel(new BaseModelSaveReqVO());
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
|
@ -244,7 +244,15 @@ public class TrainHttpService {
|
||||
log.info(" modelDeploy request:{}", JSON.toJSONString(req));
|
||||
String res = HttpUtils.post(modelDeploy, headers, JSON.toJSONString(req));
|
||||
log.info(" modelDeploy:{}", res);
|
||||
ModelDeployRespVO modelDeployRespVO = JSON.parseObject(res.getBytes(), ModelDeployRespVO.class);
|
||||
JSONObject parseObject = JSON.parseObject(res);
|
||||
ModelDeployRespVO modelDeployRespVO=new ModelDeployRespVO();
|
||||
|
||||
if(parseObject.getString("res").contains("error")){
|
||||
modelDeployRespVO.setMessage("error");
|
||||
return modelDeployRespVO;
|
||||
}
|
||||
modelDeployRespVO = JSON.parseObject(res.getBytes(), ModelDeployRespVO.class);
|
||||
|
||||
return modelDeployRespVO;
|
||||
}
|
||||
public AigcModelDeployVO modelUndeploy(Map<String, String> headers, Long deployId) {
|
||||
|
Loading…
x
Reference in New Issue
Block a user