模型调优,数据集参数修改
This commit is contained in:
parent
94f6f4c38f
commit
7fe7494e7d
@ -89,15 +89,29 @@ public class AsyncModelServiceService {
|
||||
* quantization:"float16"
|
||||
* replicas:1
|
||||
*/
|
||||
/**
|
||||
* {
|
||||
* "model": "string",
|
||||
* "inferredType": "gpu",
|
||||
* "cpu": 0,
|
||||
* "gpu": 1,
|
||||
* "replicas": 1,
|
||||
* "label": "cpu-aigc-model",
|
||||
* "quantization": "float16",
|
||||
* "maxGpuMemory": 0,
|
||||
* "modelWorker": ""
|
||||
* }
|
||||
*/
|
||||
ModelServiceDO modelServiceDO = modelServiceMapper.selectById(updateObj.getId());
|
||||
AigcModelDeploySaveReq aigcModelDeploySaveReq = new AigcModelDeploySaveReq(1,
|
||||
AigcModelDeploySaveReq aigcModelDeploySaveReq = new AigcModelDeploySaveReq(modelServiceDO.getBaseModelName(),
|
||||
1,
|
||||
updateObj.getGpuCount(),
|
||||
"cpu",
|
||||
"cpu-aigc-model",
|
||||
0,
|
||||
"",
|
||||
"float16", 1);
|
||||
AigcRespVO aigcRespVO = trainHttpService.modelDeploy(new HashMap<>(), aigcModelDeploySaveReq,modelServiceDO.getJobId());
|
||||
AigcRespVO aigcRespVO = trainHttpService.modelDeploy(new HashMap<>(), aigcModelDeploySaveReq);
|
||||
if (aigcRespVO.isSuccess()){
|
||||
updateObj.setStatus(1);
|
||||
}else {
|
||||
|
@ -240,11 +240,10 @@ public class TrainHttpService {
|
||||
return res;
|
||||
}
|
||||
|
||||
public AigcRespVO modelDeploy(Map<String, String> headers,AigcModelDeploySaveReq req,Long jobId){
|
||||
public AigcRespVO modelDeploy(Map<String, String> headers,AigcModelDeploySaveReq req){
|
||||
login(headers);
|
||||
String modelDeploy = llmBackendProperties.getModelDeploy();
|
||||
String url = String.format(modelDeploy,jobId);
|
||||
String res = HttpUtils.post(url, headers, JSON.toJSONString(req));
|
||||
String res = HttpUtils.post(modelDeploy, headers, JSON.toJSONString(req));
|
||||
log.info(" modelDeploy:{}", res);
|
||||
AigcRespVO aigcRespVO = JSON.parseObject(res, AigcRespVO.class);
|
||||
return aigcRespVO;
|
||||
|
@ -18,6 +18,8 @@ public class AigcModelDeploySaveReq {
|
||||
* quantization:"float16"
|
||||
* replicas:1
|
||||
*/
|
||||
|
||||
private String model;
|
||||
private Integer cpu;
|
||||
private Integer gpu;
|
||||
/**
|
||||
|
@ -293,7 +293,7 @@ llm:
|
||||
# 模型创建
|
||||
model_create: http://36.103.199.104:9000/api/models
|
||||
# 模型部署
|
||||
model_deploy: http://36.103.199.104:9000/api/models/%s/deploy
|
||||
model_deploy: http://36.103.199.104:5123/llm/deploy
|
||||
# 取消模型部署
|
||||
model_undeploy: http://36.103.199.104:9000/api/models/%s/undeploy
|
||||
#### 大模型对话
|
||||
|
Loading…
x
Reference in New Issue
Block a user