Browse Source

Merge pull request '#2501 自定义镜像的npu训练任务创建新版本会Failed' (#2503) from zouap into V20220718

Reviewed-on: https://git.openi.org.cn/OpenI/aiforge/pulls/2503
Reviewed-by: lewis <747342561@qq.com>
pull/2526/head
lewis 2 years ago
parent
commit
510369112b
1 changed file with 7 additions and 1 deletion
  1. +7
    -1
      routers/repo/modelarts.go

+ 7
- 1
routers/repo/modelarts.go View File

@@ -1220,7 +1220,13 @@ func getUserCommand(engineId int, req *modelarts.GenerateTrainJobReq) (string, s
userImageUrl := "" userImageUrl := ""
userCommand := "" userCommand := ""
if engineId < 0 { if engineId < 0 {
userCommand = "/bin/bash /home/work/run_train.sh 's3://" + req.CodeObsPath + "' 'code/" + req.BootFile + "' '/tmp/log/train.log' --'data_url'='s3://" + req.DataUrl + "' --'train_url'='s3://" + req.TrainUrl + "'"
tmpCodeObsPath := strings.Trim(req.CodeObsPath, "/")
tmpCodeObsPaths := strings.Split(tmpCodeObsPath, "/")
lastCodeDir := "code"
if len(tmpCodeObsPaths) > 0 {
lastCodeDir = tmpCodeObsPaths[len(tmpCodeObsPaths)-1]
}
userCommand = "/bin/bash /home/work/run_train.sh 's3://" + req.CodeObsPath + "' '" + lastCodeDir + "/" + req.BootFile + "' '/tmp/log/train.log' --'data_url'='s3://" + req.DataUrl + "' --'train_url'='s3://" + req.TrainUrl + "'"
var versionInfos modelarts.VersionInfo var versionInfos modelarts.VersionInfo
if err := json.Unmarshal([]byte(setting.EngineVersions), &versionInfos); err != nil { if err := json.Unmarshal([]byte(setting.EngineVersions), &versionInfos); err != nil {
log.Info("json parse err." + err.Error()) log.Info("json parse err." + err.Error())


Loading…
Cancel
Save