Browse Source

Merge pull request 'dataMount' (#3395) from dataMount into V20221214

Reviewed-on: https://openi.pcl.ac.cn/OpenI/aiforge/pulls/3395
Reviewed-by: ychao_1983 <ychao_1983@sina.com>
pull/3396/head
ychao_1983 2 years ago
parent
commit
50d500973b
4 changed files with 40 additions and 5 deletions
  1. +15
    -0
      models/cloudbrain.go
  2. +16
    -4
      modules/modelarts/modelarts.go
  3. +3
    -1
      modules/modelarts/resty.go
  4. +6
    -0
      modules/setting/setting.go

+ 15
- 0
models/cloudbrain.go View File

@@ -1061,6 +1061,9 @@ type UserImageConfig struct {
CreateVersion bool `json:"create_version"` CreateVersion bool `json:"create_version"`
Flavor Flavor `json:"flavor"` Flavor Flavor `json:"flavor"`
PoolID string `json:"pool_id"` PoolID string `json:"pool_id"`
ShareAddr string `json:"nas_share_addr"`
MountPath string `json:"nas_mount_path"`
NasType string `json:"nas_type"`
} }


type CreateTrainJobParams struct { type CreateTrainJobParams struct {
@@ -1084,13 +1087,18 @@ type Config struct {
CreateVersion bool `json:"create_version"` CreateVersion bool `json:"create_version"`
Flavor Flavor `json:"flavor"` Flavor Flavor `json:"flavor"`
PoolID string `json:"pool_id"` PoolID string `json:"pool_id"`
ShareAddr string `json:"nas_share_addr"`
MountPath string `json:"nas_mount_path"`
NasType string `json:"nas_type"`
} }

type CreateInferenceJobParams struct { type CreateInferenceJobParams struct {
JobName string `json:"job_name"` JobName string `json:"job_name"`
Description string `json:"job_desc"` Description string `json:"job_desc"`
InfConfig InfConfig `json:"config"` InfConfig InfConfig `json:"config"`
WorkspaceID string `json:"workspace_id"` WorkspaceID string `json:"workspace_id"`
} }

type CreateInfUserImageParams struct { type CreateInfUserImageParams struct {
JobName string `json:"job_name"` JobName string `json:"job_name"`
Description string `json:"job_desc"` Description string `json:"job_desc"`
@@ -1148,6 +1156,9 @@ type TrainJobVersionConfig struct {
Flavor Flavor `json:"flavor"` Flavor Flavor `json:"flavor"`
PoolID string `json:"pool_id"` PoolID string `json:"pool_id"`
PreVersionId int64 `json:"pre_version_id"` PreVersionId int64 `json:"pre_version_id"`
ShareAddr string `json:"nas_share_addr"`
MountPath string `json:"nas_mount_path"`
NasType string `json:"nas_type"`
} }


type TrainJobVersionUserImageConfig struct { type TrainJobVersionUserImageConfig struct {
@@ -1163,6 +1174,9 @@ type TrainJobVersionUserImageConfig struct {
PreVersionId int64 `json:"pre_version_id"` PreVersionId int64 `json:"pre_version_id"`
UserImageUrl string `json:"user_image_url"` UserImageUrl string `json:"user_image_url"`
UserCommand string `json:"user_command"` UserCommand string `json:"user_command"`
ShareAddr string `json:"nas_share_addr"`
MountPath string `json:"nas_mount_path"`
NasType string `json:"nas_type"`
} }


type CreateConfigParams struct { type CreateConfigParams struct {
@@ -1178,6 +1192,7 @@ type CreateConfigParams struct {
LogUrl string `json:"log_url"` LogUrl string `json:"log_url"`
Flavor Flavor `json:"flavor"` Flavor Flavor `json:"flavor"`
PoolID string `json:"pool_id"` PoolID string `json:"pool_id"`
Volumes []Volumes `json:"volumes"`
} }


type Parameter struct { type Parameter struct {


+ 16
- 4
modules/modelarts/modelarts.go View File

@@ -281,7 +281,7 @@ func GenerateTask(ctx *context.Context, jobName, uuid, description, flavor strin
return nil return nil
} }


func GenerateNotebook2(ctx *context.Context, displayJobName, jobName, uuid, description, imageId string, spec *models.Specification, bootFile string,autoStopDurationInMs int64) (string, error) {
func GenerateNotebook2(ctx *context.Context, displayJobName, jobName, uuid, description, imageId string, spec *models.Specification, bootFile string, autoStopDurationInMs int64) (string, error) {
if poolInfos == nil { if poolInfos == nil {
json.Unmarshal([]byte(setting.PoolInfos), &poolInfos) json.Unmarshal([]byte(setting.PoolInfos), &poolInfos)
} }
@@ -379,6 +379,9 @@ func GenerateTrainJob(ctx *context.Context, req *GenerateTrainJobReq) (jobId str
Parameter: req.Parameters, Parameter: req.Parameters,
UserImageUrl: req.UserImageUrl, UserImageUrl: req.UserImageUrl,
UserCommand: req.UserCommand, UserCommand: req.UserCommand,
ShareAddr: setting.ModelArtsShareAddr,
MountPath: setting.ModelArtsMountPath,
NasType: setting.ModelArtsNasType,
}, },
}) })
} else { } else {
@@ -399,6 +402,9 @@ func GenerateTrainJob(ctx *context.Context, req *GenerateTrainJobReq) (jobId str
Code: req.Spec.SourceSpecId, Code: req.Spec.SourceSpecId,
}, },
Parameter: req.Parameters, Parameter: req.Parameters,
ShareAddr: setting.ModelArtsShareAddr,
MountPath: setting.ModelArtsMountPath,
NasType: setting.ModelArtsNasType,
}, },
}) })
} }
@@ -517,6 +523,9 @@ func GenerateTrainJobVersion(ctx *context.Context, req *GenerateTrainJobReq, job
PreVersionId: req.PreVersionId, PreVersionId: req.PreVersionId,
UserImageUrl: req.UserImageUrl, UserImageUrl: req.UserImageUrl,
UserCommand: req.UserCommand, UserCommand: req.UserCommand,
ShareAddr: setting.ModelArtsShareAddr,
MountPath: setting.ModelArtsMountPath,
NasType: setting.ModelArtsNasType,
}, },
}, jobId) }, jobId)
} else { } else {
@@ -536,6 +545,9 @@ func GenerateTrainJobVersion(ctx *context.Context, req *GenerateTrainJobReq, job
}, },
Parameter: req.Parameters, Parameter: req.Parameters,
PreVersionId: req.PreVersionId, PreVersionId: req.PreVersionId,
ShareAddr: setting.ModelArtsShareAddr,
MountPath: setting.ModelArtsMountPath,
NasType: setting.ModelArtsNasType,
}, },
}, jobId) }, jobId)
} }
@@ -972,14 +984,14 @@ func getJupyterBaseUrl(url string) string {
} }


func getCookiesAndCsrf(jupyterUrl string) ([]*http.Cookie, string) { func getCookiesAndCsrf(jupyterUrl string) ([]*http.Cookie, string) {
log.Info("jupyter url:"+jupyterUrl)
log.Info("jupyter url:" + jupyterUrl)
var cookies []*http.Cookie var cookies []*http.Cookie
const retryTimes = 10 const retryTimes = 10
for i := 0; i < retryTimes; i++ { for i := 0; i < retryTimes; i++ {
res, err := http.Get(jupyterUrl) res, err := http.Get(jupyterUrl)
if err != nil { if err != nil {
log.Error("browser jupyterUrl failed.",err)
if i==retryTimes-1{
log.Error("browser jupyterUrl failed.", err)
if i == retryTimes-1 {
return cookies, "" return cookies, ""
} }




+ 3
- 1
modules/modelarts/resty.go View File

@@ -497,7 +497,7 @@ sendjob:
} }


req, _ := json.Marshal(createJobParams) req, _ := json.Marshal(createJobParams)
log.Info("%s", req)
log.Info("postapi json: %s", req)


if res.StatusCode() == http.StatusUnauthorized && retry < 1 { if res.StatusCode() == http.StatusUnauthorized && retry < 1 {
retry++ retry++
@@ -543,6 +543,8 @@ func createTrainJob(createJobParams models.CreateTrainJobParams) (*models.Create
var result models.CreateTrainJobResult var result models.CreateTrainJobResult


retry := 0 retry := 0
req, _ := json.Marshal(createJobParams)
log.Info("postapi json: %s", req)


sendjob: sendjob:
res, err := client.R(). res, err := client.R().


+ 6
- 0
modules/setting/setting.go View File

@@ -585,6 +585,9 @@ var (
TrainJobFLAVORINFOS string TrainJobFLAVORINFOS string
ModelArtsSpecialPools string ModelArtsSpecialPools string
ModelArtsMultiNode string ModelArtsMultiNode string
ModelArtsShareAddr string
ModelArtsMountPath string
ModelArtsNasType string
//kanban //kanban
IsCloudbrainTimingEnabled bool IsCloudbrainTimingEnabled bool


@@ -1557,6 +1560,9 @@ func NewContext() {
TrainJobFLAVORINFOS = sec.Key("TrainJob_FLAVOR_INFOS").MustString("") TrainJobFLAVORINFOS = sec.Key("TrainJob_FLAVOR_INFOS").MustString("")
ModelArtsSpecialPools = sec.Key("SPECIAL_POOL").MustString("") ModelArtsSpecialPools = sec.Key("SPECIAL_POOL").MustString("")
ModelArtsMultiNode = sec.Key("MULTI_NODE").MustString("") ModelArtsMultiNode = sec.Key("MULTI_NODE").MustString("")
ModelArtsShareAddr = sec.Key("ModelArts_Share_Addr").MustString("192.168.0.30:/")
ModelArtsMountPath = sec.Key("ModelArts_Mount_Path").MustString("/cache/sfs")
ModelArtsNasType = sec.Key("ModelArts_Nas_Type").MustString("nfs")


sec = Cfg.Section("elk") sec = Cfg.Section("elk")
ElkUrl = sec.Key("ELKURL").MustString("") ElkUrl = sec.Key("ELKURL").MustString("")


Loading…
Cancel
Save