You can not select more than 25 topics Topics must start with a chinese character,a letter or number, can include dashes ('-') and can be up to 35 characters long.

cloudbrain.go 37 kB

3 years ago
3 years ago
4 years ago
3 years ago
4 years ago
4 years ago
4 years ago
3 years ago
3 years ago
4 years ago
4 years ago
3 years ago
3 years ago
3 years ago
3 years ago
3 years ago
3 years ago
5 years ago
4 years ago
4 years ago
4 years ago
5 years ago
4 years ago
4 years ago
4 years ago
3 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
3 years ago
4 years ago
3 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
3 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
3 years ago
5 years ago
4 years ago
3 years ago
5 years ago
3 years ago
5 years ago
3 years ago
3 years ago
3 years ago
5 years ago
4 years ago
3 years ago
3 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
3 years ago
3 years ago
3 years ago
3 years ago
3 years ago
3 years ago
12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115111611171118111911201121112211231124112511261127112811291130113111321133113411351136113711381139114011411142114311441145114611471148114911501151115211531154115511561157115811591160116111621163116411651166116711681169
  1. package models
  2. import (
  3. "encoding/json"
  4. "fmt"
  5. "strings"
  6. "time"
  7. "xorm.io/builder"
  8. "xorm.io/xorm"
  9. "code.gitea.io/gitea/modules/log"
  10. "code.gitea.io/gitea/modules/setting"
  11. "code.gitea.io/gitea/modules/timeutil"
  12. )
  13. type CloudbrainStatus string
  14. type JobType string
  15. type ModelArtsJobStatus string
  16. const (
  17. JobWaiting CloudbrainStatus = "WAITING"
  18. JobStopped CloudbrainStatus = "STOPPED"
  19. JobSucceeded CloudbrainStatus = "SUCCEEDED"
  20. JobFailed CloudbrainStatus = "FAILED"
  21. JobRunning CloudbrainStatus = "RUNNING"
  22. JobTypeDebug JobType = "DEBUG"
  23. JobTypeBenchmark JobType = "BENCHMARK"
  24. JobTypeSnn4imagenet JobType = "SNN4IMAGENET"
  25. JobTypeBrainScore JobType = "BRAINSCORE"
  26. JobTypeTrain JobType = "TRAIN"
  27. JobVersionName JobType = "V0001"
  28. ModelArtsCreateQueue ModelArtsJobStatus = "CREATE_QUEUING" //免费资源创建排队中
  29. ModelArtsCreating ModelArtsJobStatus = "CREATING" //创建中
  30. ModelArtsCreateFailed ModelArtsJobStatus = "CREATE_FAILED" //创建失败
  31. ModelArtsStartQueuing ModelArtsJobStatus = "START_QUEUING" //免费资源启动排队中
  32. ModelArtsReadyToStart ModelArtsJobStatus = "READY_TO_START" //免费资源等待启动
  33. ModelArtsStarting ModelArtsJobStatus = "STARTING" //启动中
  34. ModelArtsRestarting ModelArtsJobStatus = "RESTARTING" //重启中
  35. ModelArtsStartFailed ModelArtsJobStatus = "START_FAILED" //启动失败
  36. ModelArtsRunning ModelArtsJobStatus = "RUNNING" //运行中
  37. ModelArtsStopping ModelArtsJobStatus = "STOPPING" //停止中
  38. ModelArtsStopped ModelArtsJobStatus = "STOPPED" //停止
  39. ModelArtsUnavailable ModelArtsJobStatus = "UNAVAILABLE" //故障
  40. ModelArtsDeleted ModelArtsJobStatus = "DELETED" //已删除
  41. ModelArtsResizing ModelArtsJobStatus = "RESIZING" //规格变更中
  42. ModelArtsResizFailed ModelArtsJobStatus = "RESIZE_FAILED" //规格变更失败
  43. )
  44. type Cloudbrain struct {
  45. ID int64 `xorm:"pk autoincr"`
  46. JobID string `xorm:"INDEX NOT NULL"`
  47. JobType string `xorm:"INDEX NOT NULL DEFAULT 'DEBUG'"`
  48. JobName string `xorm:"INDEX"`
  49. Status string `xorm:"INDEX"`
  50. UserID int64 `xorm:"INDEX"`
  51. RepoID int64 `xorm:"INDEX"`
  52. SubTaskName string `xorm:"INDEX"`
  53. ContainerID string
  54. ContainerIp string
  55. CreatedUnix timeutil.TimeStamp `xorm:"INDEX created"`
  56. UpdatedUnix timeutil.TimeStamp `xorm:"INDEX updated"`
  57. Duration int64 `xorm:"INDEX duration"`
  58. TrainJobDuration string
  59. DeletedAt time.Time `xorm:"deleted"`
  60. CanDebug bool `xorm:"-"`
  61. CanDel bool `xorm:"-"`
  62. Type int `xorm:"INDEX DEFAULT 0"`
  63. VersionID int64 `xorm:"INDEX DEFAULT 0"`
  64. VersionName string `xorm:"INDEX"`
  65. Uuid string
  66. DatasetName string
  67. VersionCount int64 `xorm:"INDEX DEFAULT 1"`
  68. IsLatestVersion string
  69. CommitID string
  70. FatherVersionName string
  71. ComputeResource string
  72. EngineID int64
  73. TrainUrl string
  74. BranchName string
  75. Parameters string
  76. BootFile string
  77. DataUrl string
  78. LogUrl string
  79. PreVersionId int64
  80. FlavorCode string
  81. Description string
  82. WorkServerNumber int
  83. FlavorName string
  84. User *User `xorm:"-"`
  85. Repo *Repository `xorm:"-"`
  86. }
  87. type TrainjobConfigDetail struct {
  88. ID int64 `xorm:"pk autoincr"`
  89. JobID string `xorm:"INDEX"`
  90. JobName string `xorm:"INDEX"`
  91. ResourcePools string `xorm:"INDEX"`
  92. EngineVersions int `xorm:"INDEX"`
  93. FlavorInfos string `xorm:"INDEX"`
  94. TrainUrl string `xorm:"INDEX"`
  95. BootFile string `xorm:"INDEX"`
  96. Uuid string `xorm:"INDEX"`
  97. DatasetName string `xorm:"INDEX"`
  98. Params string `xorm:"INDEX"`
  99. BranchName string `xorm:"INDEX"`
  100. VersionName string `xorm:"INDEX"`
  101. User *User `xorm:"-"`
  102. Repo *Repository `xorm:"-"`
  103. }
  104. type CloudbrainInfo struct {
  105. Cloudbrain `xorm:"extends"`
  106. User `xorm:"extends"`
  107. }
  108. type CloudBrainLoginResult struct {
  109. Code string
  110. Msg string
  111. Payload map[string]interface{}
  112. }
  113. type TaskRole struct {
  114. Name string `json:"name"`
  115. TaskNumber int `json:"taskNumber"`
  116. MinSucceededTaskCount int `json:"minSucceededTaskCount"`
  117. MinFailedTaskCount int `json:"minFailedTaskCount"`
  118. CPUNumber int `json:"cpuNumber"`
  119. GPUNumber int `json:"gpuNumber"`
  120. MemoryMB int `json:"memoryMB"`
  121. ShmMB int `json:"shmMB"`
  122. Command string `json:"command"`
  123. NeedIBDevice bool `json:"needIBDevice"`
  124. IsMainRole bool `json:"isMainRole"`
  125. UseNNI bool `json:"useNNI"`
  126. }
  127. type StHostPath struct {
  128. Path string `json:"path"`
  129. MountPath string `json:"mountPath"`
  130. ReadOnly bool `json:"readOnly"`
  131. }
  132. type Volume struct {
  133. HostPath StHostPath `json:"hostPath"`
  134. }
  135. type CreateJobParams struct {
  136. JobName string `json:"jobName"`
  137. RetryCount int8 `json:"retryCount"`
  138. GpuType string `json:"gpuType"`
  139. Image string `json:"image"`
  140. TaskRoles []TaskRole `json:"taskRoles"`
  141. Volumes []Volume `json:"volumes"`
  142. }
  143. type CreateJobResult struct {
  144. Code string `json:"code"`
  145. Msg string `json:"msg"`
  146. Payload map[string]interface{} `json:"payload"`
  147. }
  148. type GetJobResult struct {
  149. Code string `json:"code"`
  150. Msg string `json:"msg"`
  151. Payload map[string]interface{} `json:"payload"`
  152. }
  153. type GetImagesResult struct {
  154. Code string `json:"code"`
  155. Msg string `json:"msg"`
  156. Payload GetImagesPayload `json:"payload"`
  157. }
  158. type GetImagesPayload struct {
  159. Count int `json:"count"`
  160. TotalPages int `json:"totalPages,omitempty"`
  161. ImageInfo []*ImageInfo `json:"rows"`
  162. }
  163. type CloudbrainsOptions struct {
  164. ListOptions
  165. RepoID int64 // include all repos if empty
  166. UserID int64
  167. JobID string
  168. SortType string
  169. CloudbrainIDs []int64
  170. // JobStatus CloudbrainStatus
  171. Type int
  172. JobType string
  173. VersionName string
  174. IsLatestVersion string
  175. }
  176. type TaskPod struct {
  177. TaskRoleStatus struct {
  178. Name string `json:"name"`
  179. } `json:"taskRoleStatus"`
  180. //TaskStatuses []struct {
  181. // TaskIndex int `json:"taskIndex"`
  182. // PodUID string `json:"podUid"`
  183. // PodIP string `json:"podIp"`
  184. // PodName string `json:"podName"`
  185. // ContainerID string `json:"containerId"`
  186. // ContainerIP string `json:"containerIp"`
  187. // ContainerGpus string `json:"containerGpus"`
  188. // State string `json:"state"`
  189. // StartAt time.Time `json:"startAt"`
  190. // FinishedAt time.Time `json:"finishedAt"`
  191. // ExitCode int `json:"exitCode"`
  192. // ExitDiagnostics string `json:"exitDiagnostics"`
  193. // RetriedCount int `json:"retriedCount"`
  194. // StartTime string
  195. // FinishedTime string
  196. //} `json:"taskStatuses"`
  197. TaskStatuses []TaskStatuses `json:"taskStatuses"`
  198. }
  199. type TaskStatuses struct {
  200. TaskIndex int `json:"taskIndex"`
  201. PodUID string `json:"podUid"`
  202. PodIP string `json:"podIp"`
  203. PodName string `json:"podName"`
  204. ContainerID string `json:"containerId"`
  205. ContainerIP string `json:"containerIp"`
  206. ContainerGpus string `json:"containerGpus"`
  207. State string `json:"state"`
  208. StartAt time.Time `json:"startAt"`
  209. FinishedAt time.Time `json:"finishedAt"`
  210. ExitCode int `json:"exitCode"`
  211. ExitDiagnostics string `json:"exitDiagnostics"`
  212. RetriedCount int `json:"retriedCount"`
  213. StartTime string
  214. FinishedTime string
  215. }
  216. type TaskInfo struct {
  217. Username string `json:"username"`
  218. TaskName string `json:"task_name"`
  219. CodeName string `json:"code_name"`
  220. BenchmarkCategory []string `json:"selected_category"`
  221. CodeLink string `json:"code_link"`
  222. GpuType string `json:"gpu_type"`
  223. }
  224. func ConvertToTaskPod(input map[string]interface{}) (TaskPod, error) {
  225. data, _ := json.Marshal(input)
  226. var taskPod TaskPod
  227. err := json.Unmarshal(data, &taskPod)
  228. taskPod.TaskStatuses[0].StartTime = time.Unix(taskPod.TaskStatuses[0].StartAt.Unix()+8*3600, 0).UTC().Format("2006-01-02 15:04:05")
  229. taskPod.TaskStatuses[0].FinishedTime = time.Unix(taskPod.TaskStatuses[0].FinishedAt.Unix()+8*3600, 0).UTC().Format("2006-01-02 15:04:05")
  230. //if the task is not finished or stopped,the cloudbrain renturns 0001-01-01 08:00:00, the finishedTime shows with -
  231. if strings.HasPrefix(taskPod.TaskStatuses[0].FinishedTime, "0001") {
  232. taskPod.TaskStatuses[0].FinishedTime = "-"
  233. }
  234. return taskPod, err
  235. }
  236. type JobResultPayload struct {
  237. ID string `json:"id"`
  238. Name string `json:"name"`
  239. Platform string `json:"platform"`
  240. JobStatus struct {
  241. Username string `json:"username"`
  242. State string `json:"state"`
  243. SubState string `json:"subState"`
  244. ExecutionType string `json:"executionType"`
  245. Retries int `json:"retries"`
  246. CreatedTime int64 `json:"createdTime"`
  247. CompletedTime int64 `json:"completedTime"`
  248. AppID string `json:"appId"`
  249. AppProgress string `json:"appProgress"`
  250. AppTrackingURL string `json:"appTrackingUrl"`
  251. AppLaunchedTime int64 `json:"appLaunchedTime"`
  252. AppCompletedTime interface{} `json:"appCompletedTime"`
  253. AppExitCode int `json:"appExitCode"`
  254. AppExitDiagnostics string `json:"appExitDiagnostics"`
  255. AppExitType interface{} `json:"appExitType"`
  256. VirtualCluster string `json:"virtualCluster"`
  257. StartTime string
  258. EndTime string
  259. } `json:"jobStatus"`
  260. TaskRoles map[string]interface{} `json:"taskRoles"`
  261. Resource struct {
  262. CPU int `json:"cpu"`
  263. Memory string `json:"memory"`
  264. NvidiaComGpu int `json:"nvidia.com/gpu"`
  265. } `json:"resource"`
  266. Config struct {
  267. Image string `json:"image"`
  268. JobID string `json:"jobId"`
  269. GpuType string `json:"gpuType"`
  270. JobName string `json:"jobName"`
  271. JobType string `json:"jobType"`
  272. TaskRoles []struct {
  273. Name string `json:"name"`
  274. ShmMB int `json:"shmMB"`
  275. Command string `json:"command"`
  276. MemoryMB int `json:"memoryMB"`
  277. CPUNumber int `json:"cpuNumber"`
  278. GpuNumber int `json:"gpuNumber"`
  279. IsMainRole bool `json:"isMainRole"`
  280. TaskNumber int `json:"taskNumber"`
  281. NeedIBDevice bool `json:"needIBDevice"`
  282. MinFailedTaskCount int `json:"minFailedTaskCount"`
  283. MinSucceededTaskCount int `json:"minSucceededTaskCount"`
  284. } `json:"taskRoles"`
  285. RetryCount int `json:"retryCount"`
  286. } `json:"config"`
  287. Userinfo struct {
  288. User string `json:"user"`
  289. OrgID string `json:"org_id"`
  290. } `json:"userinfo"`
  291. }
  292. func ConvertToJobResultPayload(input map[string]interface{}) (JobResultPayload, error) {
  293. data, _ := json.Marshal(input)
  294. var jobResultPayload JobResultPayload
  295. err := json.Unmarshal(data, &jobResultPayload)
  296. jobResultPayload.JobStatus.StartTime = time.Unix(jobResultPayload.JobStatus.CreatedTime/1000, 0).Format("2006-01-02 15:04:05")
  297. jobResultPayload.JobStatus.EndTime = time.Unix(jobResultPayload.JobStatus.CompletedTime/1000, 0).Format("2006-01-02 15:04:05")
  298. if jobResultPayload.JobStatus.State == string(JobWaiting) {
  299. jobResultPayload.JobStatus.StartTime = "-"
  300. jobResultPayload.JobStatus.EndTime = "-"
  301. }
  302. return jobResultPayload, err
  303. }
  304. type ImagesResultPayload struct {
  305. Images []struct {
  306. ID int `json:"id"`
  307. Name string `json:"name"`
  308. Place string `json:"place"`
  309. Description string `json:"description"`
  310. Provider string `json:"provider"`
  311. Createtime string `json:"createtime"`
  312. Remark string `json:"remark"`
  313. } `json:"taskStatuses"`
  314. }
  315. type ImageInfo struct {
  316. ID int `json:"id"`
  317. Name string `json:"name"`
  318. Place string `json:"place"`
  319. Description string `json:"description"`
  320. Provider string `json:"provider"`
  321. Createtime string `json:"createtime"`
  322. Remark string `json:"remark"`
  323. IsPublic int `json:"isPublic"`
  324. PlaceView string
  325. }
  326. type Categories struct {
  327. Category []*Category `json:"category"`
  328. }
  329. type Category struct {
  330. Id int `json:"id"`
  331. Value string `json:"value"`
  332. }
  333. type GpuInfos struct {
  334. GpuInfo []*GpuInfo `json:"gpu_type"`
  335. }
  336. type GpuInfo struct {
  337. Id int `json:"id"`
  338. Value string `json:"value"`
  339. Queue string `json:"queue"`
  340. }
  341. type ResourceSpecs struct {
  342. ResourceSpec []*ResourceSpec `json:"resorce_specs"`
  343. }
  344. type ResourceSpec struct {
  345. Id int `json:"id"`
  346. CpuNum int `json:"cpu"`
  347. GpuNum int `json:"gpu"`
  348. MemMiB int `json:"memMiB"`
  349. ShareMemMiB int `json:"shareMemMiB"`
  350. }
  351. type FlavorInfos struct {
  352. FlavorInfo []*FlavorInfo `json:"flavor_info"`
  353. }
  354. type FlavorInfo struct {
  355. Id int `json:"id"`
  356. Value string `json:"value"`
  357. }
  358. type PoolInfos struct {
  359. PoolInfo []*PoolInfo `json:"pool_info"`
  360. }
  361. type PoolInfo struct {
  362. PoolId string `json:"pool_id"`
  363. PoolName string `json:"pool_name"`
  364. PoolType string `json:"pool_type"`
  365. }
  366. type CommitImageParams struct {
  367. Ip string `json:"ip"`
  368. TaskContainerId string `json:"taskContainerId"`
  369. ImageTag string `json:"imageTag"`
  370. ImageDescription string `json:"imageDescription"`
  371. }
  372. type CommitImageResult struct {
  373. Code string `json:"code"`
  374. Msg string `json:"msg"`
  375. Payload map[string]interface{} `json:"payload"`
  376. }
  377. type CloudBrainResult struct {
  378. Code string `json:"code"`
  379. Msg string `json:"msg"`
  380. }
  381. type CreateNotebookParams struct {
  382. JobName string `json:"name"`
  383. Description string `json:"description"`
  384. ProfileID string `json:"profile_id"`
  385. Flavor string `json:"flavor"`
  386. Spec Spec `json:"spec"`
  387. Workspace Workspace `json:"workspace"`
  388. Pool Pool `json:"pool"`
  389. }
  390. type Pool struct {
  391. ID string `json:"id"`
  392. Name string `json:"name"`
  393. Type string `json:"type"`
  394. }
  395. type Workspace struct {
  396. ID string `json:"id"`
  397. }
  398. type Spec struct {
  399. Storage Storage `json:"storage"`
  400. AutoStop AutoStop `json:"auto_stop"`
  401. }
  402. type AutoStop struct {
  403. Enable bool `json:"enable"`
  404. Duration int `json:"duration"`
  405. }
  406. type Storage struct {
  407. Type string `json:"type"`
  408. Location Location `json:"location"`
  409. }
  410. type Location struct {
  411. Path string `json:"path"`
  412. }
  413. type NotebookResult struct {
  414. ErrorCode string `json:"error_code"`
  415. ErrorMsg string `json:"error_msg"`
  416. }
  417. type CreateNotebookResult struct {
  418. ErrorCode string `json:"error_code"`
  419. ErrorMsg string `json:"error_msg"`
  420. ID string `json:"id"`
  421. Name string `json:"name"`
  422. Description string `json:"description"`
  423. Status string `json:"status"`
  424. CreationTimestamp string `json:"creation_timestamp"`
  425. LatestUpdateTimestamp string `json:"latest_update_timestamp"`
  426. Profile struct {
  427. ID string `json:"id"`
  428. Name string `json:"name"`
  429. Description string `json:"description"`
  430. DeType string `json:"de_type"`
  431. FlavorType string `json:"flavor_type"`
  432. } `json:"profile"`
  433. Flavor string `json:"flavor"`
  434. FlavorDetails struct {
  435. Name string `json:"name"`
  436. Status string `json:"status"`
  437. QueuingNum int `json:"queuing_num"`
  438. QueueLeftTime int `json:"queue_left_time"` //s
  439. Duration int `json:"duration"` //auto_stop_time s
  440. } `json:"flavor_details"`
  441. }
  442. type GetNotebookResult struct {
  443. ErrorCode string `json:"error_code"`
  444. ErrorMsg string `json:"error_msg"`
  445. ID string `json:"id"`
  446. Name string `json:"name"`
  447. Description string `json:"description"`
  448. Status string `json:"status"`
  449. CreationTimestamp string `json:"creation_timestamp"`
  450. CreateTime string
  451. LatestUpdateTimestamp string `json:"latest_update_timestamp"`
  452. LatestUpdateTime string
  453. Profile struct {
  454. ID string `json:"id"`
  455. Name string `json:"name"`
  456. Description string `json:"description"`
  457. DeType string `json:"de_type"`
  458. FlavorType string `json:"flavor_type"`
  459. } `json:"profile"`
  460. Flavor string `json:"flavor"`
  461. FlavorDetails struct {
  462. Name string `json:"name"`
  463. Status string `json:"status"`
  464. QueuingNum int `json:"queuing_num"`
  465. QueueLeftTime int `json:"queue_left_time"` //s
  466. Duration int `json:"duration"` //auto_stop_time s
  467. } `json:"flavor_details"`
  468. QueuingInfo struct {
  469. ID string `json:"id"`
  470. Name string `json:"name"`
  471. Flavor string `json:"flavor"`
  472. DeType string `json:"de_type"`
  473. Status string `json:"status"`
  474. BeginTimestamp int `json:"begin_timestamp"` //time of instance begin in queue
  475. BeginTime string
  476. RemainTime int `json:"remain_time"` //remain time of instance
  477. EndTimestamp int `json:"end_timestamp"` //
  478. EndTime string
  479. Rank int `json:"rank"` //rank of instance in queue
  480. } `json:"queuing_info"`
  481. Spec struct {
  482. Annotations struct {
  483. TargetDomain string `json:"target_domain"`
  484. Url string `json:"url"`
  485. } `json:"annotations"`
  486. } `json:"spec"`
  487. }
  488. type GetTokenParams struct {
  489. Auth Auth `json:"auth"`
  490. }
  491. type Auth struct {
  492. Identity Identity `json:"identity"`
  493. Scope Scope `json:"scope"`
  494. }
  495. type Scope struct {
  496. Project Project `json:"project"`
  497. }
  498. type Project struct {
  499. Name string `json:"name"`
  500. }
  501. type Identity struct {
  502. Methods []string `json:"methods"`
  503. Password Password `json:"password"`
  504. }
  505. type Password struct {
  506. User NotebookUser `json:"user"`
  507. }
  508. type NotebookUser struct {
  509. Name string `json:"name"`
  510. Password string `json:"password"`
  511. Domain Domain `json:"domain"`
  512. }
  513. type Domain struct {
  514. Name string `json:"name"`
  515. }
  516. const (
  517. ActionStart = "start"
  518. ActionStop = "stop"
  519. ActionRestart = "restart"
  520. ActionQueue = "queue"
  521. ActionDequeue = "dequeue"
  522. )
  523. type NotebookAction struct {
  524. Action string `json:"action"`
  525. }
  526. type NotebookActionResult struct {
  527. ErrorCode string `json:"error_code"`
  528. ErrorMsg string `json:"error_msg"`
  529. CurrentStatus string `json:"current_status"`
  530. PreviousState string `json:"previous_state"`
  531. }
  532. type NotebookGetJobTokenResult struct {
  533. ErrorCode string `json:"error_code"`
  534. ErrorMsg string `json:"error_msg"`
  535. Token string `json:"token"`
  536. }
  537. type NotebookDelResult struct {
  538. InstanceID string `json:"instance_id"`
  539. }
  540. type CreateTrainJobParams struct {
  541. JobName string `json:"job_name"`
  542. Description string `json:"job_desc"`
  543. Config Config `json:"config"`
  544. WorkspaceID string `json:"workspace_id"`
  545. }
  546. type Config struct {
  547. WorkServerNum int `json:"worker_server_num"`
  548. AppUrl string `json:"app_url"` //训练作业的代码目录
  549. BootFileUrl string `json:"boot_file_url"` //训练作业的代码启动文件,需要在代码目录下
  550. Parameter []Parameter `json:"parameter"`
  551. DataUrl string `json:"data_url"` //训练作业需要的数据集OBS路径URL
  552. //DatasetID string `json:"dataset_id"`
  553. //DataVersionID string `json:"dataset_version_id"`
  554. //DataSource []DataSource `json:"data_source"`
  555. //SpecID int64 `json:"spec_id"`
  556. EngineID int64 `json:"engine_id"`
  557. //ModelID int64 `json:"model_id"`
  558. TrainUrl string `json:"train_url"` //训练作业的输出文件OBS路径URL
  559. LogUrl string `json:"log_url"`
  560. //UserImageUrl string `json:"user_image_url"`
  561. //UserCommand string `json:"user_command"`
  562. CreateVersion bool `json:"create_version"`
  563. //Volumes []Volumes `json:"volumes"`
  564. Flavor Flavor `json:"flavor"`
  565. PoolID string `json:"pool_id"`
  566. }
  567. type CreateTrainJobVersionParams struct {
  568. Description string `json:"job_desc"`
  569. Config TrainJobVersionConfig `json:"config"`
  570. }
  571. type TrainJobVersionConfig struct {
  572. WorkServerNum int `json:"worker_server_num"`
  573. AppUrl string `json:"app_url"` //训练作业的代码目录
  574. BootFileUrl string `json:"boot_file_url"` //训练作业的代码启动文件,需要在代码目录下
  575. Parameter []Parameter `json:"parameter"`
  576. DataUrl string `json:"data_url"` //训练作业需要的数据集OBS路径URL
  577. //DatasetID string `json:"dataset_id"`
  578. //DataVersionID string `json:"dataset_version_id"`
  579. //DataSource []DataSource `json:"data_source"`
  580. //SpecID int64 `json:"spec_id"`
  581. EngineID int64 `json:"engine_id"`
  582. //ModelID int64 `json:"model_id"`
  583. TrainUrl string `json:"train_url"` //训练作业的输出文件OBS路径URL
  584. LogUrl string `json:"log_url"`
  585. //UserImageUrl string `json:"user_image_url"`
  586. //UserCommand string `json:"user_command"`
  587. //Volumes []Volumes `json:"volumes"`
  588. Flavor Flavor `json:"flavor"`
  589. PoolID string `json:"pool_id"`
  590. PreVersionId int64 `json:"pre_version_id"`
  591. }
  592. type CreateConfigParams struct {
  593. ConfigName string `json:"config_name"`
  594. Description string `json:"config_desc"`
  595. WorkServerNum int `json:"worker_server_num"`
  596. AppUrl string `json:"app_url"` //训练作业的代码目录
  597. BootFileUrl string `json:"boot_file_url"` //训练作业的代码启动文件,需要在代码目录下
  598. Parameter []Parameter `json:"parameter"`
  599. DataUrl string `json:"data_url"` //训练作业需要的数据集OBS路径URL
  600. //DatasetID string `json:"dataset_id"`
  601. //DataVersionID string `json:"dataset_version_id"`
  602. //DataSource []DataSource `json:"data_source"`
  603. //SpecID int64 `json:"spec_id"`
  604. EngineID int64 `json:"engine_id"`
  605. //ModelID int64 `json:"model_id"`
  606. TrainUrl string `json:"train_url"` //训练作业的输出文件OBS路径URL
  607. LogUrl string `json:"log_url"`
  608. //UserImageUrl string `json:"user_image_url"`
  609. //UserCommand string `json:"user_command"`
  610. //CreateVersion bool `json:"create_version"`
  611. //Volumes []Volumes `json:"volumes"`
  612. Flavor Flavor `json:"flavor"`
  613. PoolID string `json:"pool_id"`
  614. }
  615. type Parameter struct {
  616. Label string `json:"label"`
  617. Value string `json:"value"`
  618. }
  619. type Parameters struct {
  620. Parameter []Parameter `json:"parameter"`
  621. }
  622. type DataSource struct {
  623. DatasetID string `json:"dataset_id"`
  624. DatasetVersion string `json:"dataset_version"`
  625. Type string `json:"type"`
  626. DataUrl string `json:"data_url"`
  627. }
  628. type Volumes struct {
  629. Nfs Nfs `json:"nfs"`
  630. HostPath HostPath `json:"host_path"`
  631. }
  632. type Nfs struct {
  633. ID string `json:"id"`
  634. SourcePath string `json:"src_path"`
  635. DestPath string `json:"dest_path"`
  636. ReadOnly bool `json:"read_only"`
  637. }
  638. type HostPath struct {
  639. SourcePath string `json:"src_path"`
  640. DestPath string `json:"dest_path"`
  641. ReadOnly bool `json:"read_only"`
  642. }
  643. type Flavor struct {
  644. Code string `json:"code"`
  645. }
  646. type CreateTrainJobResult struct {
  647. ErrorCode string `json:"error_code"`
  648. ErrorMsg string `json:"error_msg"`
  649. IsSuccess bool `json:"is_success"`
  650. JobName string `json:"job_name"`
  651. JobID int64 `json:"job_id"`
  652. Status int `json:"status"`
  653. CreateTime int64 `json:"create_time"`
  654. VersionID int64 `json:"version_id"`
  655. ResourceID string `json:"resource_id"`
  656. VersionName string `json:"version_name"`
  657. }
  658. type CreateTrainJobConfigResult struct {
  659. ErrorCode string `json:"error_code"`
  660. ErrorMsg string `json:"error_msg"`
  661. IsSuccess bool `json:"is_success"`
  662. }
  663. type GetResourceSpecsResult struct {
  664. ErrorCode string `json:"error_code"`
  665. ErrorMsg string `json:"error_msg"`
  666. IsSuccess bool `json:"is_success"`
  667. SpecTotalCount int `json:"spec_total_count"`
  668. Specs []Specs `json:"specs"`
  669. }
  670. type Specs struct {
  671. Core string `json:"core"`
  672. Cpu string `json:"cpu"`
  673. IsNoResource bool `json:"no_resource"`
  674. GpuType string `json:"gpu_type"`
  675. SpecID int64 `json:"spec_id"`
  676. GpuNum int `json:"gpu_num"`
  677. SpecCode string `json:"spec_code"`
  678. Storage string `json:"storage"`
  679. MaxNum int `json:"max_num"`
  680. UnitNum int `json:"unit_num"`
  681. InterfaceType int `json:"interface_type"`
  682. }
  683. type GetConfigListResult struct {
  684. ErrorCode string `json:"error_code"`
  685. ErrorMsg string `json:"error_msg"`
  686. IsSuccess bool `json:"is_success"`
  687. ConfigTotalCount int `json:"config_total_count"`
  688. ParaConfigs []ParaConfig `json:"configs"`
  689. }
  690. type ParaConfig struct {
  691. ConfigName string `json:"config_name"`
  692. ConfigDesc string `json:"config_desc"`
  693. CreateTime int64 `json:"create_time"`
  694. EngineType int `json:"engine_type"`
  695. EngineName string `json:"engine_name"`
  696. EngineId int64 `json:"engine_id"`
  697. EngineVersion string `json:"engine_version"`
  698. UserImageUrl string `json:"user_image_url"`
  699. UserCommand string `json:"user_command"`
  700. Result GetConfigResult
  701. }
  702. type GetConfigResult struct {
  703. ErrorCode string `json:"error_code"`
  704. ErrorMsg string `json:"error_msg"`
  705. IsSuccess bool `json:"is_success"`
  706. ConfigName string `json:"config_name"`
  707. Description string `json:"config_desc"`
  708. WorkServerNum int `json:"worker_server_num"`
  709. AppUrl string `json:"app_url"` //训练作业的代码目录
  710. BootFileUrl string `json:"boot_file_url"` //训练作业的代码启动文件,需要在代码目录下
  711. Parameter []Parameter `json:"parameter"`
  712. DataUrl string `json:"data_url"` //训练作业需要的数据集OBS路径URL
  713. //DatasetID string `json:"dataset_id"`
  714. //DataVersionID string `json:"dataset_version_id"`
  715. //DataSource []DataSource `json:"data_source"`
  716. //SpecID int64 `json:"spec_id"`
  717. EngineID int64 `json:"engine_id"`
  718. //ModelID int64 `json:"model_id"`
  719. TrainUrl string `json:"train_url"` //训练作业的输出文件OBS路径URL
  720. LogUrl string `json:"log_url"`
  721. //UserImageUrl string `json:"user_image_url"`
  722. //UserCommand string `json:"user_command"`
  723. //CreateVersion bool `json:"create_version"`
  724. //Volumes []Volumes `json:"volumes"`
  725. Flavor Flavor `json:"flavor"`
  726. PoolID string `json:"pool_id"`
  727. }
  728. type ErrorResult struct {
  729. ErrorCode string `json:"error_code"`
  730. ErrorMsg string `json:"error_message"`
  731. IsSuccess bool `json:"is_success"`
  732. }
  733. type GetTrainJobResult struct {
  734. IsSuccess bool `json:"is_success"`
  735. JobName string `json:"job_name"`
  736. JobID int64 `json:"job_id"`
  737. Description string `json:"job_desc"`
  738. IntStatus int `json:"status"`
  739. Status string
  740. LongCreateTime int64 `json:"create_time"`
  741. CreateTime string
  742. Duration int64 `json:"duration"` //训练作业的运行时间,单位为毫秒
  743. TrainJobDuration string //训练作业的运行时间,格式为hh:mm:ss
  744. VersionID int64 `json:"version_id"`
  745. ResourceID string `json:"resource_id"`
  746. VersionName string `json:"version_name"`
  747. PreVersionID int64 `json:"pre_version_id"`
  748. WorkServerNum int `json:"worker_server_num"`
  749. AppUrl string `json:"app_url"` //训练作业的代码目录
  750. BootFileUrl string `json:"boot_file_url"` //训练作业的代码启动文件,需要在代码目录下
  751. Parameter []Parameter `json:"parameter"`
  752. DataUrl string `json:"data_url"` //训练作业需要的数据集OBS路径URL
  753. //DatasetID string `json:"dataset_id"`
  754. //DataVersionID string `json:"dataset_version_id"`
  755. //DataSource []DataSource `json:"data_source"`
  756. //SpecID int64 `json:"spec_id"`
  757. EngineID int64 `json:"engine_id"`
  758. EngineName string `json:"engine_name"`
  759. EngineVersion string `json:"engine_version"`
  760. //ModelID int64 `json:"model_id"`
  761. TrainUrl string `json:"train_url"` //训练作业的输出文件OBS路径URL
  762. LogUrl string `json:"log_url"`
  763. //UserImageUrl string `json:"user_image_url"`
  764. //UserCommand string `json:"user_command"`
  765. //Volumes []Volumes `json:"volumes"`
  766. Flavor Flavor `json:"flavor"`
  767. PoolID string `json:"pool_id"`
  768. PoolName string `json:"pool_name"`
  769. NasMountPath string `json:"nas_mount_path"`
  770. NasShareAddr string `json:"nas_share_addr"`
  771. DatasetName string
  772. ModelMetricList string `json:"model_metric_list"` //列表里包含f1_score,recall,precision,accuracy,若有的话
  773. }
  774. type GetTrainJobLogResult struct {
  775. ErrorCode string `json:"error_code"`
  776. ErrorMsg string `json:"error_msg"`
  777. IsSuccess bool `json:"is_success"`
  778. Content string `json:"content"`
  779. Lines int `json:"lines"`
  780. StartLine string `json:"start_line"`
  781. EndLine string `json:"end_line"`
  782. }
  783. type GetTrainJobLogFileNamesResult struct {
  784. ErrorCode string `json:"error_code"`
  785. ErrorMsg string `json:"error_msg"`
  786. IsSuccess bool `json:"is_success"`
  787. LogFileList []string `json:"log_file_list"`
  788. }
  789. type TrainJobResult struct {
  790. ErrorCode string `json:"error_code"`
  791. ErrorMsg string `json:"error_msg"`
  792. IsSuccess bool `json:"is_success"`
  793. }
  794. type LogFile struct {
  795. Name string
  796. }
  797. func Cloudbrains(opts *CloudbrainsOptions) ([]*CloudbrainInfo, int64, error) {
  798. sess := x.NewSession()
  799. defer sess.Close()
  800. var cond = builder.NewCond()
  801. if opts.RepoID > 0 {
  802. cond = cond.And(
  803. builder.Eq{"cloudbrain.repo_id": opts.RepoID},
  804. )
  805. }
  806. if opts.UserID > 0 {
  807. cond = cond.And(
  808. builder.Eq{"cloudbrain.user_id": opts.UserID},
  809. )
  810. }
  811. if (opts.JobID) != "" {
  812. cond = cond.And(
  813. builder.Eq{"cloudbrain.job_id": opts.JobID},
  814. )
  815. }
  816. if (opts.Type) >= 0 {
  817. cond = cond.And(
  818. builder.Eq{"cloudbrain.type": opts.Type},
  819. )
  820. }
  821. if (opts.JobType) != "" {
  822. cond = cond.And(
  823. builder.Eq{"cloudbrain.job_type": opts.JobType},
  824. )
  825. }
  826. if (opts.IsLatestVersion) != "" {
  827. cond = cond.And(
  828. builder.Eq{"cloudbrain.is_latest_version": opts.IsLatestVersion},
  829. )
  830. }
  831. // switch opts.JobStatus {
  832. // case JobWaiting:
  833. // cond.And(builder.Eq{"cloudbrain.status": int(JobWaiting)})
  834. // case JobFailed:
  835. // cond.And(builder.Eq{"cloudbrain.status": int(JobFailed)})
  836. // case JobStopped:
  837. // cond.And(builder.Eq{"cloudbrain.status": int(JobStopped)})
  838. // case JobSucceeded:
  839. // cond.And(builder.Eq{"cloudbrain.status": int(JobSucceeded)})
  840. // }
  841. if len(opts.CloudbrainIDs) > 0 {
  842. cond = cond.And(builder.In("cloudbrain.id", opts.CloudbrainIDs))
  843. }
  844. count, err := sess.Where(cond).Count(new(Cloudbrain))
  845. if err != nil {
  846. return nil, 0, fmt.Errorf("Count: %v", err)
  847. }
  848. if opts.Page >= 0 && opts.PageSize > 0 {
  849. var start int
  850. if opts.Page == 0 {
  851. start = 0
  852. } else {
  853. start = (opts.Page - 1) * opts.PageSize
  854. }
  855. sess.Limit(opts.PageSize, start)
  856. }
  857. sess.OrderBy("cloudbrain.created_unix DESC")
  858. cloudbrains := make([]*CloudbrainInfo, 0, setting.UI.IssuePagingNum)
  859. if err := sess.Table(&Cloudbrain{}).Where(cond).
  860. Join("left", "`user`", "cloudbrain.user_id = `user`.id").
  861. Find(&cloudbrains); err != nil {
  862. return nil, 0, fmt.Errorf("Find: %v", err)
  863. }
  864. sess.Close()
  865. return cloudbrains, count, nil
  866. }
  867. func CloudbrainsVersionList(opts *CloudbrainsOptions) ([]*CloudbrainInfo, int64, error) {
  868. sess := x.NewSession()
  869. defer sess.Close()
  870. var cond = builder.NewCond()
  871. if opts.RepoID > 0 {
  872. cond = cond.And(
  873. builder.Eq{"cloudbrain.repo_id": opts.RepoID},
  874. )
  875. }
  876. if opts.UserID > 0 {
  877. cond = cond.And(
  878. builder.Eq{"cloudbrain.user_id": opts.UserID},
  879. )
  880. }
  881. if (opts.Type) >= 0 {
  882. cond = cond.And(
  883. builder.Eq{"cloudbrain.type": opts.Type},
  884. )
  885. }
  886. if (opts.JobID) != "" {
  887. cond = cond.And(
  888. builder.Eq{"cloudbrain.job_id": opts.JobID},
  889. )
  890. }
  891. if (opts.JobType) != "" {
  892. cond = cond.And(
  893. builder.Eq{"cloudbrain.job_type": opts.JobType},
  894. )
  895. }
  896. if len(opts.CloudbrainIDs) > 0 {
  897. cond = cond.And(builder.In("cloudbrain.id", opts.CloudbrainIDs))
  898. }
  899. count, err := sess.Where(cond).Count(new(Cloudbrain))
  900. if err != nil {
  901. return nil, 0, fmt.Errorf("Count: %v", err)
  902. }
  903. if opts.Page >= 0 && opts.PageSize > 0 {
  904. var start int
  905. if opts.Page == 0 {
  906. start = 0
  907. } else {
  908. start = (opts.Page - 1) * opts.PageSize
  909. }
  910. sess.Limit(opts.PageSize, start)
  911. }
  912. sess.OrderBy("cloudbrain.created_unix DESC")
  913. cloudbrains := make([]*CloudbrainInfo, 0, setting.UI.IssuePagingNum)
  914. if err := sess.Table(&Cloudbrain{}).Where(cond).
  915. Join("left", "`user`", "cloudbrain.user_id = `user`.id").
  916. Find(&cloudbrains); err != nil {
  917. return nil, 0, fmt.Errorf("Find: %v", err)
  918. }
  919. sess.Close()
  920. return cloudbrains, count, nil
  921. }
  922. func CreateCloudbrain(cloudbrain *Cloudbrain) (err error) {
  923. if _, err = x.Insert(cloudbrain); err != nil {
  924. return err
  925. }
  926. return nil
  927. }
  928. func CreateTrainjobConfigDetail(trainjobConfigDetail *TrainjobConfigDetail) (err error) {
  929. if _, err = x.Insert(trainjobConfigDetail); err != nil {
  930. return err
  931. }
  932. return nil
  933. }
  934. func getRepoCloudBrain(cb *Cloudbrain) (*Cloudbrain, error) {
  935. has, err := x.Get(cb)
  936. if err != nil {
  937. return nil, err
  938. } else if !has {
  939. return nil, ErrJobNotExist{}
  940. }
  941. return cb, nil
  942. }
  943. func GetRepoCloudBrainByJobID(repoID int64, jobID string) (*Cloudbrain, error) {
  944. cb := &Cloudbrain{JobID: jobID, RepoID: repoID}
  945. return getRepoCloudBrain(cb)
  946. }
  947. func GetCloudbrainByJobID(jobID string) (*Cloudbrain, error) {
  948. cb := &Cloudbrain{JobID: jobID}
  949. return getRepoCloudBrain(cb)
  950. }
  951. func GetCloudbrainByJobIDAndVersionName(jobID string, versionName string) (*Cloudbrain, error) {
  952. cb := &Cloudbrain{JobID: jobID, VersionName: versionName}
  953. return getRepoCloudBrain(cb)
  954. }
  955. func GetCloudbrainByJobIDAndIsLatestVersion(jobID string, isLatestVersion string) (*Cloudbrain, error) {
  956. cb := &Cloudbrain{JobID: jobID, IsLatestVersion: isLatestVersion}
  957. return getRepoCloudBrain(cb)
  958. }
  959. func GetCloudbrainsNeededStopByUserID(userID int64) ([]*Cloudbrain, error) {
  960. cloudBrains := make([]*Cloudbrain, 0)
  961. err := x.Cols("job_id", "status", "type").Where("user_id=? AND status !=?", userID, string(JobStopped)).Find(&cloudBrains)
  962. return cloudBrains, err
  963. }
  964. func GetCloudbrainsNeededStopByRepoID(repoID int64) ([]*Cloudbrain, error) {
  965. cloudBrains := make([]*Cloudbrain, 0)
  966. err := x.Cols("job_id", "status", "type").Where("repo_id=? AND status !=?", repoID, string(JobStopped)).Find(&cloudBrains)
  967. return cloudBrains, err
  968. }
  969. func SetCloudbrainStatusByJobID(jobID string, status CloudbrainStatus) (err error) {
  970. cb := &Cloudbrain{JobID: jobID, Status: string(status)}
  971. _, err = x.Cols("status").Where("cloudbrain.job_id=?", jobID).Update(cb)
  972. return
  973. }
  974. func SetTrainJobStatusByJobID(jobID string, status string, duration int64, trainjobduration string) (err error) {
  975. cb := &Cloudbrain{JobID: jobID, Status: string(status), Duration: duration, TrainJobDuration: trainjobduration}
  976. _, err = x.Cols("status", "duration", "train_job_duration").Where("cloudbrain.job_id=?", jobID).Update(cb)
  977. return
  978. }
  979. func SetVersionCountAndLatestVersionByJobIDAndVersionName(jobID string, versionName string, versionCount int64, isLatestVersion string) (err error) {
  980. cb := &Cloudbrain{JobID: jobID, VersionName: versionName, VersionCount: versionCount, IsLatestVersion: isLatestVersion}
  981. _, err = x.Cols("version_Count", "is_latest_version").Where("cloudbrain.job_id=? AND cloudbrain.version_name=?", jobID, versionName).Update(cb)
  982. return
  983. }
  984. func UpdateJob(job *Cloudbrain) error {
  985. return updateJob(x, job)
  986. }
  987. func updateJob(e Engine, job *Cloudbrain) error {
  988. var sess *xorm.Session
  989. sess = e.Where("job_id = ?", job.JobID)
  990. _, err := sess.Cols("status", "container_id", "container_ip").Update(job)
  991. return err
  992. }
  993. // func UpdateTrainJob(job *CloudbrainInfo) error {
  994. // return updateTrainJob(x, job)
  995. // }
  996. // func updateTrainJob(e Engine, job *CloudbrainInfo) error {
  997. // var sess *xorm.Session
  998. // sess = e.Where("job_id = ?", job.Cloudbrain.JobID)
  999. // _, err := sess.Cols("status", "container_id", "container_ip").Update(job)
  1000. // return err
  1001. // }
  1002. func DeleteJob(job *Cloudbrain) error {
  1003. return deleteJob(x, job)
  1004. }
  1005. func deleteJob(e Engine, job *Cloudbrain) error {
  1006. _, err := e.ID(job.ID).Delete(job)
  1007. return err
  1008. }
  1009. func GetCloudbrainByName(jobName string) (*Cloudbrain, error) {
  1010. cb := &Cloudbrain{JobName: jobName}
  1011. return getRepoCloudBrain(cb)
  1012. }
  1013. func CanDelJob(isSigned bool, user *User, job *CloudbrainInfo) bool {
  1014. if !isSigned || (job.Status != string(JobStopped) && job.Status != string(JobFailed) && job.Status != string(ModelArtsStartFailed) && job.Status != string(ModelArtsCreateFailed)) {
  1015. return false
  1016. }
  1017. repo, err := GetRepositoryByID(job.RepoID)
  1018. if err != nil {
  1019. log.Error("GetRepositoryByID failed:%v", err.Error())
  1020. return false
  1021. }
  1022. permission, _ := GetUserRepoPermission(repo, user)
  1023. if err != nil {
  1024. log.Error("GetUserRepoPermission failed:%v", err.Error())
  1025. return false
  1026. }
  1027. if (user.ID == job.UserID && permission.AccessMode >= AccessModeWrite) || user.IsAdmin || permission.AccessMode >= AccessModeAdmin {
  1028. return true
  1029. }
  1030. return false
  1031. }