You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number, can include dashes ('-'), and can be up to 35 characters long.

modelarts.go 11 kB

3 years ago
4 years ago
3 years ago
3 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
3 years ago
3 years ago
3 years ago
4 years ago
3 years ago
4 years ago
3 years ago
3 years ago
3 years ago
3 years ago
4 years ago
4 years ago
3 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
3 years ago
3 years ago
3 years ago
3 years ago
3 years ago
3 years ago
3 years ago
3 years ago
3 years ago
3 years ago
3 years ago
3 years ago
3 years ago
3 years ago
3 years ago
3 years ago
3 years ago
3 years ago
3 years ago
3 years ago
3 years ago
3 years ago
3 years ago
3 years ago
3 years ago
3 years ago
3 years ago
3 years ago
3 years ago
3 years ago
3 years ago
3 years ago
123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425
  1. // Copyright 2016 The Gogs Authors. All rights reserved.
  2. // Copyright 2018 The Gitea Authors. All rights reserved.
  3. // Use of this source code is governed by a MIT-style
  4. // license that can be found in the LICENSE file.
  5. package repo
  import (
	"fmt"
	"net/http"
	"strconv"
	"strings"

	"code.gitea.io/gitea/models"
	"code.gitea.io/gitea/modules/context"
	"code.gitea.io/gitea/modules/log"
	"code.gitea.io/gitea/modules/modelarts"
	"code.gitea.io/gitea/modules/storage"
	"code.gitea.io/gitea/modules/util"
	routerRepo "code.gitea.io/gitea/routers/repo"
)
  18. func GetModelArtsNotebook(ctx *context.APIContext) {
  19. var (
  20. err error
  21. )
  22. jobID := ctx.Params(":jobid")
  23. repoID := ctx.Repo.Repository.ID
  24. job, err := models.GetRepoCloudBrainByJobID(repoID, jobID)
  25. if err != nil {
  26. ctx.NotFound(err)
  27. return
  28. }
  29. result, err := modelarts.GetJob(jobID)
  30. if err != nil {
  31. ctx.NotFound(err)
  32. return
  33. }
  34. job.Status = result.Status
  35. err = models.UpdateJob(job)
  36. if err != nil {
  37. log.Error("UpdateJob failed:", err)
  38. }
  39. ctx.JSON(http.StatusOK, map[string]interface{}{
  40. "JobID": jobID,
  41. "JobStatus": result.Status,
  42. })
  43. }
  44. func GetModelArtsNotebook2(ctx *context.APIContext) {
  45. var (
  46. err error
  47. )
  48. jobID := ctx.Params(":jobid")
  49. repoID := ctx.Repo.Repository.ID
  50. job, err := models.GetRepoCloudBrainByJobID(repoID, jobID)
  51. if err != nil {
  52. ctx.NotFound(err)
  53. return
  54. }
  55. result, err := modelarts.GetNotebook2(jobID)
  56. if err != nil {
  57. ctx.NotFound(err)
  58. return
  59. }
  60. job.Status = result.Status
  61. err = models.UpdateJob(job)
  62. if err != nil {
  63. log.Error("UpdateJob failed:", err)
  64. }
  65. ctx.JSON(http.StatusOK, map[string]interface{}{
  66. "JobID": jobID,
  67. "JobName": job.JobName,
  68. "JobStatus": result.Status,
  69. })
  70. }
  71. func GetModelArtsTrainJob(ctx *context.APIContext) {
  72. var (
  73. err error
  74. )
  75. jobID := ctx.Params(":jobid")
  76. repoID := ctx.Repo.Repository.ID
  77. job, err := models.GetRepoCloudBrainByJobID(repoID, jobID)
  78. if err != nil {
  79. ctx.NotFound(err)
  80. return
  81. }
  82. result, err := modelarts.GetTrainJob(jobID, strconv.FormatInt(job.VersionID, 10))
  83. if err != nil {
  84. ctx.NotFound(err)
  85. return
  86. }
  87. job.Status = modelarts.TransTrainJobStatus(result.IntStatus)
  88. job.Duration = result.Duration
  89. job.TrainJobDuration = result.TrainJobDuration
  90. err = models.UpdateJob(job)
  91. if err != nil {
  92. log.Error("UpdateJob failed:", err)
  93. }
  94. ctx.JSON(http.StatusOK, map[string]interface{}{
  95. "JobID": jobID,
  96. "JobStatus": job.Status,
  97. "JobDuration": job.Duration,
  98. })
  99. }
  100. func GetModelArtsTrainJobVersion(ctx *context.APIContext) {
  101. var (
  102. err error
  103. )
  104. jobID := ctx.Params(":jobid")
  105. versionName := ctx.Query("version_name")
  106. job, err := models.GetCloudbrainByJobIDAndVersionName(jobID, versionName)
  107. if err != nil {
  108. ctx.NotFound(err)
  109. return
  110. }
  111. result, err := modelarts.GetTrainJob(jobID, strconv.FormatInt(job.VersionID, 10))
  112. if err != nil {
  113. ctx.NotFound(err)
  114. return
  115. }
  116. job.Status = modelarts.TransTrainJobStatus(result.IntStatus)
  117. job.Duration = result.Duration
  118. job.TrainJobDuration = result.TrainJobDuration
  119. if result.Duration != 0 {
  120. job.TrainJobDuration = util.AddZero(result.Duration/3600000) + ":" + util.AddZero(result.Duration%3600000/60000) + ":" + util.AddZero(result.Duration%60000/1000)
  121. } else {
  122. job.TrainJobDuration = "00:00:00"
  123. }
  124. err = models.UpdateTrainJobVersion(job)
  125. if err != nil {
  126. log.Error("UpdateJob failed:", err)
  127. }
  128. ctx.JSON(http.StatusOK, map[string]interface{}{
  129. "JobID": jobID,
  130. "JobStatus": job.Status,
  131. "JobDuration": job.TrainJobDuration,
  132. })
  133. }
  134. func TrainJobGetLog(ctx *context.APIContext) {
  135. var (
  136. err error
  137. )
  138. var jobID = ctx.Params(":jobid")
  139. var versionName = ctx.Query("version_name")
  140. var baseLine = ctx.Query("base_line")
  141. var order = ctx.Query("order")
  142. var lines = ctx.Query("lines")
  143. lines_int, err := strconv.Atoi(lines)
  144. if err != nil {
  145. log.Error("change lines(%d) string to int failed", lines_int)
  146. }
  147. if order != modelarts.OrderDesc && order != modelarts.OrderAsc {
  148. log.Error("order(%s) check failed", order)
  149. ctx.JSON(http.StatusBadRequest, map[string]interface{}{
  150. "err_msg": "order check failed",
  151. })
  152. return
  153. }
  154. resultLogFile, result, err := trainJobGetLogContent(jobID, versionName, baseLine, order, lines_int)
  155. if err != nil {
  156. log.Error("trainJobGetLog(%s) failed:%v", jobID, err.Error())
  157. // ctx.RenderWithErr(err.Error(), tplModelArtsTrainJobShow, nil)
  158. return
  159. }
  160. ctx.Data["log_file_name"] = resultLogFile.LogFileList[0]
  161. ctx.JSON(http.StatusOK, map[string]interface{}{
  162. "JobID": jobID,
  163. "LogFileName": resultLogFile.LogFileList[0],
  164. "StartLine": result.StartLine,
  165. "EndLine": result.EndLine,
  166. "Content": result.Content,
  167. "Lines": result.Lines,
  168. })
  169. }
  170. func trainJobGetLogContent(jobID string, versionName string, baseLine string, order string, lines int) (*models.GetTrainJobLogFileNamesResult, *models.GetTrainJobLogResult, error) {
  171. task, err := models.GetCloudbrainByJobIDAndVersionName(jobID, versionName)
  172. if err != nil {
  173. log.Error("GetCloudbrainByJobID(%s) failed:%v", jobID, err.Error())
  174. return nil, nil, err
  175. }
  176. resultLogFile, err := modelarts.GetTrainJobLogFileNames(jobID, strconv.FormatInt(task.VersionID, 10))
  177. if err != nil {
  178. log.Error("GetTrainJobLogFileNames(%s) failed:%v", jobID, err.Error())
  179. return nil, nil, err
  180. }
  181. result, err := modelarts.GetTrainJobLog(jobID, strconv.FormatInt(task.VersionID, 10), baseLine, resultLogFile.LogFileList[0], order, lines)
  182. if err != nil {
  183. log.Error("GetTrainJobLog(%s) failed:%v", jobID, err.Error())
  184. return nil, nil, err
  185. }
  186. return resultLogFile, result, err
  187. }
  188. func DelTrainJobVersion(ctx *context.APIContext) {
  189. var (
  190. err error
  191. )
  192. var jobID = ctx.Params(":jobid")
  193. var versionName = ctx.Query("version_name")
  194. task, err := models.GetCloudbrainByJobIDAndVersionName(jobID, versionName)
  195. if err != nil {
  196. log.Error("GetCloudbrainByJobID(%s) failed:%v", task.JobName, err.Error())
  197. ctx.NotFound(err)
  198. return
  199. }
  200. //删除modelarts上的记录
  201. _, err = modelarts.DelTrainJobVersion(jobID, strconv.FormatInt(task.VersionID, 10))
  202. if err != nil {
  203. log.Error("DelTrainJobVersion(%s) failed:%v", task.JobName, err.Error())
  204. ctx.NotFound(err)
  205. return
  206. }
  207. //删除数据库记录
  208. err = models.DeleteJob(task)
  209. if err != nil {
  210. ctx.ServerError("DeleteJob failed", err)
  211. ctx.NotFound(err)
  212. return
  213. }
  214. //获取删除后的版本数量
  215. var jobTypes []string
  216. jobTypes = append(jobTypes, string(models.JobTypeTrain))
  217. repo := ctx.Repo.Repository
  218. VersionTaskList, VersionListCount, err := models.CloudbrainsVersionList(&models.CloudbrainsOptions{
  219. RepoID: repo.ID,
  220. Type: models.TypeCloudBrainTwo,
  221. JobTypes: jobTypes,
  222. JobID: jobID,
  223. })
  224. if err != nil {
  225. ctx.ServerError("get VersionListCount failed", err)
  226. return
  227. }
  228. if VersionListCount > 0 {
  229. // 判断当前删掉的任务是否是最新版本,若是,将排序后的TotalVersionCount置为删掉的最新版本的TotalVersionCount,若不是,按时间排序后的版本列表的第一个版本设置为最新版本,TotalVersionCount不变
  230. if task.IsLatestVersion == modelarts.IsLatestVersion {
  231. err = models.SetVersionCountAndLatestVersion(jobID, VersionTaskList[0].Cloudbrain.VersionName, VersionListCount, modelarts.IsLatestVersion, task.TotalVersionCount)
  232. if err != nil {
  233. ctx.ServerError("UpdateJobVersionCount failed", err)
  234. return
  235. }
  236. } else {
  237. err = models.SetVersionCountAndLatestVersion(jobID, VersionTaskList[0].VersionName, VersionListCount, modelarts.IsLatestVersion, VersionTaskList[0].Cloudbrain.TotalVersionCount)
  238. if err != nil {
  239. ctx.ServerError("UpdateJobVersionCount failed", err)
  240. return
  241. }
  242. }
  243. } else { //已删除该任务下的所有版本
  244. routerRepo.DeleteJobStorage(task.JobName)
  245. }
  246. ctx.JSON(http.StatusOK, map[string]interface{}{
  247. "JobID": jobID,
  248. "VersionName": versionName,
  249. "StatusOK": 0,
  250. "VersionListCount": VersionListCount,
  251. })
  252. }
  253. func StopTrainJobVersion(ctx *context.APIContext) {
  254. var (
  255. err error
  256. )
  257. var jobID = ctx.Params(":jobid")
  258. var versionName = ctx.Query("version_name")
  259. task, err := models.GetCloudbrainByJobIDAndVersionName(jobID, versionName)
  260. if err != nil {
  261. log.Error("GetCloudbrainByJobID(%s) failed:%v", task.JobName, err.Error())
  262. return
  263. }
  264. _, err = modelarts.StopTrainJob(jobID, strconv.FormatInt(task.VersionID, 10))
  265. if err != nil {
  266. log.Error("StopTrainJob(%s) failed:%v", task.JobName, err.Error())
  267. return
  268. }
  269. ctx.JSON(http.StatusOK, map[string]interface{}{
  270. "JobID": jobID,
  271. "VersionName": versionName,
  272. "StatusOK": 0,
  273. })
  274. }
  275. func ModelList(ctx *context.APIContext) {
  276. var (
  277. err error
  278. )
  279. var jobID = ctx.Params(":jobid")
  280. var versionName = ctx.Query("version_name")
  281. parentDir := ctx.Query("parentDir")
  282. dirArray := strings.Split(parentDir, "/")
  283. task, err := models.GetCloudbrainByJobIDAndVersionName(jobID, versionName)
  284. if err != nil {
  285. log.Error("GetCloudbrainByJobID(%s) failed:%v", task.JobName, err.Error())
  286. return
  287. }
  288. models, err := storage.GetObsListObject(task.JobName, "output/", parentDir, versionName)
  289. if err != nil {
  290. log.Info("get TrainJobListModel failed:", err)
  291. ctx.ServerError("GetObsListObject:", err)
  292. return
  293. }
  294. ctx.JSON(http.StatusOK, map[string]interface{}{
  295. "JobID": jobID,
  296. "VersionName": versionName,
  297. "StatusOK": 0,
  298. "Path": dirArray,
  299. "Dirs": models,
  300. "task": task,
  301. "PageIsCloudBrain": true,
  302. })
  303. }
  304. func GetModelArtsInferenceJob(ctx *context.APIContext) {
  305. var (
  306. err error
  307. )
  308. jobID := ctx.Params(":jobid")
  309. job, err := models.GetCloudbrainByJobID(jobID)
  310. if err != nil {
  311. ctx.NotFound(err)
  312. return
  313. }
  314. result, err := modelarts.GetTrainJob(jobID, strconv.FormatInt(job.VersionID, 10))
  315. if err != nil {
  316. ctx.NotFound(err)
  317. return
  318. }
  319. job.Status = modelarts.TransTrainJobStatus(result.IntStatus)
  320. job.Duration = result.Duration
  321. job.TrainJobDuration = result.TrainJobDuration
  322. if result.Duration != 0 {
  323. job.TrainJobDuration = util.AddZero(result.Duration/3600000) + ":" + util.AddZero(result.Duration%3600000/60000) + ":" + util.AddZero(result.Duration%60000/1000)
  324. } else {
  325. job.TrainJobDuration = "00:00:00"
  326. }
  327. err = models.UpdateInferenceJob(job)
  328. if err != nil {
  329. log.Error("UpdateJob failed:", err)
  330. }
  331. ctx.JSON(http.StatusOK, map[string]interface{}{
  332. "JobID": jobID,
  333. "JobStatus": job.Status,
  334. "JobDuration": job.TrainJobDuration,
  335. })
  336. }
  337. func ResultList(ctx *context.APIContext) {
  338. var (
  339. err error
  340. )
  341. var jobID = ctx.Params(":jobid")
  342. var versionName = ctx.Query("version_name")
  343. parentDir := ctx.Query("parentDir")
  344. dirArray := strings.Split(parentDir, "/")
  345. task, err := models.GetCloudbrainByJobIDAndVersionName(jobID, versionName)
  346. if err != nil {
  347. log.Error("GetCloudbrainByJobID(%s) failed:%v", task.JobName, err.Error())
  348. return
  349. }
  350. models, err := storage.GetObsListObject(task.JobName, "result/", parentDir, versionName)
  351. if err != nil {
  352. log.Info("get TrainJobListModel failed:", err)
  353. ctx.ServerError("GetObsListObject:", err)
  354. return
  355. }
  356. ctx.JSON(http.StatusOK, map[string]interface{}{
  357. "JobID": jobID,
  358. "VersionName": versionName,
  359. "StatusOK": 0,
  360. "Path": dirArray,
  361. "Dirs": models,
  362. "task": task,
  363. "PageIsCloudBrain": true,
  364. })
  365. }