You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number, can include dashes ('-'), and can be up to 35 characters long.

resource_specification.go 16 kB

2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago

  1. package models
  2. import (
  3. "code.gitea.io/gitea/modules/timeutil"
  4. "fmt"
  5. "xorm.io/builder"
  6. )
  // Status values stored in ResourceSpecification.Status. Numbering starts at 1,
  // so the zero value of an int field matches none of them.
  const (
  	// SpecNotVerified is the first status value.
  	SpecNotVerified int = 1
  	// SpecOnShelf is the status written by ResourceSpecOnShelf.
  	SpecOnShelf int = 2
  	// SpecOffShelf is the status written by ResourceSpecOffShelf and by
  	// SyncGrampusSpecs for specs that no longer exist.
  	SpecOffShelf int = 3
  )
  // SearchSpecOrderBy selects the ORDER BY clause used by
  // SearchResourceSpecification.
  type SearchSpecOrderBy int

  const (
  	// SearchSpecOrderById is the zero value; results are ordered by
  	// resource_specification.id descending.
  	SearchSpecOrderById SearchSpecOrderBy = 0
  	// SearchSpecOrder4Standard orders by compute resource, card type, card
  	// count, CPU cores, memory and shared memory, all ascending.
  	SearchSpecOrder4Standard SearchSpecOrderBy = 1
  )
  17. type ResourceSpecification struct {
  18. ID int64 `xorm:"pk autoincr"`
  19. QueueId int64 `xorm:"INDEX"`
  20. SourceSpecId string `xorm:"INDEX"`
  21. AccCardsNum int
  22. CpuCores int
  23. MemGiB float32
  24. GPUMemGiB float32
  25. ShareMemGiB float32
  26. UnitPrice int
  27. Status int
  28. IsAvailable bool
  29. IsAutomaticSync bool
  30. CreatedTime timeutil.TimeStamp `xorm:"created"`
  31. CreatedBy int64
  32. UpdatedTime timeutil.TimeStamp `xorm:"updated"`
  33. UpdatedBy int64
  34. }
  35. func (r ResourceSpecification) ConvertToRes() *ResourceSpecificationRes {
  36. return &ResourceSpecificationRes{
  37. ID: r.ID,
  38. SourceSpecId: r.SourceSpecId,
  39. AccCardsNum: r.AccCardsNum,
  40. CpuCores: r.CpuCores,
  41. MemGiB: r.MemGiB,
  42. ShareMemGiB: r.ShareMemGiB,
  43. GPUMemGiB: r.GPUMemGiB,
  44. UnitPrice: r.UnitPrice,
  45. Status: r.Status,
  46. IsAvailable: r.IsAvailable,
  47. UpdatedTime: r.UpdatedTime,
  48. }
  49. }
  // ResourceSpecificationReq is the request payload describing a resource
  // specification; ToDTO turns it into a ResourceSpecification.
  type ResourceSpecificationReq struct {
  	// QueueId is mandatory (binding rule "Required").
  	QueueId      int64 `binding:"Required"`
  	SourceSpecId string

  	AccCardsNum, CpuCores         int
  	MemGiB, GPUMemGiB, ShareMemGiB float32

  	UnitPrice, Status int
  	IsAutomaticSync   bool

  	// CreatorId is copied to both CreatedBy and UpdatedBy by ToDTO.
  	CreatorId int64
  }
  63. func (r ResourceSpecificationReq) ToDTO() ResourceSpecification {
  64. return ResourceSpecification{
  65. QueueId: r.QueueId,
  66. SourceSpecId: r.SourceSpecId,
  67. AccCardsNum: r.AccCardsNum,
  68. CpuCores: r.CpuCores,
  69. MemGiB: r.MemGiB,
  70. GPUMemGiB: r.GPUMemGiB,
  71. ShareMemGiB: r.ShareMemGiB,
  72. UnitPrice: r.UnitPrice,
  73. Status: r.Status,
  74. IsAutomaticSync: r.IsAutomaticSync,
  75. CreatedBy: r.CreatorId,
  76. UpdatedBy: r.CreatorId,
  77. IsAvailable: true,
  78. }
  79. }
  80. type SearchResourceSpecificationOptions struct {
  81. ListOptions
  82. QueueId int64
  83. Status int
  84. Cluster string
  85. AvailableCode int
  86. OrderBy SearchSpecOrderBy
  87. }
  // SearchResourceBriefSpecificationOptions holds a queue id and a cluster name.
  // NOTE(review): no consumer of this type is visible in this part of the
  // file; presumably it filters a brief spec listing — confirm against callers.
  type SearchResourceBriefSpecificationOptions struct {
  	QueueId int64
  	Cluster string
  }
  92. type ResourceSpecAndQueueListRes struct {
  93. TotalSize int64
  94. List []*ResourceSpecAndQueueRes
  95. }
  96. func NewResourceSpecAndQueueListRes(totalSize int64, list []ResourceSpecAndQueue) *ResourceSpecAndQueueListRes {
  97. resList := make([]*ResourceSpecAndQueueRes, len(list))
  98. for i, v := range list {
  99. resList[i] = v.ConvertToRes()
  100. }
  101. return &ResourceSpecAndQueueListRes{
  102. TotalSize: totalSize,
  103. List: resList,
  104. }
  105. }
  106. type ResourceSpecificationRes struct {
  107. ID int64
  108. SourceSpecId string
  109. AccCardsNum int
  110. CpuCores int
  111. MemGiB float32
  112. GPUMemGiB float32
  113. ShareMemGiB float32
  114. UnitPrice int
  115. Status int
  116. IsAvailable bool
  117. UpdatedTime timeutil.TimeStamp
  118. }
  119. func (ResourceSpecificationRes) TableName() string {
  120. return "resource_specification"
  121. }
  122. type ResourceSpecAndQueueRes struct {
  123. Spec *ResourceSpecificationRes
  124. Queue *ResourceQueueRes
  125. }
  126. type ResourceSpecAndQueue struct {
  127. ResourceSpecification `xorm:"extends"`
  128. ResourceQueue `xorm:"extends"`
  129. }
  130. func (*ResourceSpecAndQueue) TableName() string {
  131. return "resource_specification"
  132. }
  133. func (r ResourceSpecAndQueue) ConvertToRes() *ResourceSpecAndQueueRes {
  134. return &ResourceSpecAndQueueRes{
  135. Spec: r.ResourceSpecification.ConvertToRes(),
  136. Queue: r.ResourceQueue.ConvertToRes(),
  137. }
  138. }
  139. type FindSpecsOptions struct {
  140. JobType JobType
  141. ComputeResource string
  142. Cluster string
  143. AiCenterCode string
  144. SpecId int64
  145. QueueCode string
  146. SourceSpecId string
  147. AccCardsNum int
  148. UseAccCardsNum bool
  149. AccCardType string
  150. CpuCores int
  151. UseCpuCores bool
  152. MemGiB float32
  153. UseMemGiB bool
  154. GPUMemGiB float32
  155. UseGPUMemGiB bool
  156. ShareMemGiB float32
  157. UseShareMemGiB bool
  158. //if true,find specs no matter used or not used in scene. if false,only find specs used in scene
  159. RequestAll bool
  160. SpecStatus int
  161. }
  // Specification is a flattened read model combining columns of a resource
  // specification with columns of its queue. It is filled by the joined
  // queries in this file and by BuildSpecification.
  type Specification struct {
  	ID           int64
  	SourceSpecId string
  	AccCardsNum  int
  	AccCardType  string
  	CpuCores     int

  	MemGiB, GPUMemGiB, ShareMemGiB float32

  	ComputeResource string
  	UnitPrice       int
  	QueueId         int64

  	QueueCode, Cluster, AiCenterCode, AiCenterName string

  	// IsExclusive and ExclusiveOrg are not set by BuildSpecification.
  	IsExclusive  bool
  	ExclusiveOrg string
  }
  181. func (Specification) TableName() string {
  182. return "resource_specification"
  183. }
  184. func InsertResourceSpecification(r ResourceSpecification) (int64, error) {
  185. return x.Insert(&r)
  186. }
  187. func UpdateResourceSpecificationById(queueId int64, spec ResourceSpecification) (int64, error) {
  188. return x.ID(queueId).Update(&spec)
  189. }
  190. func UpdateSpecUnitPriceById(id int64, unitPrice int) error {
  191. _, err := x.Exec("update resource_specification set unit_price = ? ,updated_time = ? where id = ?", unitPrice, timeutil.TimeStampNow(), id)
  192. return err
  193. }
  194. func SearchResourceSpecification(opts SearchResourceSpecificationOptions) (int64, []ResourceSpecAndQueue, error) {
  195. var cond = builder.NewCond()
  196. if opts.Page <= 0 {
  197. opts.Page = 1
  198. }
  199. if opts.QueueId > 0 {
  200. cond = cond.And(builder.Eq{"resource_specification.queue_id": opts.QueueId})
  201. }
  202. if opts.Status > 0 {
  203. cond = cond.And(builder.Eq{"resource_specification.status": opts.Status})
  204. }
  205. if opts.Cluster != "" {
  206. cond = cond.And(builder.Eq{"resource_queue.cluster": opts.Cluster})
  207. }
  208. if opts.AvailableCode == 1 {
  209. cond = cond.And(builder.Eq{"resource_specification.is_available": true})
  210. } else if opts.AvailableCode == 2 {
  211. cond = cond.And(builder.Eq{"resource_specification.is_available": false})
  212. }
  213. //cond = cond.And(builder.Or(builder.Eq{"resource_queue.deleted_time": 0}).Or(builder.IsNull{"resource_queue.deleted_time"}))
  214. n, err := x.Where(cond).Join("INNER", "resource_queue", "resource_queue.ID = resource_specification.queue_id").
  215. Unscoped().Count(&ResourceSpecAndQueue{})
  216. if err != nil {
  217. return 0, nil, err
  218. }
  219. var orderby = ""
  220. switch opts.OrderBy {
  221. case SearchSpecOrder4Standard:
  222. orderby = "resource_queue.compute_resource asc,resource_queue.acc_card_type asc,resource_specification.acc_cards_num asc,resource_specification.cpu_cores asc,resource_specification.mem_gi_b asc,resource_specification.share_mem_gi_b asc"
  223. default:
  224. orderby = "resource_specification.id desc"
  225. }
  226. r := make([]ResourceSpecAndQueue, 0)
  227. err = x.Where(cond).
  228. Join("INNER", "resource_queue", "resource_queue.ID = resource_specification.queue_id").
  229. OrderBy(orderby).
  230. Limit(opts.PageSize, (opts.Page-1)*opts.PageSize).
  231. Unscoped().Find(&r)
  232. if err != nil {
  233. return 0, nil, err
  234. }
  235. return n, r, nil
  236. }
  237. func GetSpecScenes(specId int64) ([]ResourceSceneBriefRes, error) {
  238. r := make([]ResourceSceneBriefRes, 0)
  239. err := x.Where("resource_scene_spec.spec_id = ?", specId).
  240. Join("INNER", "resource_scene_spec", "resource_scene_spec.scene_id = resource_scene.id").
  241. Find(&r)
  242. if err != nil {
  243. return nil, err
  244. }
  245. return r, nil
  246. }
  247. func ResourceSpecOnShelf(id int64, unitPrice int) error {
  248. _, err := x.Exec("update resource_specification set unit_price = ?,updated_time = ?,status = ? where id = ?", unitPrice, timeutil.TimeStampNow(), SpecOnShelf, id)
  249. return err
  250. }
  251. func ResourceSpecOffShelf(id int64) (int64, error) {
  252. sess := x.NewSession()
  253. var err error
  254. defer func() {
  255. if err != nil {
  256. sess.Rollback()
  257. }
  258. sess.Close()
  259. }()
  260. param := ResourceSpecification{
  261. Status: SpecOffShelf,
  262. }
  263. n, err := sess.Where("id = ? and status = ?", id, SpecOnShelf).Update(&param)
  264. if err != nil {
  265. return 0, err
  266. }
  267. sess.Commit()
  268. return n, err
  269. }
  270. func GetResourceSpecificationByIds(ids []int64) ([]*Specification, error) {
  271. r := make([]*Specification, 0)
  272. err := x.In("resource_specification.id", ids).
  273. Join("INNER", "resource_queue", "resource_queue.id = resource_specification.queue_id").
  274. Find(&r)
  275. return r, err
  276. }
  277. func GetResourceSpecification(r *ResourceSpecification) (*ResourceSpecification, error) {
  278. has, err := x.Get(r)
  279. if err != nil {
  280. return nil, err
  281. } else if !has {
  282. return nil, nil
  283. }
  284. return r, nil
  285. }
  286. func SyncGrampusSpecs(updateList []ResourceSpecification, insertList []ResourceSpecification, existIds []int64) error {
  287. sess := x.NewSession()
  288. var err error
  289. defer func() {
  290. if err != nil {
  291. sess.Rollback()
  292. }
  293. sess.Close()
  294. }()
  295. //delete specs and scene that no longer exists
  296. deleteIds := make([]int64, 0)
  297. cond := builder.NewCond()
  298. cond = cond.And(builder.NotIn("resource_specification.id", existIds)).And(builder.Eq{"resource_queue.cluster": C2NetCluster})
  299. if err := sess.Cols("resource_specification.id").Table("resource_specification").
  300. Where(cond).Join("INNER", "resource_queue", "resource_queue.id = resource_specification.queue_id").
  301. Find(&deleteIds); err != nil {
  302. return err
  303. }
  304. if len(deleteIds) > 0 {
  305. if _, err = sess.Cols("status", "is_available").In("id", deleteIds).Update(&ResourceSpecification{Status: SpecOffShelf, IsAvailable: false}); err != nil {
  306. return err
  307. }
  308. }
  309. //update exists specs
  310. if len(updateList) > 0 {
  311. for _, v := range updateList {
  312. if _, err = sess.ID(v.ID).UseBool("is_available").Update(&v); err != nil {
  313. return err
  314. }
  315. }
  316. }
  317. //insert new specs
  318. if len(insertList) > 0 {
  319. if _, err = sess.Insert(insertList); err != nil {
  320. return err
  321. }
  322. }
  323. return sess.Commit()
  324. }
  325. //FindSpecs
  326. func FindSpecs(opts FindSpecsOptions) ([]*Specification, error) {
  327. var cond = builder.NewCond()
  328. if !opts.RequestAll && opts.JobType != "" {
  329. cond = cond.And(builder.Eq{"resource_scene.job_type": opts.JobType})
  330. }
  331. if opts.ComputeResource != "" {
  332. cond = cond.And(builder.Eq{"resource_queue.compute_resource": opts.ComputeResource})
  333. }
  334. if opts.Cluster != "" {
  335. cond = cond.And(builder.Eq{"resource_queue.cluster": opts.Cluster})
  336. }
  337. if opts.AiCenterCode != "" {
  338. cond = cond.And(builder.Eq{"resource_queue.ai_center_code": opts.AiCenterCode})
  339. }
  340. if opts.SpecId > 0 {
  341. cond = cond.And(builder.Eq{"resource_specification.id": opts.SpecId})
  342. }
  343. if opts.QueueCode != "" {
  344. cond = cond.And(builder.Eq{"resource_queue.queue_code": opts.QueueCode})
  345. }
  346. if opts.SourceSpecId != "" {
  347. cond = cond.And(builder.Eq{"resource_specification.source_spec_id": opts.SourceSpecId})
  348. }
  349. if opts.UseAccCardsNum {
  350. cond = cond.And(builder.Eq{"resource_specification.acc_cards_num": opts.AccCardsNum})
  351. }
  352. if opts.AccCardType != "" {
  353. cond = cond.And(builder.Eq{"resource_queue.acc_card_type": opts.AccCardType})
  354. }
  355. if opts.UseCpuCores {
  356. cond = cond.And(builder.Eq{"resource_specification.cpu_cores": opts.CpuCores})
  357. }
  358. if opts.UseMemGiB {
  359. cond = cond.And(builder.Eq{"resource_specification.mem_gi_b": opts.MemGiB})
  360. }
  361. if opts.UseGPUMemGiB {
  362. cond = cond.And(builder.Eq{"resource_specification.gpu_mem_gi_b": opts.GPUMemGiB})
  363. }
  364. if opts.UseShareMemGiB {
  365. cond = cond.And(builder.Eq{"resource_specification.share_mem_gi_b": opts.ShareMemGiB})
  366. }
  367. if opts.SpecStatus > 0 {
  368. cond = cond.And(builder.Eq{"resource_specification.status": opts.SpecStatus})
  369. }
  370. r := make([]*Specification, 0)
  371. s := x.Where(cond).
  372. Join("INNER", "resource_queue", "resource_queue.id = resource_specification.queue_id")
  373. if !opts.RequestAll {
  374. s = s.Join("INNER", "resource_scene_spec", "resource_scene_spec.spec_id = resource_specification.id").
  375. Join("INNER", "resource_scene", "resource_scene_spec.scene_id = resource_scene.id")
  376. }
  377. err := s.OrderBy("resource_queue.compute_resource asc,resource_queue.acc_card_type asc,resource_specification.acc_cards_num asc,resource_specification.cpu_cores asc,resource_specification.mem_gi_b asc,resource_specification.share_mem_gi_b asc").
  378. Unscoped().Find(&r)
  379. if err != nil {
  380. return nil, err
  381. }
  382. return r, nil
  383. }
  384. func InitQueueAndSpec(queue ResourceQueue, spec ResourceSpecification) (*Specification, error) {
  385. sess := x.NewSession()
  386. defer sess.Close()
  387. sess.Begin()
  388. param := ResourceQueue{
  389. QueueCode: queue.QueueCode,
  390. Cluster: queue.Cluster,
  391. AiCenterCode: queue.AiCenterCode,
  392. ComputeResource: queue.ComputeResource,
  393. AccCardType: queue.AccCardType,
  394. }
  395. _, err := sess.Get(&param)
  396. if err != nil {
  397. sess.Rollback()
  398. return nil, err
  399. }
  400. if param.ID == 0 {
  401. _, err = sess.InsertOne(&queue)
  402. if err != nil {
  403. sess.Rollback()
  404. return nil, err
  405. }
  406. } else {
  407. queue = param
  408. }
  409. spec.QueueId = queue.ID
  410. _, err = sess.InsertOne(&spec)
  411. if err != nil {
  412. sess.Rollback()
  413. return nil, err
  414. }
  415. sess.Commit()
  416. return BuildSpecification(queue, spec), nil
  417. }
  418. func BuildSpecification(queue ResourceQueue, spec ResourceSpecification) *Specification {
  419. return &Specification{
  420. ID: spec.ID,
  421. SourceSpecId: spec.SourceSpecId,
  422. AccCardsNum: spec.AccCardsNum,
  423. AccCardType: queue.AccCardType,
  424. CpuCores: spec.CpuCores,
  425. MemGiB: spec.MemGiB,
  426. GPUMemGiB: spec.GPUMemGiB,
  427. ShareMemGiB: spec.ShareMemGiB,
  428. ComputeResource: queue.ComputeResource,
  429. UnitPrice: spec.UnitPrice,
  430. QueueId: queue.ID,
  431. QueueCode: queue.QueueCode,
  432. Cluster: queue.Cluster,
  433. AiCenterCode: queue.AiCenterCode,
  434. AiCenterName: queue.AiCenterName,
  435. }
  436. }
  // GetCloudbrainOneAccCardType maps a queue code to its accelerator card type:
  // "a100" -> "A100", "openidebug" -> "T4", "openidgx" -> "V100". The match is
  // case-sensitive; any other code yields the empty string.
  func GetCloudbrainOneAccCardType(queueCode string) string {
  	cardType := ""
  	switch queueCode {
  	case "a100":
  		cardType = "A100"
  	case "openidebug":
  		cardType = "T4"
  	case "openidgx":
  		cardType = "V100"
  	}
  	return cardType
  }
  448. var cloudbrainTwoSpecsInitFlag = false
  449. var cloudbrainTwoSpecs map[string]*Specification
  450. func GetCloudbrainTwoSpecs() (map[string]*Specification, error) {
  451. if !cloudbrainTwoSpecsInitFlag {
  452. r, err := InitCloudbrainTwoSpecs()
  453. if err != nil {
  454. return nil, err
  455. }
  456. cloudbrainTwoSpecsInitFlag = true
  457. cloudbrainTwoSpecs = r
  458. }
  459. return cloudbrainTwoSpecs, nil
  460. }
  461. func InitCloudbrainTwoSpecs() (map[string]*Specification, error) {
  462. r := make(map[string]*Specification, 0)
  463. queue, err := GetResourceQueue(&ResourceQueue{QueueCode: "openisupport"})
  464. if err != nil {
  465. return nil, err
  466. }
  467. if queue == nil {
  468. queue = &ResourceQueue{
  469. QueueCode: "openisupport",
  470. Cluster: OpenICluster,
  471. AiCenterCode: AICenterOfCloudBrainTwo,
  472. AiCenterName: "云脑二",
  473. ComputeResource: NPU,
  474. AccCardType: "ASCEND910",
  475. Remark: "处理历史云脑任务时自动生成",
  476. }
  477. _, err = x.InsertOne(queue)
  478. if err != nil {
  479. return nil, err
  480. }
  481. }
  482. for i := 1; i <= 8; i = i * 2 {
  483. sourceSpecId := "modelarts.bm.910.arm.public." + fmt.Sprint(i)
  484. spec, err := GetResourceSpecification(&ResourceSpecification{
  485. SourceSpecId: sourceSpecId,
  486. QueueId: queue.ID,
  487. })
  488. if err != nil {
  489. return nil, err
  490. }
  491. if spec == nil {
  492. spec = &ResourceSpecification{
  493. QueueId: queue.ID,
  494. SourceSpecId: sourceSpecId,
  495. AccCardsNum: i,
  496. CpuCores: i * 24,
  497. MemGiB: float32(i * 256),
  498. GPUMemGiB: float32(32),
  499. Status: SpecOffShelf,
  500. IsAvailable: true,
  501. }
  502. _, err = x.Insert(spec)
  503. if err != nil {
  504. return nil, err
  505. }
  506. }
  507. r[sourceSpecId] = BuildSpecification(*queue, *spec)
  508. }
  509. return r, nil
  510. }
  511. var grampusSpecsInitFlag = false
  512. var grampusSpecs map[string]*Specification
  513. func GetGrampusSpecs() (map[string]*Specification, error) {
  514. if !grampusSpecsInitFlag {
  515. specMap := make(map[string]*Specification, 0)
  516. r, err := FindSpecs(FindSpecsOptions{
  517. Cluster: C2NetCluster,
  518. RequestAll: true,
  519. })
  520. if err != nil {
  521. return nil, err
  522. }
  523. for _, spec := range r {
  524. specMap[spec.SourceSpecId] = spec
  525. specMap[spec.SourceSpecId+"_"+spec.AiCenterCode] = spec
  526. }
  527. grampusSpecsInitFlag = true
  528. grampusSpecs = specMap
  529. }
  530. return grampusSpecs, nil
  531. }