You can not select more than 25 topics Topics must start with a chinese character,a letter or number, can include dashes ('-') and can be up to 35 characters long.

resty.go 36 kB

4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
3 years ago
3 years ago
3 years ago
3 years ago
3 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
3 years ago
3 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
3 years ago
3 years ago
3 years ago
3 years ago
3 years ago
3 years ago
3 years ago
3 years ago
3 years ago
3 years ago
3 years ago
3 years ago
3 years ago
3 years ago
3 years ago
3 years ago
12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086108710881089109010911092109310941095109610971098109911001101110211031104110511061107110811091110111111121113111411151116111711181119112011211122112311241125112611271128112911301131113211331134113511361137113811391140114111421143114411451146114711481149115011511152115311541155115611571158115911601161116211631164116511661167116811691170117111721173117411751176117711781179118011811182118311841185118611871188118911901191119211931194119511961197119811991200120112021203120412051206120712081209121012111212121312141215121612171218
  1. package modelarts
  2. import (
  3. "crypto/tls"
  4. "encoding/json"
  5. "fmt"
  6. "net/http"
  7. "strconv"
  8. "code.gitea.io/gitea/models"
  9. "code.gitea.io/gitea/modules/log"
  10. "code.gitea.io/gitea/modules/setting"
  11. "github.com/go-resty/resty/v2"
  12. )
  13. var (
  14. restyClient *resty.Client
  15. HOST string
  16. TOKEN string
  17. )
  const (
  	// methodPassword is the single entry of Identity.Methods sent by getToken.
  	methodPassword = "password"

  	// Error codes compared against the ErrorCode field of decoded responses.
  	// errorCodeExceedLimit is checked by CreateJob and modelartsIllegalToken by the
  	// notebook 2.0 helpers; the exported Notebook* codes are not referenced in this
  	// part of the file.
  	errorCodeExceedLimit  = "ModelArts.0118"
  	modelartsIllegalToken = "ModelArts.6401"
  	NotebookNotFound      = "ModelArts.6404"
  	NotebookNoPermission  = "ModelArts.6407"
  	NotebookInvalid       = "ModelArts.6400"

  	// urlGetToken is appended to setting.IamHost when requesting a token.
  	urlGetToken = "/v3/auth/tokens"

  	// Paths appended to HOST + "/v1/" + setting.ProjectID.
  	urlNotebook       = "/demanager/instances"
  	urlNotebook2      = "/notebooks" // notebook 2.0
  	urlTrainJob       = "/training-jobs"
  	urlTrainJobConfig = "/training-job-configs"
  	urlResourceSpecs  = "/job/resource-specs"
  )
  34. func getRestyClient() *resty.Client {
  35. if restyClient == nil {
  36. restyClient = resty.New()
  37. restyClient.SetTLSClientConfig(&tls.Config{InsecureSkipVerify: true})
  38. }
  39. return restyClient
  40. }
  41. func checkSetting() {
  42. if len(HOST) != 0 && len(TOKEN) != 0 && restyClient != nil {
  43. return
  44. }
  45. err := getToken()
  46. if err != nil {
  47. log.Error("getToken failed:%v", err)
  48. }
  49. }
  50. func getToken() error {
  51. HOST = setting.ModelArtsHost
  52. client := getRestyClient()
  53. params := models.GetTokenParams{
  54. Auth: models.Auth{
  55. Identity: models.Identity{
  56. Methods: []string{methodPassword},
  57. Password: models.Password{
  58. User: models.NotebookUser{
  59. Name: setting.ModelArtsUsername,
  60. Password: setting.ModelArtsPassword,
  61. Domain: models.Domain{
  62. Name: setting.ModelArtsDomain,
  63. },
  64. },
  65. },
  66. },
  67. Scope: models.Scope{
  68. Project: models.Project{
  69. Name: setting.ProjectName,
  70. },
  71. },
  72. },
  73. }
  74. res, err := client.R().
  75. SetHeader("Content-Type", "application/json").
  76. SetBody(params).
  77. Post(setting.IamHost + urlGetToken)
  78. if err != nil {
  79. return fmt.Errorf("resty getToken: %v", err)
  80. }
  81. if res.StatusCode() != http.StatusCreated {
  82. return fmt.Errorf("getToken failed:%s", res.String())
  83. }
  84. TOKEN = res.Header().Get("X-Subject-Token")
  85. return nil
  86. }
  87. func CreateJob(createJobParams models.CreateNotebookParams) (*models.CreateNotebookResult, error) {
  88. checkSetting()
  89. client := getRestyClient()
  90. var result models.CreateNotebookResult
  91. retry := 0
  92. sendjob:
  93. res, err := client.R().
  94. SetHeader("Content-Type", "application/json").
  95. SetAuthToken(TOKEN).
  96. SetBody(createJobParams).
  97. SetResult(&result).
  98. Post(HOST + "/v1/" + setting.ProjectID + urlNotebook)
  99. if err != nil {
  100. return nil, fmt.Errorf("resty create notebook: %s", err)
  101. }
  102. if res.StatusCode() == http.StatusUnauthorized && retry < 1 {
  103. retry++
  104. _ = getToken()
  105. goto sendjob
  106. }
  107. var response models.NotebookResult
  108. err = json.Unmarshal(res.Body(), &response)
  109. if err != nil {
  110. log.Error("json.Unmarshal failed: %s", err.Error())
  111. return &result, fmt.Errorf("son.Unmarshal failed: %s", err.Error())
  112. }
  113. if len(response.ErrorCode) != 0 {
  114. log.Error("createNotebook failed(%s): %s", response.ErrorCode, response.ErrorMsg)
  115. if response.ErrorCode == errorCodeExceedLimit {
  116. response.ErrorMsg = "所选规格使用数量已超过最大配额限制。"
  117. }
  118. return &result, fmt.Errorf("createNotebook failed(%s): %s", response.ErrorCode, response.ErrorMsg)
  119. }
  120. return &result, nil
  121. }
  122. func GetJob(jobID string) (*models.GetNotebookResult, error) {
  123. checkSetting()
  124. client := getRestyClient()
  125. var result models.GetNotebookResult
  126. retry := 0
  127. sendjob:
  128. res, err := client.R().
  129. SetHeader("Content-Type", "application/json").
  130. SetAuthToken(TOKEN).
  131. SetResult(&result).
  132. Get(HOST + "/v1/" + setting.ProjectID + urlNotebook + "/" + jobID)
  133. if err != nil {
  134. return nil, fmt.Errorf("resty GetJob: %v", err)
  135. }
  136. if res.StatusCode() == http.StatusUnauthorized && retry < 1 {
  137. retry++
  138. _ = getToken()
  139. goto sendjob
  140. }
  141. var response models.NotebookResult
  142. err = json.Unmarshal(res.Body(), &response)
  143. if err != nil {
  144. log.Error("json.Unmarshal failed: %s", err.Error())
  145. return &result, fmt.Errorf("son.Unmarshal failed: %s", err.Error())
  146. }
  147. if len(response.ErrorCode) != 0 {
  148. log.Error("GetJob failed(%s): %s", response.ErrorCode, response.ErrorMsg)
  149. return &result, fmt.Errorf("GetJob failed(%s): %s", response.ErrorCode, response.ErrorMsg)
  150. }
  151. return &result, nil
  152. }
  153. func GetNotebook2(jobID string) (*models.GetNotebook2Result, error) {
  154. checkSetting()
  155. client := getRestyClient()
  156. var result models.GetNotebook2Result
  157. retry := 0
  158. sendjob:
  159. res, err := client.R().
  160. SetHeader("Content-Type", "application/json").
  161. SetAuthToken(TOKEN).
  162. SetResult(&result).
  163. Get(HOST + "/v1/" + setting.ProjectID + urlNotebook2 + "/" + jobID)
  164. if err != nil {
  165. return nil, fmt.Errorf("resty GetJob: %v", err)
  166. }
  167. if res.StatusCode() == http.StatusUnauthorized && retry < 1 {
  168. retry++
  169. _ = getToken()
  170. goto sendjob
  171. }
  172. var response models.NotebookResult
  173. err = json.Unmarshal(res.Body(), &response)
  174. if err != nil {
  175. log.Error("json.Unmarshal failed: %s", err.Error())
  176. return &result, fmt.Errorf("son.Unmarshal failed: %s", err.Error())
  177. }
  178. if len(response.ErrorCode) != 0 {
  179. log.Error("GetJob failed(%s): %s", response.ErrorCode, response.ErrorMsg)
  180. if response.ErrorCode == modelartsIllegalToken && retry < 1 {
  181. retry++
  182. _ = getToken()
  183. goto sendjob
  184. }
  185. return &result, fmt.Errorf("GetJob failed(%s): %s", response.ErrorCode, response.ErrorMsg)
  186. }
  187. return &result, nil
  188. }
  189. func ManageNotebook(jobID string, param models.NotebookAction) (*models.NotebookActionResult, error) {
  190. checkSetting()
  191. client := getRestyClient()
  192. var result models.NotebookActionResult
  193. retry := 0
  194. sendjob:
  195. res, err := client.R().
  196. SetHeader("Content-Type", "application/json").
  197. SetBody(param).
  198. SetAuthToken(TOKEN).
  199. SetResult(&result).
  200. Post(HOST + "/v1/" + setting.ProjectID + urlNotebook + "/" + jobID + "/action")
  201. if err != nil {
  202. return &result, fmt.Errorf("resty StopJob: %v", err)
  203. }
  204. if res.StatusCode() == http.StatusUnauthorized && retry < 1 {
  205. retry++
  206. _ = getToken()
  207. goto sendjob
  208. }
  209. var response models.NotebookResult
  210. err = json.Unmarshal(res.Body(), &response)
  211. if err != nil {
  212. log.Error("json.Unmarshal failed: %s", err.Error())
  213. return &result, fmt.Errorf("son.Unmarshal failed: %s", err.Error())
  214. }
  215. if len(response.ErrorCode) != 0 {
  216. log.Error("ManageNotebook failed(%s): %s", response.ErrorCode, response.ErrorMsg)
  217. return &result, fmt.Errorf("ManageNotebook failed(%s): %s", response.ErrorCode, response.ErrorMsg)
  218. }
  219. return &result, nil
  220. }
  221. func ManageNotebook2(jobID string, param models.NotebookAction) (*models.NotebookActionResult, error) {
  222. checkSetting()
  223. client := getRestyClient()
  224. var result models.NotebookActionResult
  225. retry := 0
  226. sendjob:
  227. res, err := client.R().
  228. SetHeader("Content-Type", "application/json").
  229. SetAuthToken(TOKEN).
  230. SetResult(&result).
  231. Post(HOST + "/v1/" + setting.ProjectID + urlNotebook2 + "/" + jobID + "/" + param.Action + "?duration=" + strconv.Itoa(autoStopDurationMs))
  232. if err != nil {
  233. return &result, fmt.Errorf("resty ManageNotebook2: %v", err)
  234. }
  235. if res.StatusCode() == http.StatusUnauthorized && retry < 1 {
  236. retry++
  237. _ = getToken()
  238. goto sendjob
  239. }
  240. var response models.NotebookResult
  241. err = json.Unmarshal(res.Body(), &response)
  242. if err != nil {
  243. log.Error("json.Unmarshal failed: %s", err.Error())
  244. return &result, fmt.Errorf("son.Unmarshal failed: %s", err.Error())
  245. }
  246. if len(response.ErrorCode) != 0 {
  247. log.Error("ManageNotebook2 failed(%s): %s", response.ErrorCode, response.ErrorMsg)
  248. if response.ErrorCode == modelartsIllegalToken && retry < 1 {
  249. retry++
  250. _ = getToken()
  251. goto sendjob
  252. }
  253. return &result, fmt.Errorf("ManageNotebook2 failed(%s): %s", response.ErrorCode, response.ErrorMsg)
  254. }
  255. return &result, nil
  256. }
  257. func DelNotebook(jobID string) (*models.NotebookDelResult, error) {
  258. checkSetting()
  259. client := getRestyClient()
  260. var result models.NotebookDelResult
  261. retry := 0
  262. sendjob:
  263. res, err := client.R().
  264. SetHeader("Content-Type", "application/json").
  265. SetAuthToken(TOKEN).
  266. SetResult(&result).
  267. Delete(HOST + "/v1/" + setting.ProjectID + urlNotebook + "/" + jobID)
  268. if err != nil {
  269. return &result, fmt.Errorf("resty DelJob: %v", err)
  270. }
  271. if res.StatusCode() == http.StatusUnauthorized && retry < 1 {
  272. retry++
  273. _ = getToken()
  274. goto sendjob
  275. }
  276. var response models.NotebookResult
  277. err = json.Unmarshal(res.Body(), &response)
  278. if err != nil {
  279. log.Error("json.Unmarshal failed: %s", err.Error())
  280. return &result, fmt.Errorf("son.Unmarshal failed: %s", err.Error())
  281. }
  282. if len(response.ErrorCode) != 0 {
  283. log.Error("DelJob failed(%s): %s", response.ErrorCode, response.ErrorMsg)
  284. return &result, fmt.Errorf("DelJob failed(%s): %s", response.ErrorCode, response.ErrorMsg)
  285. }
  286. return &result, nil
  287. }
  288. func DelNotebook2(jobID string) (*models.NotebookDelResult, error) {
  289. checkSetting()
  290. client := getRestyClient()
  291. var result models.NotebookDelResult
  292. retry := 0
  293. sendjob:
  294. res, err := client.R().
  295. SetHeader("Content-Type", "application/json").
  296. SetAuthToken(TOKEN).
  297. SetResult(&result).
  298. Delete(HOST + "/v1/" + setting.ProjectID + urlNotebook2 + "/" + jobID)
  299. if err != nil {
  300. return &result, fmt.Errorf("resty DelJob: %v", err)
  301. }
  302. if res.StatusCode() == http.StatusUnauthorized && retry < 1 {
  303. retry++
  304. _ = getToken()
  305. goto sendjob
  306. }
  307. var response models.NotebookResult
  308. err = json.Unmarshal(res.Body(), &response)
  309. if err != nil {
  310. log.Error("json.Unmarshal failed: %s", err.Error())
  311. return &result, fmt.Errorf("son.Unmarshal failed: %s", err.Error())
  312. }
  313. if len(response.ErrorCode) != 0 {
  314. log.Error("DelNotebook2 failed(%s): %s", response.ErrorCode, response.ErrorMsg)
  315. if response.ErrorCode == modelartsIllegalToken && retry < 1 {
  316. retry++
  317. _ = getToken()
  318. goto sendjob
  319. }
  320. return &result, fmt.Errorf("DelNotebook2 failed(%s): %s", response.ErrorCode, response.ErrorMsg)
  321. }
  322. return &result, nil
  323. }
  324. func DelJob(jobID string) (*models.NotebookDelResult, error) {
  325. checkSetting()
  326. client := getRestyClient()
  327. var result models.NotebookDelResult
  328. retry := 0
  329. sendjob:
  330. res, err := client.R().
  331. SetHeader("Content-Type", "application/json").
  332. SetAuthToken(TOKEN).
  333. SetResult(&result).
  334. Delete(HOST + "/v1/" + setting.ProjectID + urlNotebook + "/" + jobID)
  335. if err != nil {
  336. return &result, fmt.Errorf("resty DelJob: %v", err)
  337. }
  338. if res.StatusCode() == http.StatusUnauthorized && retry < 1 {
  339. retry++
  340. _ = getToken()
  341. goto sendjob
  342. }
  343. var response models.NotebookResult
  344. err = json.Unmarshal(res.Body(), &response)
  345. if err != nil {
  346. log.Error("json.Unmarshal failed: %s", err.Error())
  347. return &result, fmt.Errorf("son.Unmarshal failed: %s", err.Error())
  348. }
  349. if len(response.ErrorCode) != 0 {
  350. log.Error("DelJob failed(%s): %s", response.ErrorCode, response.ErrorMsg)
  351. return &result, fmt.Errorf("DelJob failed(%s): %s", response.ErrorCode, response.ErrorMsg)
  352. }
  353. return &result, nil
  354. }
  355. func GetJobToken(jobID string) (*models.NotebookGetJobTokenResult, error) {
  356. checkSetting()
  357. client := getRestyClient()
  358. var result models.NotebookGetJobTokenResult
  359. retry := 0
  360. sendjob:
  361. res, err := client.R().
  362. SetHeader("Content-Type", "application/json").
  363. SetAuthToken(TOKEN).
  364. SetResult(&result).
  365. Get(HOST + "/v1/" + setting.ProjectID + urlNotebook + "/" + jobID + "/token")
  366. if err != nil {
  367. return &result, fmt.Errorf("resty GetJobToken: %v", err)
  368. }
  369. if res.StatusCode() == http.StatusUnauthorized && retry < 1 {
  370. retry++
  371. _ = getToken()
  372. goto sendjob
  373. }
  374. var response models.NotebookResult
  375. err = json.Unmarshal(res.Body(), &response)
  376. if err != nil {
  377. log.Error("json.Unmarshal failed: %s", err.Error())
  378. return &result, fmt.Errorf("son.Unmarshal failed: %s", err.Error())
  379. }
  380. if len(response.ErrorCode) != 0 {
  381. log.Error("GetJobToken failed(%s): %s", response.ErrorCode, response.ErrorMsg)
  382. return &result, fmt.Errorf("GetJobToken failed(%s): %s", response.ErrorCode, response.ErrorMsg)
  383. }
  384. return &result, nil
  385. }
  386. func createTrainJobUserImage(createJobParams models.CreateUserImageTrainJobParams) (*models.CreateTrainJobResult, error) {
  387. checkSetting()
  388. client := getRestyClient()
  389. var result models.CreateTrainJobResult
  390. retry := 0
  391. sendjob:
  392. res, err := client.R().
  393. SetHeader("Content-Type", "application/json").
  394. SetAuthToken(TOKEN).
  395. SetBody(createJobParams).
  396. SetResult(&result).
  397. Post(HOST + "/v1/" + setting.ProjectID + urlTrainJob)
  398. if err != nil {
  399. return nil, fmt.Errorf("resty create train-job: %s", err)
  400. }
  401. req, _ := json.Marshal(createJobParams)
  402. log.Info("%s", req)
  403. if res.StatusCode() == http.StatusUnauthorized && retry < 1 {
  404. retry++
  405. _ = getToken()
  406. goto sendjob
  407. }
  408. if res.StatusCode() != http.StatusOK {
  409. var temp models.ErrorResult
  410. if err = json.Unmarshal([]byte(res.String()), &temp); err != nil {
  411. log.Error("json.Unmarshal failed(%s): %v", res.String(), err.Error())
  412. return &result, fmt.Errorf("json.Unmarshal failed(%s): %v", res.String(), err.Error())
  413. }
  414. log.Error("createTrainJob failed(%d):%s(%s)", res.StatusCode(), temp.ErrorCode, temp.ErrorMsg)
  415. BootFileErrorMsg := "Invalid OBS path '" + createJobParams.Config.BootFileUrl + "'."
  416. DataSetErrorMsg := "Invalid OBS path '" + createJobParams.Config.DataUrl + "'."
  417. if temp.ErrorMsg == BootFileErrorMsg {
  418. log.Error("启动文件错误!createTrainJob failed(%d):%s(%s)", res.StatusCode(), temp.ErrorCode, temp.ErrorMsg)
  419. return &result, fmt.Errorf("启动文件错误!")
  420. }
  421. if temp.ErrorMsg == DataSetErrorMsg {
  422. log.Error("数据集错误!createTrainJob failed(%d):%s(%s)", res.StatusCode(), temp.ErrorCode, temp.ErrorMsg)
  423. return &result, fmt.Errorf("数据集错误!")
  424. }
  425. return &result, fmt.Errorf("createTrainJob failed(%d):%s(%s)", res.StatusCode(), temp.ErrorCode, temp.ErrorMsg)
  426. }
  427. if !result.IsSuccess {
  428. log.Error("createTrainJob failed(%s): %s", result.ErrorCode, result.ErrorMsg)
  429. return &result, fmt.Errorf("createTrainJob failed(%s): %s", result.ErrorCode, result.ErrorMsg)
  430. }
  431. return &result, nil
  432. }
  433. func createTrainJob(createJobParams models.CreateTrainJobParams) (*models.CreateTrainJobResult, error) {
  434. checkSetting()
  435. client := getRestyClient()
  436. var result models.CreateTrainJobResult
  437. retry := 0
  438. sendjob:
  439. res, err := client.R().
  440. SetHeader("Content-Type", "application/json").
  441. SetAuthToken(TOKEN).
  442. SetBody(createJobParams).
  443. SetResult(&result).
  444. Post(HOST + "/v1/" + setting.ProjectID + urlTrainJob)
  445. if err != nil {
  446. return nil, fmt.Errorf("resty create train-job: %s", err)
  447. }
  448. req, _ := json.Marshal(createJobParams)
  449. log.Info("%s", req)
  450. if res.StatusCode() == http.StatusUnauthorized && retry < 1 {
  451. retry++
  452. _ = getToken()
  453. goto sendjob
  454. }
  455. if res.StatusCode() != http.StatusOK {
  456. var temp models.ErrorResult
  457. if err = json.Unmarshal([]byte(res.String()), &temp); err != nil {
  458. log.Error("json.Unmarshal failed(%s): %v", res.String(), err.Error())
  459. return &result, fmt.Errorf("json.Unmarshal failed(%s): %v", res.String(), err.Error())
  460. }
  461. log.Error("createTrainJob failed(%d):%s(%s)", res.StatusCode(), temp.ErrorCode, temp.ErrorMsg)
  462. BootFileErrorMsg := "Invalid OBS path '" + createJobParams.Config.BootFileUrl + "'."
  463. DataSetErrorMsg := "Invalid OBS path '" + createJobParams.Config.DataUrl + "'."
  464. if temp.ErrorMsg == BootFileErrorMsg {
  465. log.Error("启动文件错误!createTrainJob failed(%d):%s(%s)", res.StatusCode(), temp.ErrorCode, temp.ErrorMsg)
  466. return &result, fmt.Errorf("启动文件错误!")
  467. }
  468. if temp.ErrorMsg == DataSetErrorMsg {
  469. log.Error("数据集错误!createTrainJob failed(%d):%s(%s)", res.StatusCode(), temp.ErrorCode, temp.ErrorMsg)
  470. return &result, fmt.Errorf("数据集错误!")
  471. }
  472. return &result, fmt.Errorf("createTrainJob failed(%d):%s(%s)", res.StatusCode(), temp.ErrorCode, temp.ErrorMsg)
  473. }
  474. if !result.IsSuccess {
  475. log.Error("createTrainJob failed(%s): %s", result.ErrorCode, result.ErrorMsg)
  476. return &result, fmt.Errorf("createTrainJob failed(%s): %s", result.ErrorCode, result.ErrorMsg)
  477. }
  478. return &result, nil
  479. }
  480. func createTrainJobVersion(createJobVersionParams models.CreateTrainJobVersionParams, jobID string) (*models.CreateTrainJobResult, error) {
  481. checkSetting()
  482. client := getRestyClient()
  483. var result models.CreateTrainJobResult
  484. retry := 0
  485. sendjob:
  486. res, err := client.R().
  487. SetHeader("Content-Type", "application/json").
  488. SetAuthToken(TOKEN).
  489. SetBody(createJobVersionParams).
  490. SetResult(&result).
  491. Post(HOST + "/v1/" + setting.ProjectID + urlTrainJob + "/" + jobID + "/versions")
  492. if err != nil {
  493. return nil, fmt.Errorf("resty create train-job version: %s", err)
  494. }
  495. req, _ := json.Marshal(createJobVersionParams)
  496. log.Info("%s", req)
  497. if res.StatusCode() == http.StatusUnauthorized && retry < 1 {
  498. retry++
  499. _ = getToken()
  500. goto sendjob
  501. }
  502. if res.StatusCode() != http.StatusOK {
  503. var temp models.ErrorResult
  504. if err = json.Unmarshal([]byte(res.String()), &temp); err != nil {
  505. log.Error("json.Unmarshal failed(%s): %v", res.String(), err.Error())
  506. return &result, fmt.Errorf("json.Unmarshal failed(%s): %v", res.String(), err.Error())
  507. }
  508. BootFileErrorMsg := "Invalid OBS path '" + createJobVersionParams.Config.BootFileUrl + "'."
  509. DataSetErrorMsg := "Invalid OBS path '" + createJobVersionParams.Config.DataUrl + "'."
  510. if temp.ErrorMsg == BootFileErrorMsg {
  511. log.Error("启动文件错误!createTrainJobVersion failed(%d):%s(%s)", res.StatusCode(), temp.ErrorCode, temp.ErrorMsg)
  512. return &result, fmt.Errorf("启动文件错误!")
  513. }
  514. if temp.ErrorMsg == DataSetErrorMsg {
  515. log.Error("数据集错误!createTrainJobVersion failed(%d):%s(%s)", res.StatusCode(), temp.ErrorCode, temp.ErrorMsg)
  516. return &result, fmt.Errorf("数据集错误!")
  517. }
  518. return &result, fmt.Errorf("createTrainJobVersion failed(%d):%s(%s)", res.StatusCode(), temp.ErrorCode, temp.ErrorMsg)
  519. }
  520. if !result.IsSuccess {
  521. log.Error("createTrainJobVersion failed(%s): %s", result.ErrorCode, result.ErrorMsg)
  522. return &result, fmt.Errorf("createTrainJobVersion failed(%s): %s", result.ErrorCode, result.ErrorMsg)
  523. }
  524. return &result, nil
  525. }
  526. func GetResourceSpecs() (*models.GetResourceSpecsResult, error) {
  527. checkSetting()
  528. client := getRestyClient()
  529. var result models.GetResourceSpecsResult
  530. retry := 0
  531. sendjob:
  532. res, err := client.R().
  533. SetHeader("Content-Type", "application/json").
  534. SetAuthToken(TOKEN).
  535. SetResult(&result).
  536. Get(HOST + "/v1/" + setting.ProjectID + urlResourceSpecs)
  537. if err != nil {
  538. return nil, fmt.Errorf("resty GetResourceSpecs: %v", err)
  539. }
  540. if res.StatusCode() == http.StatusUnauthorized && retry < 1 {
  541. retry++
  542. _ = getToken()
  543. goto sendjob
  544. }
  545. if res.StatusCode() != http.StatusOK {
  546. var temp models.ErrorResult
  547. if err = json.Unmarshal([]byte(res.String()), &temp); err != nil {
  548. log.Error("json.Unmarshal failed(%s): %v", res.String(), err.Error())
  549. return &result, fmt.Errorf("json.Unmarshal failed(%s): %v", res.String(), err.Error())
  550. }
  551. log.Error("GetResourceSpecs failed(%d):%s(%s)", res.StatusCode(), temp.ErrorCode, temp.ErrorMsg)
  552. return &result, fmt.Errorf("GetResourceSpecs failed(%d):%s(%s)", res.StatusCode(), temp.ErrorCode, temp.ErrorMsg)
  553. }
  554. if !result.IsSuccess {
  555. log.Error("GetResourceSpecs failed(%s): %s", result.ErrorCode, result.ErrorMsg)
  556. return &result, fmt.Errorf("GetResourceSpecs failed(%s): %s", result.ErrorCode, result.ErrorMsg)
  557. }
  558. return &result, nil
  559. }
  560. func CreateTrainJobConfig(req models.CreateConfigParams) (*models.CreateTrainJobConfigResult, error) {
  561. checkSetting()
  562. client := getRestyClient()
  563. var result models.CreateTrainJobConfigResult
  564. retry := 0
  565. sendjob:
  566. res, err := client.R().
  567. SetHeader("Content-Type", "application/json").
  568. SetAuthToken(TOKEN).
  569. SetBody(req).
  570. SetResult(&result).
  571. Post(HOST + "/v1/" + setting.ProjectID + urlTrainJobConfig)
  572. if err != nil {
  573. return nil, fmt.Errorf("resty CreateTrainJobConfig: %s", err)
  574. }
  575. if res.StatusCode() == http.StatusUnauthorized && retry < 1 {
  576. retry++
  577. _ = getToken()
  578. goto sendjob
  579. }
  580. //temp, _ := json.Marshal(req)
  581. //log.Info("%s", temp)
  582. if res.StatusCode() != http.StatusOK {
  583. var temp models.ErrorResult
  584. if err = json.Unmarshal([]byte(res.String()), &temp); err != nil {
  585. log.Error("json.Unmarshal failed(%s): %v", res.String(), err.Error())
  586. return &result, fmt.Errorf("json.Unmarshal failed(%s): %v", res.String(), err.Error())
  587. }
  588. log.Error("CreateTrainJobConfig failed(%d):%s(%s)", res.StatusCode(), temp.ErrorCode, temp.ErrorMsg)
  589. return &result, fmt.Errorf("CreateTrainJobConfig failed(%d):%s(%s)", res.StatusCode(), temp.ErrorCode, temp.ErrorMsg)
  590. }
  591. if !result.IsSuccess {
  592. log.Error("CreateTrainJobConfig failed(%s): %s", result.ErrorCode, result.ErrorMsg)
  593. return &result, fmt.Errorf("CreateTrainJobConfig failed(%s): %s", result.ErrorCode, result.ErrorMsg)
  594. }
  595. return &result, nil
  596. }
  597. func GetConfigList(perPage, page int, sortBy, order, searchContent, configType string) (*models.GetConfigListResult, error) {
  598. checkSetting()
  599. client := getRestyClient()
  600. var result models.GetConfigListResult
  601. retry := 0
  602. sendjob:
  603. res, err := client.R().
  604. SetQueryParams(map[string]string{
  605. "per_page": strconv.Itoa(perPage),
  606. "page": strconv.Itoa(page),
  607. "sortBy": sortBy,
  608. "order": order,
  609. "search_content": searchContent,
  610. "config_type": configType,
  611. }).
  612. SetAuthToken(TOKEN).
  613. SetResult(&result).
  614. Get(HOST + "/v1/" + setting.ProjectID + urlTrainJobConfig)
  615. if err != nil {
  616. return nil, fmt.Errorf("resty GetConfigList: %v", err)
  617. }
  618. if res.StatusCode() == http.StatusUnauthorized && retry < 1 {
  619. retry++
  620. _ = getToken()
  621. goto sendjob
  622. }
  623. if res.StatusCode() != http.StatusOK {
  624. var temp models.ErrorResult
  625. if err = json.Unmarshal([]byte(res.String()), &temp); err != nil {
  626. log.Error("json.Unmarshal failed(%s): %v", res.String(), err.Error())
  627. return &result, fmt.Errorf("json.Unmarshal failed(%s): %v", res.String(), err.Error())
  628. }
  629. log.Error("GetConfigList failed(%d):%s(%s)", res.StatusCode(), temp.ErrorCode, temp.ErrorMsg)
  630. return &result, fmt.Errorf("获取参数配置列表失败(%d):%s(%s)", res.StatusCode(), temp.ErrorCode, temp.ErrorMsg)
  631. }
  632. if !result.IsSuccess {
  633. log.Error("GetConfigList failed(%s): %s", result.ErrorCode, result.ErrorMsg)
  634. return &result, fmt.Errorf("获取参数配置列表失败(%s): %s", result.ErrorCode, result.ErrorMsg)
  635. }
  636. return &result, nil
  637. }
  638. func GetParaConfig(configName, configType string) (models.GetConfigResult, error) {
  639. checkSetting()
  640. client := getRestyClient()
  641. var result models.GetConfigResult
  642. retry := 0
  643. sendjob:
  644. res, err := client.R().
  645. SetQueryParams(map[string]string{
  646. "config_type": configType,
  647. }).
  648. SetAuthToken(TOKEN).
  649. SetResult(&result).
  650. Get(HOST + "/v1/" + setting.ProjectID + urlTrainJobConfig + "/" + configName)
  651. if err != nil {
  652. return result, fmt.Errorf("resty GetParaConfig: %v", err)
  653. }
  654. if res.StatusCode() == http.StatusUnauthorized && retry < 1 {
  655. retry++
  656. _ = getToken()
  657. goto sendjob
  658. }
  659. if res.StatusCode() != http.StatusOK {
  660. var temp models.ErrorResult
  661. if err = json.Unmarshal([]byte(res.String()), &temp); err != nil {
  662. log.Error("json.Unmarshal failed(%s): %v", res.String(), err.Error())
  663. return result, fmt.Errorf("json.Unmarshal failed(%s): %v", res.String(), err.Error())
  664. }
  665. log.Error("GetParaConfig failed(%d):%s(%s)", res.StatusCode(), temp.ErrorCode, temp.ErrorMsg)
  666. return result, fmt.Errorf("获取参数配置详情失败(%d):%s(%s)", res.StatusCode(), temp.ErrorCode, temp.ErrorMsg)
  667. }
  668. if !result.IsSuccess {
  669. log.Error("GetParaConfig failed(%s): %s", result.ErrorCode, result.ErrorMsg)
  670. return result, fmt.Errorf("获取参数配置详情失败(%s): %s", result.ErrorCode, result.ErrorMsg)
  671. }
  672. return result, nil
  673. }
  674. func GetTrainJob(jobID, versionID string) (*models.GetTrainJobResult, error) {
  675. checkSetting()
  676. client := getRestyClient()
  677. var result models.GetTrainJobResult
  678. retry := 0
  679. sendjob:
  680. res, err := client.R().
  681. SetAuthToken(TOKEN).
  682. SetResult(&result).
  683. Get(HOST + "/v1/" + setting.ProjectID + urlTrainJob + "/" + jobID + "/versions/" + versionID)
  684. if err != nil {
  685. return nil, fmt.Errorf("resty GetTrainJob: %v", err)
  686. }
  687. if res.StatusCode() == http.StatusUnauthorized && retry < 1 {
  688. retry++
  689. _ = getToken()
  690. goto sendjob
  691. }
  692. if res.StatusCode() != http.StatusOK {
  693. var temp models.ErrorResult
  694. if err = json.Unmarshal([]byte(res.String()), &temp); err != nil {
  695. log.Error("json.Unmarshal failed(%s): %v", res.String(), err.Error())
  696. return &result, fmt.Errorf("json.Unmarshal failed(%s): %v", res.String(), err.Error())
  697. }
  698. log.Error("GetTrainJob failed(%d):%s(%s)", res.StatusCode(), temp.ErrorCode, temp.ErrorMsg)
  699. return &result, fmt.Errorf("获取作业详情失败(%d):%s(%s)", res.StatusCode(), temp.ErrorCode, temp.ErrorMsg)
  700. }
  701. if !result.IsSuccess {
  702. log.Error("GetTrainJob(%s) failed", jobID)
  703. return &result, fmt.Errorf("获取作业详情失败")
  704. }
  705. return &result, nil
  706. }
  707. func GetTrainJobLog(jobID, versionID, baseLine, logFile, order string, lines int) (*models.GetTrainJobLogResult, error) {
  708. checkSetting()
  709. client := getRestyClient()
  710. var result models.GetTrainJobLogResult
  711. retry := 0
  712. sendjob:
  713. res, err := client.R().
  714. SetQueryParams(map[string]string{
  715. "base_line": baseLine,
  716. "lines": strconv.Itoa(lines),
  717. "log_file": logFile,
  718. "order": order,
  719. }).
  720. SetAuthToken(TOKEN).
  721. SetResult(&result).
  722. Get(HOST + "/v1/" + setting.ProjectID + urlTrainJob + "/" + jobID + "/versions/" + versionID + "/aom-log")
  723. if err != nil {
  724. return nil, fmt.Errorf("resty GetTrainJobLog: %v", err)
  725. }
  726. if res.StatusCode() == http.StatusUnauthorized && retry < 1 {
  727. retry++
  728. _ = getToken()
  729. goto sendjob
  730. }
  731. if res.StatusCode() != http.StatusOK {
  732. var temp models.ErrorResult
  733. if err = json.Unmarshal([]byte(res.String()), &temp); err != nil {
  734. log.Error("json.Unmarshal failed(%s): %v", res.String(), err.Error())
  735. return &result, fmt.Errorf("json.Unmarshal failed(%s): %v", res.String(), err.Error())
  736. }
  737. log.Error("GetTrainJobLog failed(%d):%s(%s)", res.StatusCode(), temp.ErrorCode, temp.ErrorMsg)
  738. return &result, fmt.Errorf("获取作业日志失败(%d):%s(%s)", res.StatusCode(), temp.ErrorCode, temp.ErrorMsg)
  739. }
  740. if !result.IsSuccess {
  741. log.Error("GetTrainJobLog(%s) failed", jobID)
  742. return &result, fmt.Errorf("获取作业日志失败:%s", result.ErrorMsg)
  743. }
  744. return &result, nil
  745. }
  746. func GetTrainJobLogFileNames(jobID, versionID string) (*models.GetTrainJobLogFileNamesResult, error) {
  747. checkSetting()
  748. client := getRestyClient()
  749. var result models.GetTrainJobLogFileNamesResult
  750. retry := 0
  751. sendjob:
  752. res, err := client.R().
  753. SetAuthToken(TOKEN).
  754. SetResult(&result).
  755. Get(HOST + "/v1/" + setting.ProjectID + urlTrainJob + "/" + jobID + "/versions/" + versionID + "/log/file-names")
  756. if err != nil {
  757. return nil, fmt.Errorf("resty GetTrainJobLogFileNames: %v", err)
  758. }
  759. if res.StatusCode() == http.StatusUnauthorized && retry < 1 {
  760. retry++
  761. _ = getToken()
  762. goto sendjob
  763. }
  764. if res.StatusCode() != http.StatusOK {
  765. var temp models.ErrorResult
  766. if err = json.Unmarshal([]byte(res.String()), &temp); err != nil {
  767. log.Error("json.Unmarshal failed(%s): %v", res.String(), err.Error())
  768. return &result, fmt.Errorf("json.Unmarshal failed(%s): %v", res.String(), err.Error())
  769. }
  770. log.Error("GetTrainJobLogFileNames failed(%d):%s(%s)", res.StatusCode(), temp.ErrorCode, temp.ErrorMsg)
  771. return &result, fmt.Errorf("GetTrainJobLogFileNames failed(%d):%s(%s)", res.StatusCode(), temp.ErrorCode, temp.ErrorMsg)
  772. }
  773. if !result.IsSuccess {
  774. log.Error("GetTrainJobLogFileNames(%s) failed", jobID)
  775. return &result, fmt.Errorf("获取作业日志文件失败:%s", result.ErrorMsg)
  776. }
  777. return &result, nil
  778. }
  779. func DelTrainJob(jobID string) (*models.TrainJobResult, error) {
  780. checkSetting()
  781. client := getRestyClient()
  782. var result models.TrainJobResult
  783. retry := 0
  784. sendjob:
  785. res, err := client.R().
  786. SetAuthToken(TOKEN).
  787. SetResult(&result).
  788. Delete(HOST + "/v1/" + setting.ProjectID + urlTrainJob + "/" + jobID)
  789. if err != nil {
  790. return &result, fmt.Errorf("resty DelTrainJob: %v", err)
  791. }
  792. if res.StatusCode() == http.StatusUnauthorized && retry < 1 {
  793. retry++
  794. _ = getToken()
  795. goto sendjob
  796. }
  797. if res.StatusCode() != http.StatusOK {
  798. var temp models.ErrorResult
  799. if err = json.Unmarshal([]byte(res.String()), &temp); err != nil {
  800. log.Error("json.Unmarshal failed(%s): %v", res.String(), err.Error())
  801. return &result, fmt.Errorf("json.Unmarshal failed(%s): %v", res.String(), err.Error())
  802. }
  803. log.Error("DelTrainJob failed(%d):%s(%s)", res.StatusCode(), temp.ErrorCode, temp.ErrorMsg)
  804. return &result, fmt.Errorf("删除训练作业失败(%d):%s(%s)", res.StatusCode(), temp.ErrorCode, temp.ErrorMsg)
  805. }
  806. if !result.IsSuccess {
  807. log.Error("DelTrainJob(%s) failed", jobID)
  808. return &result, fmt.Errorf("删除训练作业失败:%s", result.ErrorMsg)
  809. }
  810. return &result, nil
  811. }
  812. func StopTrainJob(jobID, versionID string) (*models.TrainJobResult, error) {
  813. checkSetting()
  814. client := getRestyClient()
  815. var result models.TrainJobResult
  816. retry := 0
  817. sendjob:
  818. res, err := client.R().
  819. SetAuthToken(TOKEN).
  820. SetResult(&result).
  821. Post(HOST + "/v1/" + setting.ProjectID + urlTrainJob + "/" + jobID + "/versions/" + versionID + "/stop")
  822. if err != nil {
  823. return &result, fmt.Errorf("resty StopTrainJob: %v", err)
  824. }
  825. if res.StatusCode() == http.StatusUnauthorized && retry < 1 {
  826. retry++
  827. _ = getToken()
  828. goto sendjob
  829. }
  830. if res.StatusCode() != http.StatusOK {
  831. var temp models.ErrorResult
  832. if err = json.Unmarshal([]byte(res.String()), &temp); err != nil {
  833. log.Error("json.Unmarshal failed(%s): %v", res.String(), err.Error())
  834. return &result, fmt.Errorf("json.Unmarshal failed(%s): %v", res.String(), err.Error())
  835. }
  836. log.Error("StopTrainJob failed(%d):%s(%s)", res.StatusCode(), temp.ErrorCode, temp.ErrorMsg)
  837. return &result, fmt.Errorf("停止训练作业失败(%d):%s(%s)", res.StatusCode(), temp.ErrorCode, temp.ErrorMsg)
  838. }
  839. if !result.IsSuccess {
  840. log.Error("StopTrainJob(%s) failed", jobID)
  841. return &result, fmt.Errorf("停止训练作业失败:%s", result.ErrorMsg)
  842. }
  843. return &result, nil
  844. }
  845. func DelTrainJobVersion(jobID string, versionID string) (*models.TrainJobResult, error) {
  846. checkSetting()
  847. client := getRestyClient()
  848. var result models.TrainJobResult
  849. retry := 0
  850. sendjob:
  851. res, err := client.R().
  852. SetAuthToken(TOKEN).
  853. SetResult(&result).
  854. Delete(HOST + "/v1/" + setting.ProjectID + urlTrainJob + "/" + jobID + "/versions/" + versionID)
  855. if err != nil {
  856. return &result, fmt.Errorf("resty DelTrainJobVersion: %v", err)
  857. }
  858. if res.StatusCode() == http.StatusUnauthorized && retry < 1 {
  859. retry++
  860. _ = getToken()
  861. goto sendjob
  862. }
  863. if res.StatusCode() != http.StatusOK {
  864. var temp models.ErrorResult
  865. if err = json.Unmarshal([]byte(res.String()), &temp); err != nil {
  866. log.Error("json.Unmarshal failed(%s): %v", res.String(), err.Error())
  867. return &result, fmt.Errorf("json.Unmarshal failed(%s): %v", res.String(), err.Error())
  868. }
  869. log.Error("DelTrainJob failed(%d):%s(%s)", res.StatusCode(), temp.ErrorCode, temp.ErrorMsg)
  870. return &result, fmt.Errorf("删除训练作业版本失败(%d):%s(%s)", res.StatusCode(), temp.ErrorCode, temp.ErrorMsg)
  871. }
  872. if !result.IsSuccess {
  873. log.Error("DelTrainJob(%s) failed", jobID)
  874. return &result, fmt.Errorf("删除训练作业版本失败:%s", result.ErrorMsg)
  875. }
  876. return &result, nil
  877. }
  878. func createInferenceJob(createJobParams models.CreateInferenceJobParams) (*models.CreateTrainJobResult, error) {
  879. checkSetting()
  880. client := getRestyClient()
  881. var result models.CreateTrainJobResult
  882. retry := 0
  883. sendjob:
  884. res, err := client.R().
  885. SetHeader("Content-Type", "application/json").
  886. SetAuthToken(TOKEN).
  887. SetBody(createJobParams).
  888. SetResult(&result).
  889. Post(HOST + "/v1/" + setting.ProjectID + urlTrainJob)
  890. if err != nil {
  891. return nil, fmt.Errorf("resty create inference-job: %s", err)
  892. }
  893. req, _ := json.Marshal(createJobParams)
  894. log.Info("%s", req)
  895. if res.StatusCode() == http.StatusUnauthorized && retry < 1 {
  896. retry++
  897. _ = getToken()
  898. goto sendjob
  899. }
  900. if res.StatusCode() != http.StatusOK {
  901. var temp models.ErrorResult
  902. if err = json.Unmarshal([]byte(res.String()), &temp); err != nil {
  903. log.Error("json.Unmarshal failed(%s): %v", res.String(), err.Error())
  904. return &result, fmt.Errorf("json.Unmarshal failed(%s): %v", res.String(), err.Error())
  905. }
  906. log.Error("createInferenceJob failed(%d):%s(%s)", res.StatusCode(), temp.ErrorCode, temp.ErrorMsg)
  907. BootFileErrorMsg := "Invalid OBS path '" + createJobParams.InfConfig.BootFileUrl + "'."
  908. DataSetErrorMsg := "Invalid OBS path '" + createJobParams.InfConfig.DataUrl + "'."
  909. if temp.ErrorMsg == BootFileErrorMsg {
  910. log.Error("启动文件错误!createInferenceJob failed(%d):%s(%s)", res.StatusCode(), temp.ErrorCode, temp.ErrorMsg)
  911. return &result, fmt.Errorf("启动文件错误!")
  912. }
  913. if temp.ErrorMsg == DataSetErrorMsg {
  914. log.Error("数据集错误!createInferenceJob failed(%d):%s(%s)", res.StatusCode(), temp.ErrorCode, temp.ErrorMsg)
  915. return &result, fmt.Errorf("数据集错误!")
  916. }
  917. return &result, fmt.Errorf("createInferenceJob failed(%d):%s(%s)", res.StatusCode(), temp.ErrorCode, temp.ErrorMsg)
  918. }
  919. if !result.IsSuccess {
  920. log.Error("createInferenceJob failed(%s): %s", result.ErrorCode, result.ErrorMsg)
  921. return &result, fmt.Errorf("createInferenceJob failed(%s): %s", result.ErrorCode, result.ErrorMsg)
  922. }
  923. return &result, nil
  924. }
  925. func createNotebook2(createJobParams models.CreateNotebook2Params) (*models.CreateNotebookResult, error) {
  926. checkSetting()
  927. client := getRestyClient()
  928. var result models.CreateNotebookResult
  929. retry := 0
  930. sendjob:
  931. res, err := client.R().
  932. SetHeader("Content-Type", "application/json").
  933. SetAuthToken(TOKEN).
  934. SetBody(createJobParams).
  935. SetResult(&result).
  936. Post(HOST + "/v1/" + setting.ProjectID + urlNotebook2)
  937. if err != nil {
  938. return nil, fmt.Errorf("resty create notebook2: %s", err)
  939. }
  940. if res.StatusCode() == http.StatusUnauthorized && retry < 1 {
  941. retry++
  942. _ = getToken()
  943. goto sendjob
  944. }
  945. var response models.NotebookResult
  946. err = json.Unmarshal(res.Body(), &response)
  947. if err != nil {
  948. log.Error("json.Unmarshal failed: %s", err.Error())
  949. return &result, fmt.Errorf("son.Unmarshal failed: %s", err.Error())
  950. }
  951. if len(response.ErrorCode) != 0 {
  952. log.Error("createNotebook2 failed(%s): %s", response.ErrorCode, response.ErrorMsg)
  953. if response.ErrorCode == errorCodeExceedLimit {
  954. response.ErrorMsg = "所选规格使用数量已超过最大配额限制。"
  955. }
  956. if response.ErrorCode == modelartsIllegalToken && retry < 1 {
  957. retry++
  958. _ = getToken()
  959. goto sendjob
  960. }
  961. return &result, fmt.Errorf("createNotebook2 failed(%s): %s", response.ErrorCode, response.ErrorMsg)
  962. }
  963. return &result, nil
  964. }
  965. func GetTrainJobMetricStatistic(jobID, versionID, podName string) (*models.GetTrainJobMetricStatisticResult, error) {
  966. checkSetting()
  967. client := getRestyClient()
  968. var result models.GetTrainJobMetricStatisticResult
  969. retry := 0
  970. sendjob:
  971. res, err := client.R().
  972. SetAuthToken(TOKEN).
  973. SetResult(&result).
  974. Get(HOST + "/v1/" + setting.ProjectID + urlTrainJob + "/" + jobID + "/versions/" + versionID + "/pod/" + podName + "/metric-statistic?statistic_type=each")
  975. if err != nil {
  976. return nil, fmt.Errorf("resty GetTrainJobMetricStatistic: %v", err)
  977. }
  978. if res.StatusCode() == http.StatusUnauthorized && retry < 1 {
  979. retry++
  980. _ = getToken()
  981. goto sendjob
  982. }
  983. if res.StatusCode() != http.StatusOK {
  984. var temp models.ErrorResult
  985. if err = json.Unmarshal([]byte(res.String()), &temp); err != nil {
  986. log.Error("json.Unmarshal failed(%s): %v", res.String(), err.Error())
  987. return &result, fmt.Errorf("json.Unmarshal failed(%s): %v", res.String(), err.Error())
  988. }
  989. log.Error("GetTrainJobMetricStatistic failed(%d):%s(%s)", res.StatusCode(), temp.ErrorCode, temp.ErrorMsg)
  990. return &result, fmt.Errorf("GetTrainJobMetricStatistic failed(%d):%s(%s)", res.StatusCode(), temp.ErrorCode, temp.ErrorMsg)
  991. }
  992. if !result.IsSuccess {
  993. log.Error("GetTrainJobMetricStatistic(%s) failed", jobID)
  994. return &result, fmt.Errorf("获取任务资源占用情况失败:%s", result.ErrorMsg)
  995. }
  996. return &result, nil
  997. }