/
handler_inference_create.go
42 lines (34 loc) · 1.13 KB
/
handler_inference_create.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
package server
import (
"net/http"
"github.com/gin-gonic/gin"
"github.com/tensorchord/openmodelz/agent/api/types"
)
// handleInferenceCreate binds an inference deployment from the JSON request
// body, lets the validator apply defaults and check it, and then asks the
// runtime to create it. Bind and validation failures are returned as
// http.StatusBadRequest errors; runtime failures are passed through
// errFromErrDefs. On success the deployment is written back with 201 Created.
// @Summary Create the inferences.
// @Description Create the inferences.
// @Tags inference
// @Accept json
// @Produce json
// @Param request body types.InferenceDeployment true "query params"
// @Success 201 {object} types.InferenceDeployment
// @Router /system/inferences [post]
func (s *Server) handleInferenceCreate(c *gin.Context) error {
	createEvent := types.DeploymentCreateEvent

	// Decode the request body into the deployment spec.
	var deployment types.InferenceDeployment
	bindErr := c.ShouldBindJSON(&deployment)
	if bindErr != nil {
		return NewError(http.StatusBadRequest, bindErr, createEvent)
	}

	// Defaults are applied before validation so the validator sees the
	// completed spec.
	s.validator.DefaultDeployRequest(&deployment)
	validateErr := s.validator.ValidateDeployRequest(&deployment)
	if validateErr != nil {
		return NewError(http.StatusBadRequest, validateErr, createEvent)
	}

	// Hand the spec to the runtime together with the configured ingress
	// settings, using the request's context.
	ctx := c.Request.Context()
	domain := s.config.Ingress.Domain
	namespace := s.config.Ingress.Namespace
	createErr := s.runtime.InferenceCreate(ctx, deployment, domain, namespace, createEvent)
	if createErr != nil {
		return errFromErrDefs(createErr, createEvent)
	}

	// Echo the deployment (as bound and defaulted above) back to the caller.
	c.JSON(http.StatusCreated, deployment)
	return nil
}