mirror of https://github.com/databricks/cli.git
394 lines
11 KiB
Go
Executable File
394 lines
11 KiB
Go
Executable File
// Code generated from OpenAPI specs by Databricks SDK Generator. DO NOT EDIT.
|
|
|
|
package serving_endpoints
|
|
|
|
import (
|
|
"fmt"
|
|
"time"
|
|
|
|
"github.com/databricks/bricks/cmd/root"
|
|
"github.com/databricks/bricks/libs/cmdio"
|
|
"github.com/databricks/bricks/libs/flags"
|
|
"github.com/databricks/databricks-sdk-go/retries"
|
|
"github.com/databricks/databricks-sdk-go/service/serving"
|
|
"github.com/spf13/cobra"
|
|
)
|
|
|
|
var Cmd = &cobra.Command{
|
|
Use: "serving-endpoints",
|
|
Short: `The Serving Endpoints API allows you to create, update, and delete model serving endpoints.`,
|
|
Long: `The Serving Endpoints API allows you to create, update, and delete model
|
|
serving endpoints.
|
|
|
|
You can use a serving endpoint to serve models from the Databricks Model
|
|
Registry. Endpoints expose the underlying models as scalable REST API
|
|
endpoints using serverless compute. This means the endpoints and associated
|
|
compute resources are fully managed by Databricks and will not appear in your
|
|
cloud account. A serving endpoint can consist of one or more MLflow models
|
|
from the Databricks Model Registry, called served models. A serving endpoint
|
|
can have at most ten served models. You can configure traffic settings to
|
|
define how requests should be routed to your served models behind an endpoint.
|
|
Additionally, you can configure the scale of resources that should be applied
|
|
to each served model.`,
|
|
}
|
|
|
|
// start build-logs command
|
|
|
|
var buildLogsReq serving.BuildLogsRequest
|
|
|
|
func init() {
|
|
Cmd.AddCommand(buildLogsCmd)
|
|
// TODO: short flags
|
|
|
|
}
|
|
|
|
var buildLogsCmd = &cobra.Command{
|
|
Use: "build-logs NAME SERVED_MODEL_NAME",
|
|
Short: `Retrieve the logs associated with building the model's environment for a given serving endpoint's served model.`,
|
|
Long: `Retrieve the logs associated with building the model's environment for a given
|
|
serving endpoint's served model.
|
|
|
|
Retrieves the build logs associated with the provided served model.`,
|
|
|
|
Annotations: map[string]string{},
|
|
Args: cobra.ExactArgs(2),
|
|
PreRunE: root.MustWorkspaceClient,
|
|
RunE: func(cmd *cobra.Command, args []string) (err error) {
|
|
ctx := cmd.Context()
|
|
w := root.WorkspaceClient(ctx)
|
|
buildLogsReq.Name = args[0]
|
|
buildLogsReq.ServedModelName = args[1]
|
|
|
|
response, err := w.ServingEndpoints.BuildLogs(ctx, buildLogsReq)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
return cmdio.Render(ctx, response)
|
|
},
|
|
}
|
|
|
|
// start create command
|
|
|
|
var createReq serving.CreateServingEndpoint
|
|
var createJson flags.JsonFlag
|
|
var createSkipWait bool
|
|
var createTimeout time.Duration
|
|
|
|
func init() {
|
|
Cmd.AddCommand(createCmd)
|
|
|
|
createCmd.Flags().BoolVar(&createSkipWait, "no-wait", createSkipWait, `do not wait to reach NOT_UPDATING state`)
|
|
createCmd.Flags().DurationVar(&createTimeout, "timeout", 20*time.Minute, `maximum amount of time to reach NOT_UPDATING state`)
|
|
// TODO: short flags
|
|
createCmd.Flags().Var(&createJson, "json", `either inline JSON string or @path/to/file.json with request body`)
|
|
|
|
}
|
|
|
|
var createCmd = &cobra.Command{
|
|
Use: "create",
|
|
Short: `Create a new serving endpoint.`,
|
|
Long: `Create a new serving endpoint.`,
|
|
|
|
Annotations: map[string]string{},
|
|
PreRunE: root.MustWorkspaceClient,
|
|
RunE: func(cmd *cobra.Command, args []string) (err error) {
|
|
ctx := cmd.Context()
|
|
w := root.WorkspaceClient(ctx)
|
|
err = createJson.Unmarshal(&createReq)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
createReq.Name = args[0]
|
|
_, err = fmt.Sscan(args[1], &createReq.Config)
|
|
if err != nil {
|
|
return fmt.Errorf("invalid CONFIG: %s", args[1])
|
|
}
|
|
|
|
if createSkipWait {
|
|
response, err := w.ServingEndpoints.Create(ctx, createReq)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
return cmdio.Render(ctx, response)
|
|
}
|
|
spinner := cmdio.Spinner(ctx)
|
|
info, err := w.ServingEndpoints.CreateAndWait(ctx, createReq,
|
|
retries.Timeout[serving.ServingEndpointDetailed](createTimeout),
|
|
func(i *retries.Info[serving.ServingEndpointDetailed]) {
|
|
if i.Info == nil {
|
|
return
|
|
}
|
|
status := i.Info.State.ConfigUpdate
|
|
statusMessage := fmt.Sprintf("current status: %s", status)
|
|
spinner <- statusMessage
|
|
})
|
|
close(spinner)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
return cmdio.Render(ctx, info)
|
|
},
|
|
}
|
|
|
|
// start delete command
|
|
|
|
var deleteReq serving.DeleteServingEndpointRequest
|
|
|
|
func init() {
|
|
Cmd.AddCommand(deleteCmd)
|
|
// TODO: short flags
|
|
|
|
}
|
|
|
|
var deleteCmd = &cobra.Command{
|
|
Use: "delete NAME",
|
|
Short: `Delete a serving endpoint.`,
|
|
Long: `Delete a serving endpoint.`,
|
|
|
|
Annotations: map[string]string{},
|
|
Args: cobra.ExactArgs(1),
|
|
PreRunE: root.MustWorkspaceClient,
|
|
RunE: func(cmd *cobra.Command, args []string) (err error) {
|
|
ctx := cmd.Context()
|
|
w := root.WorkspaceClient(ctx)
|
|
deleteReq.Name = args[0]
|
|
|
|
err = w.ServingEndpoints.Delete(ctx, deleteReq)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
return nil
|
|
},
|
|
}
|
|
|
|
// start export-metrics command
|
|
|
|
var exportMetricsReq serving.ExportMetricsRequest
|
|
|
|
func init() {
|
|
Cmd.AddCommand(exportMetricsCmd)
|
|
// TODO: short flags
|
|
|
|
}
|
|
|
|
var exportMetricsCmd = &cobra.Command{
|
|
Use: "export-metrics NAME",
|
|
Short: `Retrieve the metrics corresponding to a serving endpoint for the current time in Prometheus or OpenMetrics exposition format.`,
|
|
Long: `Retrieve the metrics corresponding to a serving endpoint for the current time
|
|
in Prometheus or OpenMetrics exposition format.
|
|
|
|
Retrieves the metrics associated with the provided serving endpoint in either
|
|
Prometheus or OpenMetrics exposition format.`,
|
|
|
|
Annotations: map[string]string{},
|
|
Args: cobra.ExactArgs(1),
|
|
PreRunE: root.MustWorkspaceClient,
|
|
RunE: func(cmd *cobra.Command, args []string) (err error) {
|
|
ctx := cmd.Context()
|
|
w := root.WorkspaceClient(ctx)
|
|
exportMetricsReq.Name = args[0]
|
|
|
|
err = w.ServingEndpoints.ExportMetrics(ctx, exportMetricsReq)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
return nil
|
|
},
|
|
}
|
|
|
|
// start get command
|
|
|
|
var getReq serving.GetServingEndpointRequest
|
|
|
|
func init() {
|
|
Cmd.AddCommand(getCmd)
|
|
// TODO: short flags
|
|
|
|
}
|
|
|
|
var getCmd = &cobra.Command{
|
|
Use: "get NAME",
|
|
Short: `Get a single serving endpoint.`,
|
|
Long: `Get a single serving endpoint.
|
|
|
|
Retrieves the details for a single serving endpoint.`,
|
|
|
|
Annotations: map[string]string{},
|
|
Args: cobra.ExactArgs(1),
|
|
PreRunE: root.MustWorkspaceClient,
|
|
RunE: func(cmd *cobra.Command, args []string) (err error) {
|
|
ctx := cmd.Context()
|
|
w := root.WorkspaceClient(ctx)
|
|
getReq.Name = args[0]
|
|
|
|
response, err := w.ServingEndpoints.Get(ctx, getReq)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
return cmdio.Render(ctx, response)
|
|
},
|
|
}
|
|
|
|
// start list command
|
|
|
|
func init() {
|
|
Cmd.AddCommand(listCmd)
|
|
|
|
}
|
|
|
|
var listCmd = &cobra.Command{
|
|
Use: "list",
|
|
Short: `Retrieve all serving endpoints.`,
|
|
Long: `Retrieve all serving endpoints.`,
|
|
|
|
Annotations: map[string]string{},
|
|
PreRunE: root.MustWorkspaceClient,
|
|
RunE: func(cmd *cobra.Command, args []string) (err error) {
|
|
ctx := cmd.Context()
|
|
w := root.WorkspaceClient(ctx)
|
|
response, err := w.ServingEndpoints.List(ctx)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
return cmdio.Render(ctx, response)
|
|
},
|
|
}
|
|
|
|
// start logs command
|
|
|
|
var logsReq serving.LogsRequest
|
|
|
|
func init() {
|
|
Cmd.AddCommand(logsCmd)
|
|
// TODO: short flags
|
|
|
|
}
|
|
|
|
var logsCmd = &cobra.Command{
|
|
Use: "logs NAME SERVED_MODEL_NAME",
|
|
Short: `Retrieve the most recent log lines associated with a given serving endpoint's served model.`,
|
|
Long: `Retrieve the most recent log lines associated with a given serving endpoint's
|
|
served model.
|
|
|
|
Retrieves the service logs associated with the provided served model.`,
|
|
|
|
Annotations: map[string]string{},
|
|
Args: cobra.ExactArgs(2),
|
|
PreRunE: root.MustWorkspaceClient,
|
|
RunE: func(cmd *cobra.Command, args []string) (err error) {
|
|
ctx := cmd.Context()
|
|
w := root.WorkspaceClient(ctx)
|
|
logsReq.Name = args[0]
|
|
logsReq.ServedModelName = args[1]
|
|
|
|
response, err := w.ServingEndpoints.Logs(ctx, logsReq)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
return cmdio.Render(ctx, response)
|
|
},
|
|
}
|
|
|
|
// start query command
|
|
|
|
var queryReq serving.QueryRequest
|
|
|
|
func init() {
|
|
Cmd.AddCommand(queryCmd)
|
|
// TODO: short flags
|
|
|
|
}
|
|
|
|
var queryCmd = &cobra.Command{
|
|
Use: "query NAME",
|
|
Short: `Query a serving endpoint with provided model input.`,
|
|
Long: `Query a serving endpoint with provided model input.`,
|
|
|
|
Annotations: map[string]string{},
|
|
Args: cobra.ExactArgs(1),
|
|
PreRunE: root.MustWorkspaceClient,
|
|
RunE: func(cmd *cobra.Command, args []string) (err error) {
|
|
ctx := cmd.Context()
|
|
w := root.WorkspaceClient(ctx)
|
|
queryReq.Name = args[0]
|
|
|
|
response, err := w.ServingEndpoints.Query(ctx, queryReq)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
return cmdio.Render(ctx, response)
|
|
},
|
|
}
|
|
|
|
// start update-config command
|
|
|
|
var updateConfigReq serving.EndpointCoreConfigInput
|
|
var updateConfigJson flags.JsonFlag
|
|
var updateConfigSkipWait bool
|
|
var updateConfigTimeout time.Duration
|
|
|
|
func init() {
|
|
Cmd.AddCommand(updateConfigCmd)
|
|
|
|
updateConfigCmd.Flags().BoolVar(&updateConfigSkipWait, "no-wait", updateConfigSkipWait, `do not wait to reach NOT_UPDATING state`)
|
|
updateConfigCmd.Flags().DurationVar(&updateConfigTimeout, "timeout", 20*time.Minute, `maximum amount of time to reach NOT_UPDATING state`)
|
|
// TODO: short flags
|
|
updateConfigCmd.Flags().Var(&updateConfigJson, "json", `either inline JSON string or @path/to/file.json with request body`)
|
|
|
|
// TODO: complex arg: traffic_config
|
|
|
|
}
|
|
|
|
var updateConfigCmd = &cobra.Command{
|
|
Use: "update-config",
|
|
Short: `Update a serving endpoint with a new config.`,
|
|
Long: `Update a serving endpoint with a new config.
|
|
|
|
Updates any combination of the serving endpoint's served models, the compute
|
|
configuration of those served models, and the endpoint's traffic config. An
|
|
endpoint that already has an update in progress can not be updated until the
|
|
current update completes or fails.`,
|
|
|
|
Annotations: map[string]string{},
|
|
PreRunE: root.MustWorkspaceClient,
|
|
RunE: func(cmd *cobra.Command, args []string) (err error) {
|
|
ctx := cmd.Context()
|
|
w := root.WorkspaceClient(ctx)
|
|
err = updateConfigJson.Unmarshal(&updateConfigReq)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
_, err = fmt.Sscan(args[0], &updateConfigReq.ServedModels)
|
|
if err != nil {
|
|
return fmt.Errorf("invalid SERVED_MODELS: %s", args[0])
|
|
}
|
|
updateConfigReq.Name = args[1]
|
|
|
|
if updateConfigSkipWait {
|
|
response, err := w.ServingEndpoints.UpdateConfig(ctx, updateConfigReq)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
return cmdio.Render(ctx, response)
|
|
}
|
|
spinner := cmdio.Spinner(ctx)
|
|
info, err := w.ServingEndpoints.UpdateConfigAndWait(ctx, updateConfigReq,
|
|
retries.Timeout[serving.ServingEndpointDetailed](updateConfigTimeout),
|
|
func(i *retries.Info[serving.ServingEndpointDetailed]) {
|
|
if i.Info == nil {
|
|
return
|
|
}
|
|
status := i.Info.State.ConfigUpdate
|
|
statusMessage := fmt.Sprintf("current status: %s", status)
|
|
spinner <- statusMessage
|
|
})
|
|
close(spinner)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
return cmdio.Render(ctx, info)
|
|
},
|
|
}
|
|
|
|
// end service ServingEndpoints
|