databricks-cli/cmd/bundle/generate/pipeline.go

118 lines
3.4 KiB
Go

package generate
import (
"errors"
"fmt"
"io/fs"
"os"
"path/filepath"
"github.com/databricks/cli/bundle/config/generate"
"github.com/databricks/cli/cmd/root"
"github.com/databricks/cli/libs/cmdio"
"github.com/databricks/cli/libs/dyn"
"github.com/databricks/cli/libs/dyn/yamlsaver"
"github.com/databricks/cli/libs/textutil"
"github.com/databricks/databricks-sdk-go/service/pipelines"
"github.com/spf13/cobra"
"gopkg.in/yaml.v3"
)
func NewGeneratePipelineCommand() *cobra.Command {
var configDir string
var sourceDir string
var pipelineId string
var force bool
cmd := &cobra.Command{
Use: "pipeline",
Short: "Generate bundle configuration for a pipeline",
}
cmd.Flags().StringVar(&pipelineId, "existing-pipeline-id", "", `ID of the pipeline to generate config for`)
cmd.MarkFlagRequired("existing-pipeline-id")
wd, err := os.Getwd()
if err != nil {
wd = "."
}
cmd.Flags().StringVarP(&configDir, "config-dir", "d", filepath.Join(wd, "resources"), `Dir path where the output config will be stored`)
cmd.Flags().StringVarP(&sourceDir, "source-dir", "s", filepath.Join(wd, "src"), `Dir path where the downloaded files will be stored`)
cmd.Flags().BoolVarP(&force, "force", "f", false, `Force overwrite existing files in the output directory`)
cmd.RunE = func(cmd *cobra.Command, args []string) error {
ctx := cmd.Context()
b, diags := root.MustConfigureBundle(cmd)
if err := diags.Error(); err != nil {
return diags.Error()
}
w := b.WorkspaceClient()
pipeline, err := w.Pipelines.Get(ctx, pipelines.GetPipelineRequest{PipelineId: pipelineId})
if err != nil {
return err
}
downloader := newDownloader(w, sourceDir, configDir)
for _, lib := range pipeline.Spec.Libraries {
err := downloader.MarkPipelineLibraryForDownload(ctx, &lib)
if err != nil {
return err
}
}
v, err := generate.ConvertPipelineToValue(pipeline.Spec)
if err != nil {
return err
}
pipelineKey := cmd.Flag("key").Value.String()
if pipelineKey == "" {
pipelineKey = textutil.NormalizeString(pipeline.Name)
}
result := map[string]dyn.Value{
"resources": dyn.V(map[string]dyn.Value{
"pipelines": dyn.V(map[string]dyn.Value{
pipelineKey: v,
}),
}),
}
err = downloader.FlushToDisk(ctx, force)
if err != nil {
return err
}
oldFilename := filepath.Join(configDir, pipelineKey+".yml")
filename := filepath.Join(configDir, pipelineKey+".pipeline.yml")
// User might continuously run generate command to update their bundle jobs with any changes made in Databricks UI.
// Due to changing in the generated file names, we need to first rename existing resource file to the new name.
// Otherwise users can end up with duplicated resources.
err = os.Rename(oldFilename, filename)
if err != nil && !errors.Is(err, fs.ErrNotExist) {
return fmt.Errorf("failed to rename file %s. DABs uses the resource type as a sub-extension for generated content, please rename it to %s, err: %w", oldFilename, filename, err)
}
saver := yamlsaver.NewSaverWithStyle(
// Including all PipelineSpec and nested fields which are map[string]string type
map[string]yaml.Style{
"spark_conf": yaml.DoubleQuotedStyle,
"custom_tags": yaml.DoubleQuotedStyle,
"configuration": yaml.DoubleQuotedStyle,
},
)
err = saver.SaveAsYAML(result, filename, force)
if err != nil {
return err
}
cmdio.LogString(ctx, "Pipeline configuration successfully saved to "+filename)
return nil
}
return cmd
}