databricks-cli/bundle/config/loader/process_include.go

186 lines
4.6 KiB
Go
Raw Normal View History

package loader
import (
"context"
"fmt"
2024-09-24 14:39:02 +00:00
"sort"
"strings"
"github.com/databricks/cli/bundle"
"github.com/databricks/cli/bundle/config"
"github.com/databricks/cli/libs/diag"
"github.com/databricks/cli/libs/dyn"
2024-09-24 14:39:02 +00:00
"golang.org/x/exp/maps"
)
var resourceTypes = []string{
"job",
"pipeline",
"model",
"experiment",
"model_serving_endpoint",
"registered_model",
"quality_monitor",
"schema",
2024-09-24 15:39:20 +00:00
"cluster",
}
2024-09-24 12:39:28 +00:00
func validateFileFormat(r *config.Root, filePath string) diag.Diagnostics {
for _, typ := range resourceTypes {
for _, ext := range []string{fmt.Sprintf(".%s.yml", typ), fmt.Sprintf(".%s.yaml", typ)} {
if strings.HasSuffix(filePath, ext) {
return validateSingleResourceDefined(r, ext, typ)
}
}
}
return nil
}
2024-09-24 12:39:28 +00:00
func validateSingleResourceDefined(r *config.Root, ext, typ string) diag.Diagnostics {
type resource struct {
path dyn.Path
value dyn.Value
typ string
key string
}
resources := []resource{}
2024-09-24 12:39:28 +00:00
// Gather all resources defined in the resources block.
_, err := dyn.MapByPattern(
r.Value(),
dyn.NewPattern(dyn.Key("resources"), dyn.AnyKey(), dyn.AnyKey()),
func(p dyn.Path, v dyn.Value) (dyn.Value, error) {
// The key for the resource. Eg: "my_job" for jobs.my_job.
k := p[2].Key()
// The type of the resource. Eg: "job" for jobs.my_job.
typ := strings.TrimSuffix(p[1].Key(), "s")
2024-09-24 12:39:28 +00:00
resources = append(resources, resource{path: p, value: v, typ: typ, key: k})
return v, nil
})
if err != nil {
2024-09-24 12:39:28 +00:00
return diag.FromErr(err)
}
// Gather all resources defined in a target block.
_, err = dyn.MapByPattern(
r.Value(),
dyn.NewPattern(dyn.Key("targets"), dyn.AnyKey(), dyn.Key("resources"), dyn.AnyKey(), dyn.AnyKey()),
func(p dyn.Path, v dyn.Value) (dyn.Value, error) {
2024-09-24 12:39:28 +00:00
// The key for the resource. Eg: "my_job" for jobs.my_job.
k := p[4].Key()
2024-09-24 12:39:28 +00:00
// The type of the resource. Eg: "job" for jobs.my_job.
typ := strings.TrimSuffix(p[3].Key(), "s")
2024-09-24 12:39:28 +00:00
resources = append(resources, resource{path: p, value: v, typ: typ, key: k})
return v, nil
2024-09-24 12:39:28 +00:00
})
if err != nil {
return diag.FromErr(err)
}
valid := true
seenKeys := map[string]struct{}{}
for _, rr := range resources {
if len(seenKeys) == 0 {
seenKeys[rr.key] = struct{}{}
continue
}
if _, ok := seenKeys[rr.key]; !ok {
valid = false
break
}
if rr.typ != typ {
valid = false
break
}
}
// The file only contains one resource defined in its resources or targets block,
// and the resource is of the correct type.
if valid {
return nil
}
msg := strings.Builder{}
2024-09-24 14:39:02 +00:00
msg.WriteString(fmt.Sprintf("We recommend only defining a single %s in a file with the %s extension.\n", typ, ext))
// Dedup the list of resources before adding them the diagnostic message. This
// is needed because we do not dedup earlier when gathering the resources and
// it's valid to define the same resource in both the resources and targets block.
2024-09-24 12:39:28 +00:00
msg.WriteString("The following resources are defined or configured in this file:\n")
2024-09-24 14:39:02 +00:00
setOfLines := map[string]struct{}{}
2024-09-24 12:39:28 +00:00
for _, r := range resources {
2024-09-24 14:39:02 +00:00
setOfLines[fmt.Sprintf(" - %s (%s)\n", r.key, r.typ)] = struct{}{}
}
// Sort the line s to print to make the output deterministic.
listOfLines := maps.Keys(setOfLines)
sort.Strings(listOfLines)
for _, l := range listOfLines {
msg.WriteString(l)
2024-09-24 12:39:28 +00:00
}
locations := []dyn.Location{}
paths := []dyn.Path{}
for _, rr := range resources {
locations = append(locations, rr.value.Locations()...)
paths = append(paths, rr.path)
}
2024-09-24 14:39:02 +00:00
// Sort the locations and paths to make the output deterministic.
sort.Slice(locations, func(i, j int) bool {
return locations[i].String() < locations[j].String()
})
sort.Slice(paths, func(i, j int) bool {
return paths[i].String() < paths[j].String()
})
2024-09-24 12:39:28 +00:00
return diag.Diagnostics{
{
Severity: diag.Info,
Summary: msg.String(),
Locations: locations,
Paths: paths,
},
2024-09-24 12:39:28 +00:00
}
}
type processInclude struct {
fullPath string
relPath string
}
// ProcessInclude loads the configuration at [fullPath] and merges it into the configuration.
func ProcessInclude(fullPath, relPath string) bundle.Mutator {
return &processInclude{
fullPath: fullPath,
relPath: relPath,
}
}
func (m *processInclude) Name() string {
return fmt.Sprintf("ProcessInclude(%s)", m.relPath)
}
func (m *processInclude) Apply(_ context.Context, b *bundle.Bundle) diag.Diagnostics {
this, diags := config.Load(m.fullPath)
if diags.HasError() {
return diags
}
2024-09-24 12:39:28 +00:00
// Add any diagnostics associated with the file format.
diags = append(diags, validateFileFormat(this, m.relPath)...)
2024-09-24 15:42:03 +00:00
if diags.HasError() {
return diags
}
err := b.Config.Merge(this)
if err != nil {
diags = diags.Extend(diag.FromErr(err))
}
return diags
}