databricks-cli/bundle/config/validate/unique_resource_keys.go

127 lines
3.5 KiB
Go
Raw Normal View History

2024-05-16 12:03:31 +00:00
package validate
import (
"context"
"fmt"
2024-05-27 12:32:01 +00:00
"slices"
"strings"
2024-05-16 12:03:31 +00:00
"github.com/databricks/cli/bundle"
"github.com/databricks/cli/libs/diag"
"github.com/databricks/cli/libs/dyn"
)
// TODO: Ensure the solution here works for dup keys in the same resource type.
func UniqueResourceKeys() bundle.ReadOnlyMutator {
return &uniqueResourceKeys{}
}
type uniqueResourceKeys struct{}
func (m *uniqueResourceKeys) Name() string {
return "validate:unique_resource_keys"
}
2024-05-27 12:32:01 +00:00
// Validate a single resource is only defined at a single location. We do not allow
// a single resource to be defined at multiple files.
// func validateSingleYamlFile(rv dyn.Value, rp dyn.Path) error {
// rrv, err := dyn.GetByPath(rv, rp)
// if err != nil {
// return err
// }
// _, err = dyn.Walk(rrv, func(p dyn.Path, v dyn.Value) (dyn.Value, error) {
// locations := v.YamlLocations()
// if len(locations) <= 1 {
// return v, nil
// }
// return v, fmt.Errorf("resource %s has been defined at multiple locations: (%s)", rp.String(), strings.Join(ls, ", "))
// })
// return err
// }
2024-05-16 12:03:31 +00:00
// TODO: Ensure all duplicate key sites are returned to the user in the diagnostics.
2024-05-16 14:04:33 +00:00
// TODO: Add unit tests for this mutator.
2024-05-27 12:32:01 +00:00
// TODO: l is not effective location because of additive semantics. Clarify this in the
// documentation.
2024-05-16 12:03:31 +00:00
func (m *uniqueResourceKeys) Apply(ctx context.Context, rb bundle.ReadOnlyBundle) diag.Diagnostics {
diags := diag.Diagnostics{}
2024-05-27 12:32:01 +00:00
// Map of resource identifiers to their paths.
// Example entry: my_job -> jobs.my_job
seenPaths := make(map[string]dyn.Path)
2024-05-16 12:03:31 +00:00
rv := rb.Config().ReadOnlyValue().Get("resources")
// Walk the resources tree and accumulate the resource identifiers.
_, err := dyn.Walk(rv, func(p dyn.Path, v dyn.Value) (dyn.Value, error) {
// The path is expected to be of length 2, and of the form <resource_type>.<resource_identifier>.
// Eg: jobs.my_job, pipelines.my_pipeline, etc.
if len(p) < 2 {
return v, nil
}
if len(p) > 2 {
return v, dyn.ErrSkip
}
// If the resource identifier already exists in the map, return an error.
k := p[1].Key()
2024-05-27 12:32:01 +00:00
if _, ok := seenPaths[k]; ok {
2024-05-16 12:03:31 +00:00
// Value of the resource that's already been seen
2024-05-27 12:32:01 +00:00
ov, _ := dyn.GetByPath(rv, seenPaths[k])
2024-05-16 12:03:31 +00:00
// Value of the newly encountered resource with a duplicate identifier.
nv, _ := dyn.GetByPath(rv, p)
// Error, encountered a duplicate resource identifier.
diags = append(diags, diag.Diagnostic{
Severity: diag.Error,
2024-05-27 12:32:01 +00:00
Summary: fmt.Sprintf("multiple resources named %s (%s at %s, %s at %s)", k, seenPaths[k].String(), ov.Location(), p.String(), nv.Location()),
2024-05-16 12:03:31 +00:00
Location: nv.Location(),
})
}
2024-05-27 12:32:01 +00:00
s := p.String()
if s == "jobs.foo" {
fmt.Println("jobs.foo")
}
yamlLocations := v.YamlLocations()
if len(yamlLocations) > 1 {
// Sort locations to make the error message deterministic.
ls := make([]string, 0, len(yamlLocations))
for _, l := range yamlLocations {
ls = append(ls, l.String())
}
slices.Sort(ls)
diags = append(diags, diag.Diagnostic{
Severity: diag.Error,
Summary: fmt.Sprintf("resource %s has been defined at multiple locations: (%s)", p.String(), strings.Join(ls, ", ")),
Location: v.Location(),
})
}
// err := validateSingleYamlFile(rv, p)
// if err != nil {
// diags = append(diags, diag.Diagnostic{
// Severity: diag.Error,
// Summary: err.Error(),
// Location: v.Location(),
// })
// }
2024-05-16 12:03:31 +00:00
// Accumulate the resource identifier and its path.
2024-05-27 12:32:01 +00:00
seenPaths[k] = p
2024-05-16 12:03:31 +00:00
return v, nil
})
if err != nil {
diags = append(diags, diag.FromErr(err)...)
}
return diags
}