2024-12-27 13:32:08 +00:00
|
|
|
package mutator
|
|
|
|
|
|
|
|
import (
|
|
|
|
"context"
|
|
|
|
"fmt"
|
|
|
|
|
|
|
|
"github.com/databricks/cli/bundle"
|
|
|
|
"github.com/databricks/cli/bundle/config/resources"
|
|
|
|
"github.com/databricks/cli/libs/diag"
|
|
|
|
)
|
|
|
|
|
|
|
|
type resolveSchemeDependency struct{}
|
|
|
|
|
|
|
|
// If a user defines a UC schema in the bundle, they can refer to it in DLT pipelines
|
|
|
|
// or UC Volumes using the `${resources.schemas.<schema_key>.name}` syntax. Using this
|
|
|
|
// syntax allows TF to capture the deploy time dependency this DLT pipeline or UC Volume
|
|
|
|
// has on the schema and deploy changes to the schema before deploying the pipeline or volume.
|
|
|
|
//
|
|
|
|
// This mutator translates any implicit schema references in DLT pipelines or UC Volumes
|
|
|
|
// to the explicit syntax.
|
|
|
|
func ResolveSchemaDependency() bundle.Mutator {
|
|
|
|
return &resolveSchemeDependency{}
|
|
|
|
}
|
|
|
|
|
|
|
|
func (m *resolveSchemeDependency) Name() string {
|
|
|
|
return "ResolveSchemaDependency"
|
|
|
|
}
|
|
|
|
|
|
|
|
func findSchema(b *bundle.Bundle, catalogName, name string) (string, *resources.Schema) {
|
|
|
|
if catalogName == "" || name == "" {
|
|
|
|
return "", nil
|
|
|
|
}
|
|
|
|
|
|
|
|
for k, s := range b.Config.Resources.Schemas {
|
|
|
|
if s.CatalogName == catalogName && s.Name == name {
|
|
|
|
return k, s
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return "", nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func resolveVolume(v *resources.Volume, b *bundle.Bundle) {
|
|
|
|
schemaK, schema := findSchema(b, v.CatalogName, v.SchemaName)
|
|
|
|
if schema == nil {
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
|
|
|
v.SchemaName = fmt.Sprintf("${resources.schemas.%s.name}", schemaK)
|
|
|
|
}
|
|
|
|
|
|
|
|
func resolvePipeline(p *resources.Pipeline, b *bundle.Bundle) {
|
|
|
|
// schema and target have the same semantics in the DLT API but are mutually
|
|
|
|
// exclusive. If schema is set, the pipeline is in direct publishing mode
|
2024-12-27 13:48:14 +00:00
|
|
|
// and can write tables to multiple schemas (vs target which is limited to a single schema).
|
2024-12-27 13:32:08 +00:00
|
|
|
schemaName := p.Schema
|
|
|
|
if schemaName == "" {
|
|
|
|
schemaName = p.Target
|
|
|
|
}
|
|
|
|
|
|
|
|
schemaK, schema := findSchema(b, p.Catalog, schemaName)
|
|
|
|
if schema == nil {
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
|
|
|
if p.Schema != "" {
|
|
|
|
p.Schema = fmt.Sprintf("${resources.schemas.%s.name}", schemaK)
|
|
|
|
} else if p.Target != "" {
|
|
|
|
p.Target = fmt.Sprintf("${resources.schemas.%s.name}", schemaK)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func (m *resolveSchemeDependency) Apply(ctx context.Context, b *bundle.Bundle) diag.Diagnostics {
|
|
|
|
for _, p := range b.Config.Resources.Pipelines {
|
|
|
|
resolvePipeline(p, b)
|
|
|
|
}
|
|
|
|
for _, v := range b.Config.Resources.Volumes {
|
|
|
|
resolveVolume(v, b)
|
|
|
|
}
|
|
|
|
return nil
|
|
|
|
}
|