From 3e1e169225da28299e7c1deae4f818511bc80823 Mon Sep 17 00:00:00 2001 From: Lennart Kats Date: Mon, 16 Dec 2024 10:33:48 +0100 Subject: [PATCH] Add reflection/dyn-based tests --- bundle/config/mutator/apply_presets.go | 28 +- bundle/config/mutator/apply_presets_test.go | 431 ++++++++------------ 2 files changed, 189 insertions(+), 270 deletions(-) diff --git a/bundle/config/mutator/apply_presets.go b/bundle/config/mutator/apply_presets.go index 3866ae57f..7cfbfd851 100644 --- a/bundle/config/mutator/apply_presets.go +++ b/bundle/config/mutator/apply_presets.go @@ -244,23 +244,23 @@ func (m *applyPresets) Apply(ctx context.Context, b *bundle.Bundle) diag.Diagnos // Quality monitors presets // Supported: Schedule, Catalog, Schema // Not supported: Tags (not in API as of 2024-10) - if t.TriggerPauseStatus == config.Paused { - for key, q := range r.QualityMonitors { - if q.CreateMonitor == nil { - diags = diags.Extend(diag.Errorf("quality monitor %s is not defined", key)) - continue - } - // Remove all schedules from monitors, since they don't support pausing/unpausing. - // Quality monitors might support the "pause" property in the future, so at the - // CLI level we do respect that property if it is set to "unpaused." + for key, q := range r.QualityMonitors { + if q.CreateMonitor == nil { + diags = diags.Extend(diag.Errorf("quality monitor %s is not defined", key)) + continue + } + // Remove all schedules from monitors, since they don't support pausing/unpausing. + // Quality monitors might support the "pause" property in the future, so at the + // CLI level we do respect that property if it is set to "unpaused." + if t.TriggerPauseStatus == config.Paused { if q.Schedule != nil && q.Schedule.PauseStatus != catalog.MonitorCronSchedulePauseStatusUnpaused { q.Schedule = nil } - if t.Catalog != "" && t.Schema != "" { - parts := strings.Split(q.TableName, ".") - if len(parts) != 3 { - q.TableName = fmt.Sprintf("%s.%s.%s", t.Catalog, t.Schema, q.TableName) - } + } + if t.Catalog != "" && t.Schema != "" { + q.TableName = fullyQualifyName(q.TableName, t.Catalog, t.Schema) + if q.OutputSchemaName == "" { + q.OutputSchemaName = t.Catalog + "." + t.Schema } } } diff --git a/bundle/config/mutator/apply_presets_test.go b/bundle/config/mutator/apply_presets_test.go index fd99dc212..5a05115c4 100644 --- a/bundle/config/mutator/apply_presets_test.go +++ b/bundle/config/mutator/apply_presets_test.go @@ -2,10 +2,8 @@ package mutator_test import ( "context" - "fmt" "reflect" "runtime" - "strconv" "strings" "testing" @@ -17,18 +15,17 @@ import ( "github.com/databricks/cli/libs/dbr" "github.com/databricks/cli/libs/dyn" "github.com/databricks/databricks-sdk-go/service/catalog" - "github.com/databricks/databricks-sdk-go/service/compute" - "github.com/databricks/databricks-sdk-go/service/dashboards" "github.com/databricks/databricks-sdk-go/service/jobs" - "github.com/databricks/databricks-sdk-go/service/ml" "github.com/databricks/databricks-sdk-go/service/pipelines" "github.com/databricks/databricks-sdk-go/service/serving" "github.com/stretchr/testify/require" ) -type RecordedField struct { - Path string - Value string +type recordedField struct { + Path dyn.Path + PathString string + Placeholder string + Expected string } func TestApplyPresetsPrefix(t *testing.T) { @@ -473,7 +470,7 @@ func TestApplyPresetsCatalogSchema(t *testing.T) { Config: config.Root{ Resources: config.Resources{ Jobs: map[string]*resources.Job{ - "object": { + "key": { JobSettings: &jobs.JobSettings{ Name: "job", Parameters: []jobs.JobParameterDefinition{ @@ -484,7 +481,7 @@ func TestApplyPresetsCatalogSchema(t *testing.T) { }, }, Pipelines: map[string]*resources.Pipeline{ - "object": { + "key": { PipelineSpec: &pipelines.PipelineSpec{ Name: "pipeline", Catalog: "", @@ -493,7 +490,7 @@ func TestApplyPresetsCatalogSchema(t *testing.T) { }, }, ModelServingEndpoints: map[string]*resources.ModelServingEndpoint{ - "object": { + "key": { CreateServingEndpoint: &serving.CreateServingEndpoint{ Name: "serving", AiGateway: &serving.AiGatewayConfig{ @@ -518,7 +515,7 @@ func TestApplyPresetsCatalogSchema(t *testing.T) { }, }, RegisteredModels: map[string]*resources.RegisteredModel{ - "object": { + "key": { CreateRegisteredModelRequest: &catalog.CreateRegisteredModelRequest{ Name: "registered_model", CatalogName: "", @@ -527,49 +524,21 @@ func TestApplyPresetsCatalogSchema(t *testing.T) { }, }, QualityMonitors: map[string]*resources.QualityMonitor{ - "object": { - TableName: "table", + "key": { + TableName: "..table", CreateMonitor: &catalog.CreateMonitor{ OutputSchemaName: ".", }, }, }, Schemas: map[string]*resources.Schema{ - "object": { + "key": { CreateSchema: &catalog.CreateSchema{ Name: "", CatalogName: "", }, }, }, - Models: map[string]*resources.MlflowModel{ - "object": { - Model: &ml.Model{ - Name: "..model", - }, - }, - }, - Experiments: map[string]*resources.MlflowExperiment{ - "object": { - Experiment: &ml.Experiment{ - Name: "..experiment", - }, - }, - }, - Clusters: map[string]*resources.Cluster{ - "object": { - ClusterSpec: &compute.ClusterSpec{ - ClusterName: "cluster", - }, - }, - }, - Dashboards: map[string]*resources.Dashboard{ - "object": { - Dashboard: &dashboards.Dashboard{ - DisplayName: "dashboard", - }, - }, - }, }, }, } @@ -577,243 +546,194 @@ func TestApplyPresetsCatalogSchema(t *testing.T) { Catalog: "my_catalog", Schema: "my_schema", } - - // Stage 1: Apply presets BEFORE cleanup. - // Because all fields are already set to placeholders, Apply should NOT overwrite them (no-op). ctx := context.Background() + + // Initial scan: record all fields that contain placeholders. + // We do this before the first apply so we can verify no changes occur. + var recordedFields []recordedField + require.NoError(t, b.Config.Mutate(func(root dyn.Value) (dyn.Value, error) { + _, err := dyn.Walk(b.Config.Value(), func(p dyn.Path, v dyn.Value) (dyn.Value, error) { + if v.Kind() == dyn.KindString { + val := v.MustString() + if strings.Contains(val, "") || strings.Contains(val, "") { + pathCopy := make(dyn.Path, len(p)) + copy(pathCopy, p) + recordedFields = append(recordedFields, recordedField{ + Path: pathCopy, + PathString: pathCopy.String(), + Placeholder: val, + Expected: replacePlaceholders(val, "my_catalog", "my_schema"), + }) + } + } + return v, nil + }) + return root, err + })) + + // Stage 1: Apply presets before cleanup, should be no-op. diags := bundle.Apply(ctx, b, mutator.ApplyPresets()) require.False(t, diags.HasError(), "unexpected error before cleanup: %v", diags.Error()) - verifyNoChangesBeforeCleanup(t, b.Config) - // Stage 2: Cleanup all "" and "" placeholders - // and record where they were. - b.Config.MarkMutatorEntry(ctx) - resources := reflect.ValueOf(&b.Config.Resources).Elem() - recordedFields := recordAndCleanupFields(resources, "Resources") - b.Config.Resources.Jobs["object"].Parameters = nil - b.Config.MarkMutatorExit(ctx) + // Verify that no recorded fields changed + verifyNoChangesBeforeCleanup(t, b.Config.Value(), recordedFields) + + // Stage 2: Cleanup: Walk over rootVal and remove placeholders, adjusting recordedFields Expected values. + require.NoError(t, b.Config.Mutate(func(root dyn.Value) (dyn.Value, error) { + for _, f := range recordedFields { + value, err := dyn.GetByPath(root, f.Path) + require.NoError(t, err) + + val := value.MustString() + cleanedVal := removePlaceholders(val) + root, err = dyn.SetByPath(root, f.Path, dyn.V(cleanedVal)) + require.NoError(t, err) + } + root, err := dyn.Set(root, "resources.jobs.key.parameters", dyn.NilValue) + require.NoError(t, err) + return root, nil + })) // Stage 3: Apply presets after cleanup. diags = bundle.Apply(ctx, b, mutator.ApplyPresets()) require.False(t, diags.HasError(), "unexpected error after cleanup: %v", diags.Error()) - verifyAllFields(t, b.Config, recordedFields) - // Stage 4: Verify that all known fields in config.Resources have been processed. - checkCompleteness(t, &b.Config.Resources, "Resources", recordedFields) -} - -func verifyNoChangesBeforeCleanup(t *testing.T, cfg config.Root) { - t.Helper() - - // Just check a few representative fields to ensure they are still placeholders. - // For example: Job parameter defaults should still have "" and "" - jobParams := cfg.Resources.Jobs["object"].Parameters - require.Len(t, jobParams, 2, "job parameters count mismatch") - require.Equal(t, "", jobParams[0].Default, "expected no changes before cleanup") - require.Equal(t, "", jobParams[1].Default, "expected no changes before cleanup") - - pipeline := cfg.Resources.Pipelines["object"] - require.Equal(t, "", pipeline.Catalog, "expected no changes before cleanup") - require.Equal(t, "", pipeline.Target, "expected no changes before cleanup") -} - -// recordAndCleanupFields recursively finds all Catalog/CatalogName/Schema/SchemaName fields, -// records their original values, and replaces them with empty strings. -func recordAndCleanupFields(rv reflect.Value, path string) []RecordedField { - var recordedFields []RecordedField - - switch rv.Kind() { - case reflect.Ptr, reflect.Interface: - if !rv.IsNil() { - recordedFields = append(recordedFields, recordAndCleanupFields(rv.Elem(), path)...) - } - - case reflect.Struct: - tp := rv.Type() - for i := 0; i < rv.NumField(); i++ { - ft := tp.Field(i) - fv := rv.Field(i) - fPath := path + "." + ft.Name - - if fv.Kind() == reflect.String { - original := fv.String() - newVal := cleanedValue(original) - if newVal != original { - fv.SetString(newVal) - recordedFields = append(recordedFields, RecordedField{fPath, original}) - } - } - - recordedFields = append(recordedFields, recordAndCleanupFieldsRecursive(fv, fPath)...) - } - - case reflect.Map: - for _, mk := range rv.MapKeys() { - mVal := rv.MapIndex(mk) - recordedFields = append(recordedFields, recordAndCleanupFieldsRecursive(mVal, path+"."+mk.String())...) - } - - case reflect.Slice, reflect.Array: - for i := 0; i < rv.Len(); i++ { - recordedFields = append(recordedFields, recordAndCleanupFieldsRecursive(rv.Index(i), fmt.Sprintf("%s[%d]", path, i))...) - } - } - - return recordedFields -} - -// verifyAllFields checks if all collected fields are now properly replaced after ApplyPresets. -func verifyAllFields(t *testing.T, cfg config.Root, recordedFields []RecordedField) { - t.Helper() + // Verify that fields have the expected replacements + config := b.Config.Value() for _, f := range recordedFields { - expected := replaceCatalogSchemaPlaceholders(f.Value) - got := getStringValueAtPath(t, reflect.ValueOf(cfg), f.Path) - require.Equal(t, expected, got, "expected catalog/schema to be replaced by preset values at %s", f.Path) + val, err := dyn.GetByPath(config, f.Path) + require.NoError(t, err, "failed to get path %s", f.Path) + require.Equal(t, f.Expected, val.MustString(), "preset value expected for %s based on placeholder %s", f.Path, f.Placeholder) + } + + // Stage 4: Check completeness + ignoredFields := map[string]string{ + // Any fields that should be ignored in the completeness check + // Example: + // "resources.jobs.object.schema_something": "this property doesn't relate to the catalog/schema", + } + checkCompleteness(t, recordedFields, ignoredFields) +} + +func verifyNoChangesBeforeCleanup(t *testing.T, rootVal dyn.Value, recordedFields []recordedField) { + t.Helper() + + for _, f := range recordedFields { + val, err := dyn.GetByPath(rootVal, f.Path) + require.NoError(t, err, "failed to get path %s", f.Path) + require.Equal(t, f.Placeholder, val.MustString(), + "expected placeholder '%s' at %s to remain unchanged before cleanup", f.Placeholder, f.Path) } } -// checkCompleteness ensures that all catalog/schema fields have been processed. -func checkCompleteness(t *testing.T, root interface{}, rootPath string, recordedFields []RecordedField) { +func checkCompleteness(t *testing.T, recordedFields []recordedField, ignoredFields map[string]string) { t.Helper() - recordedSet := make(map[string]bool) - for _, f := range recordedFields { - recordedSet[f.Path] = true + + // Build a set for recorded fields + recordedSet := make(map[string]struct{}) + for _, field := range recordedFields { + recordedSet[field.PathString] = struct{}{} } - var check func(rv reflect.Value, path string) - check = func(rv reflect.Value, path string) { - switch rv.Kind() { - case reflect.Ptr, reflect.Interface: - if !rv.IsNil() { - check(rv.Elem(), path) - } - case reflect.Struct: - tp := rv.Type() - for i := 0; i < rv.NumField(); i++ { - ft := tp.Field(i) - fv := rv.Field(i) - fPath := path + "." + ft.Name - if isCatalogOrSchemaField(ft.Name) { - require.Truef(t, recordedSet[fPath], - "Field %s was not recorded in recordedFields (completeness check failed)", fPath) - } - check(fv, fPath) - } - case reflect.Map: - for _, mk := range rv.MapKeys() { - mVal := rv.MapIndex(mk) - check(mVal, path+"."+mk.String()) - } + // Obtain the type of config.Resources + var r config.Resources + resourcesType := reflect.TypeOf(r) + + // Track missing fields + var missingFields []string + + // Keep track of visited types to prevent infinite loops (cycles) + visited := make(map[reflect.Type]struct{}) + + // Helper function to handle maps, slices, arrays, and nested pointers/interfaces + verifyFieldType := func(fieldType reflect.Type, path string, fn func(reflect.Type, string)) { + switch fieldType.Kind() { case reflect.Slice, reflect.Array: - for i := 0; i < rv.Len(); i++ { - check(rv.Index(i), fmt.Sprintf("%s[%d]", path, i)) - } - } - } - - rv := reflect.ValueOf(root) - if rv.Kind() == reflect.Ptr { - rv = rv.Elem() - } - check(rv, rootPath) -} - -// getStringValueAtPath navigates the given path and returns the string value at that path. -func getStringValueAtPath(t *testing.T, root reflect.Value, path string) string { - t.Helper() - parts := strings.Split(path, ".") - return navigatePath(t, root, parts) -} - -func navigatePath(t *testing.T, rv reflect.Value, parts []string) string { - t.Helper() - - // Trim empty parts if any - for len(parts) > 0 && parts[0] == "" { - parts = parts[1:] - } - - for len(parts) > 0 { - part := parts[0] - parts = parts[1:] - - // Dereference pointers/interfaces before proceeding - for rv.Kind() == reflect.Ptr || rv.Kind() == reflect.Interface { - require.Falsef(t, rv.IsNil(), "nil pointer or interface encountered at part '%s'", part) - rv = rv.Elem() - } - - // If the part has indexing like "Parameters[0]", split it into "Parameters" and "[0]" - var indexPart string - fieldName := part - if idx := strings.IndexRune(part, '['); idx != -1 { - // e.g. part = "Parameters[0]" - fieldName = part[:idx] // "Parameters" - indexPart = part[idx:] // "[0]" - require.Truef(t, strings.HasPrefix(indexPart, "["), "expected '[' in indexing") - require.Truef(t, strings.HasSuffix(indexPart, "]"), "expected ']' at end of indexing") - } - - // Navigate down structures/maps - switch rv.Kind() { - case reflect.Struct: - // Find the struct field by name - ft, ok := rv.Type().FieldByName(fieldName) - if !ok { - t.Fatalf("Could not find field '%s' in struct at path", fieldName) - } - rv = rv.FieldByIndex(ft.Index) - + // For arrays/slices, inspect the element type + fn(fieldType.Elem(), path+"[0]") case reflect.Map: - // Use fieldName as map key - mapVal := rv.MapIndex(reflect.ValueOf(fieldName)) - require.Truef(t, mapVal.IsValid(), "no map entry '%s' found in path", fieldName) - rv = mapVal - - default: - // If we're here, maybe we expected a struct or map but got something else - t.Fatalf("Unexpected kind '%s' when looking for '%s'", rv.Kind(), fieldName) - } - - // If there's an index part, apply it now - if indexPart != "" { - // Dereference again if needed - for rv.Kind() == reflect.Ptr || rv.Kind() == reflect.Interface { - require.False(t, rv.IsNil(), "nil pointer or interface when indexing") - rv = rv.Elem() + // For maps, inspect the value type + fn(fieldType.Elem(), path+".key") + case reflect.Ptr, reflect.Interface: + // For pointers/interfaces, inspect the element if it's a pointer + if fieldType.Kind() == reflect.Ptr { + fn(fieldType.Elem(), path) } - - require.Truef(t, rv.Kind() == reflect.Slice || rv.Kind() == reflect.Array, "expected slice/array for indexing but got %s", rv.Kind()) - - idxStr := indexPart[1 : len(indexPart)-1] // remove [ and ] - idx, err := strconv.Atoi(idxStr) - require.NoError(t, err, "invalid slice index %s", indexPart) - - require.Truef(t, idx < rv.Len(), "index %d out of range in slice/array of length %d", idx, rv.Len()) - rv = rv.Index(idx) + case reflect.Struct: + // For structs, directly recurse into their fields + fn(fieldType, path) + default: + // For basic or unknown kinds, do nothing } } - // Dereference if needed at the leaf - for rv.Kind() == reflect.Ptr || rv.Kind() == reflect.Interface { - require.False(t, rv.IsNil(), "nil pointer or interface at leaf") - rv = rv.Elem() + // Recursive function to verify the fields of a given type. + var verifyTypeFields func(rt reflect.Type, path string) + verifyTypeFields = func(rt reflect.Type, path string) { + // Avoid cycles by skipping already visited types + if _, seen := visited[rt]; seen { + return + } + visited[rt] = struct{}{} + + switch rt.Kind() { + case reflect.Ptr, reflect.Interface: + // For pointers/interfaces, inspect the element type if available + if rt.Kind() == reflect.Ptr { + verifyTypeFields(rt.Elem(), path) + } + case reflect.Struct: + for i := 0; i < rt.NumField(); i++ { + ft := rt.Field(i) + jsonTag := ft.Tag.Get("json") + if jsonTag == "" || jsonTag == "-" { + // Ignore field names when there's no JSON tag, + // e.g. for Jobs.JobSettings + verifyFieldType(ft.Type, path, verifyTypeFields) + continue + } + + fieldName := strings.Split(jsonTag, ",")[0] + fieldPath := path + "." + fieldName + + if isCatalogOrSchemaField(fieldName) { + // Only check if the field is a string + if ft.Type.Kind() == reflect.String { + if _, recorded := recordedSet[fieldPath]; !recorded { + if _, ignored := ignoredFields[fieldPath]; !ignored { + missingFields = append(missingFields, fieldPath) + } + } + } + } + + verifyFieldType(ft.Type, fieldPath, verifyTypeFields) + } + default: + // For other kinds at this level, do nothing + } } - require.Equal(t, reflect.String, rv.Kind(), "expected a string at the final path") - return rv.String() + // Start from "resources" + verifyTypeFields(resourcesType, "resources") + + // Report all missing fields + for _, field := range missingFields { + t.Errorf("Field %s was not included in the test (should be covered in 'recordedFields' or 'ignoredFields')", field) + } + + // Fail the test if there were any missing fields + if len(missingFields) > 0 { + t.FailNow() + } } +// isCatalogOrSchemaField returns true for a field names in config.Resources that we suspect could contain a catalog or schema name func isCatalogOrSchemaField(name string) bool { - switch name { - case "Catalog", "CatalogName", "Schema", "SchemaName", "Target": - return true - default: - return false - } + return strings.Contains(name, "catalog") || strings.Contains(name, "schema") } -func cleanedValue(value string) string { +func removePlaceholders(value string) string { value = strings.ReplaceAll(value, ".", "") value = strings.ReplaceAll(value, ".", "") value = strings.ReplaceAll(value, "", "") @@ -821,9 +741,8 @@ func cleanedValue(value string) string { return value } -// replaceCatalogSchemaPlaceholders replaces placeholders with the final expected values. -func replaceCatalogSchemaPlaceholders(value string) string { - value = strings.ReplaceAll(value, "", "my_catalog") - value = strings.ReplaceAll(value, "", "my_schema") - return value +func replacePlaceholders(placeholder, catalog, schema string) string { + expected := strings.ReplaceAll(placeholder, "", catalog) + expected = strings.ReplaceAll(expected, "", schema) + return expected }