2024-12-13 14:38:58 +00:00
|
|
|
package bundle_test
|
2023-10-18 10:20:43 +00:00
|
|
|
|
|
|
|
import (
|
2024-12-02 21:18:07 +00:00
|
|
|
"fmt"
|
2023-10-18 10:20:43 +00:00
|
|
|
"os"
|
|
|
|
"path"
|
|
|
|
"path/filepath"
|
|
|
|
"regexp"
|
|
|
|
"testing"
|
|
|
|
|
|
|
|
"github.com/databricks/cli/bundle"
|
|
|
|
"github.com/databricks/cli/bundle/config"
|
2024-02-05 15:29:45 +00:00
|
|
|
"github.com/databricks/cli/bundle/config/resources"
|
2024-08-14 09:03:44 +00:00
|
|
|
"github.com/databricks/cli/bundle/libraries"
|
2024-12-17 07:45:58 +00:00
|
|
|
"github.com/databricks/cli/integration/internal/acc"
|
2024-12-12 16:48:51 +00:00
|
|
|
"github.com/databricks/cli/internal/testcli"
|
2024-12-12 12:35:38 +00:00
|
|
|
"github.com/databricks/cli/internal/testutil"
|
2024-12-16 11:34:37 +00:00
|
|
|
"github.com/databricks/cli/libs/env"
|
2024-12-02 21:18:07 +00:00
|
|
|
"github.com/databricks/databricks-sdk-go/service/catalog"
|
2023-10-18 10:20:43 +00:00
|
|
|
"github.com/databricks/databricks-sdk-go/service/compute"
|
2024-02-05 15:29:45 +00:00
|
|
|
"github.com/databricks/databricks-sdk-go/service/jobs"
|
2024-12-02 21:18:07 +00:00
|
|
|
"github.com/google/uuid"
|
|
|
|
"github.com/stretchr/testify/assert"
|
2023-10-18 10:20:43 +00:00
|
|
|
"github.com/stretchr/testify/require"
|
|
|
|
)
|
|
|
|
|
|
|
|
func touchEmptyFile(t *testing.T, path string) {
|
|
|
|
err := os.MkdirAll(filepath.Dir(path), 0o700)
|
|
|
|
require.NoError(t, err)
|
|
|
|
f, err := os.Create(path)
|
|
|
|
require.NoError(t, err)
|
|
|
|
f.Close()
|
|
|
|
}
|
|
|
|
|
2024-12-13 14:47:50 +00:00
|
|
|
func TestUploadArtifactFileToCorrectRemotePath(t *testing.T) {
|
2024-02-05 15:29:45 +00:00
|
|
|
ctx, wt := acc.WorkspaceTest(t)
|
2023-10-18 10:20:43 +00:00
|
|
|
dir := t.TempDir()
|
|
|
|
whlPath := filepath.Join(dir, "dist", "test.whl")
|
|
|
|
touchEmptyFile(t, whlPath)
|
|
|
|
|
2024-12-12 21:28:04 +00:00
|
|
|
wsDir := acc.TemporaryWorkspaceDir(wt, "artifact-")
|
2023-10-18 10:20:43 +00:00
|
|
|
|
|
|
|
b := &bundle.Bundle{
|
2024-09-27 10:03:05 +00:00
|
|
|
BundleRootPath: dir,
|
|
|
|
SyncRootPath: dir,
|
2023-10-18 10:20:43 +00:00
|
|
|
Config: config.Root{
|
|
|
|
Bundle: config.Bundle{
|
|
|
|
Target: "whatever",
|
|
|
|
},
|
|
|
|
Workspace: config.Workspace{
|
2023-11-15 13:37:26 +00:00
|
|
|
ArtifactPath: wsDir,
|
2023-10-18 10:20:43 +00:00
|
|
|
},
|
|
|
|
Artifacts: config.Artifacts{
|
Use dynamic configuration model in bundles (#1098)
## Changes
This is a fundamental change to how we load and process bundle
configuration. We now depend on the configuration being represented as a
`dyn.Value`. This representation is functionally equivalent to Go's
`any` (it is variadic) and allows us to capture metadata associated with
a value, such as where it was defined (e.g. file, line, and column). It
also allows us to represent Go's zero values properly (e.g. empty
string, integer equal to 0, or boolean false).
Using this representation allows us to let the configuration model
deviate from the typed structure we have been relying on so far
(`config.Root`). We need to deviate from these types when using
variables for fields that are not a string themselves. For example,
using `${var.num_workers}` for an integer `workers` field was impossible
until now (though not implemented in this change).
The loader for a `dyn.Value` includes functionality to capture any and
all type mismatches between the user-defined configuration and the
expected types. These mismatches can be surfaced as validation errors in
future PRs.
Given that many mutators expect the typed struct to be the source of
truth, this change converts between the dynamic representation and the
typed representation on mutator entry and exit. Existing mutators can
continue to modify the typed representation and these modifications are
reflected in the dynamic representation (see `MarkMutatorEntry` and
`MarkMutatorExit` in `bundle/config/root.go`).
Required changes included in this change:
* The existing interpolation package is removed in favor of
`libs/dyn/dynvar`.
* Functionality to merge job clusters, job tasks, and pipeline clusters
are now all broken out into their own mutators.
To be implemented later:
* Allow variable references for non-string types.
* Surface diagnostics about the configuration provided by the user in
the validation output.
* Some mutators use a resource's configuration file path to resolve
related relative paths. These depend on `bundle/config/paths.Path` being
set and populated through `ConfigureConfigFilePath`. Instead, they
should interact with the dynamically typed configuration directly. Doing
this also unlocks being able to differentiate different base paths used
within a job (e.g. a task override with a relative path defined in a
directory other than the base job).
## Tests
* Existing unit tests pass (some have been modified to accommodate)
* Integration tests pass
2024-02-16 19:41:58 +00:00
|
|
|
"test": &config.Artifact{
|
|
|
|
Type: "whl",
|
|
|
|
Files: []config.ArtifactFile{
|
|
|
|
{
|
|
|
|
Source: whlPath,
|
|
|
|
},
|
|
|
|
},
|
|
|
|
},
|
2023-10-18 10:20:43 +00:00
|
|
|
},
|
2024-02-05 15:29:45 +00:00
|
|
|
Resources: config.Resources{
|
|
|
|
Jobs: map[string]*resources.Job{
|
|
|
|
"test": {
|
|
|
|
JobSettings: &jobs.JobSettings{
|
|
|
|
Tasks: []jobs.Task{
|
|
|
|
{
|
|
|
|
Libraries: []compute.Library{
|
|
|
|
{
|
|
|
|
Whl: "dist/test.whl",
|
|
|
|
},
|
|
|
|
},
|
|
|
|
},
|
|
|
|
},
|
|
|
|
},
|
|
|
|
},
|
|
|
|
},
|
|
|
|
},
|
2023-10-18 10:20:43 +00:00
|
|
|
},
|
|
|
|
}
|
|
|
|
|
2024-08-14 09:03:44 +00:00
|
|
|
diags := bundle.Apply(ctx, b, bundle.Seq(libraries.ExpandGlobReferences(), libraries.Upload()))
|
2024-03-25 14:18:47 +00:00
|
|
|
require.NoError(t, diags.Error())
|
2024-02-05 15:29:45 +00:00
|
|
|
|
|
|
|
// The remote path attribute on the artifact file should have been set.
|
Use dynamic configuration model in bundles (#1098)
## Changes
This is a fundamental change to how we load and process bundle
configuration. We now depend on the configuration being represented as a
`dyn.Value`. This representation is functionally equivalent to Go's
`any` (it is variadic) and allows us to capture metadata associated with
a value, such as where it was defined (e.g. file, line, and column). It
also allows us to represent Go's zero values properly (e.g. empty
string, integer equal to 0, or boolean false).
Using this representation allows us to let the configuration model
deviate from the typed structure we have been relying on so far
(`config.Root`). We need to deviate from these types when using
variables for fields that are not a string themselves. For example,
using `${var.num_workers}` for an integer `workers` field was impossible
until now (though not implemented in this change).
The loader for a `dyn.Value` includes functionality to capture any and
all type mismatches between the user-defined configuration and the
expected types. These mismatches can be surfaced as validation errors in
future PRs.
Given that many mutators expect the typed struct to be the source of
truth, this change converts between the dynamic representation and the
typed representation on mutator entry and exit. Existing mutators can
continue to modify the typed representation and these modifications are
reflected in the dynamic representation (see `MarkMutatorEntry` and
`MarkMutatorExit` in `bundle/config/root.go`).
Required changes included in this change:
* The existing interpolation package is removed in favor of
`libs/dyn/dynvar`.
* Functionality to merge job clusters, job tasks, and pipeline clusters
are now all broken out into their own mutators.
To be implemented later:
* Allow variable references for non-string types.
* Surface diagnostics about the configuration provided by the user in
the validation output.
* Some mutators use a resource's configuration file path to resolve
related relative paths. These depend on `bundle/config/paths.Path` being
set and populated through `ConfigureConfigFilePath`. Instead, they
should interact with the dynamically typed configuration directly. Doing
this also unlocks being able to differentiate different base paths used
within a job (e.g. a task override with a relative path defined in a
directory other than the base job).
## Tests
* Existing unit tests pass (some have been modified to accommodate)
* Integration tests pass
2024-02-16 19:41:58 +00:00
|
|
|
require.Regexp(t,
|
|
|
|
regexp.MustCompile(path.Join(regexp.QuoteMeta(wsDir), `.internal/test\.whl`)),
|
|
|
|
b.Config.Artifacts["test"].Files[0].RemotePath,
|
|
|
|
)
|
2024-02-05 15:29:45 +00:00
|
|
|
|
|
|
|
// The task library path should have been updated to the remote path.
|
Use dynamic configuration model in bundles (#1098)
## Changes
This is a fundamental change to how we load and process bundle
configuration. We now depend on the configuration being represented as a
`dyn.Value`. This representation is functionally equivalent to Go's
`any` (it is variadic) and allows us to capture metadata associated with
a value, such as where it was defined (e.g. file, line, and column). It
also allows us to represent Go's zero values properly (e.g. empty
string, integer equal to 0, or boolean false).
Using this representation allows us to let the configuration model
deviate from the typed structure we have been relying on so far
(`config.Root`). We need to deviate from these types when using
variables for fields that are not a string themselves. For example,
using `${var.num_workers}` for an integer `workers` field was impossible
until now (though not implemented in this change).
The loader for a `dyn.Value` includes functionality to capture any and
all type mismatches between the user-defined configuration and the
expected types. These mismatches can be surfaced as validation errors in
future PRs.
Given that many mutators expect the typed struct to be the source of
truth, this change converts between the dynamic representation and the
typed representation on mutator entry and exit. Existing mutators can
continue to modify the typed representation and these modifications are
reflected in the dynamic representation (see `MarkMutatorEntry` and
`MarkMutatorExit` in `bundle/config/root.go`).
Required changes included in this change:
* The existing interpolation package is removed in favor of
`libs/dyn/dynvar`.
* Functionality to merge job clusters, job tasks, and pipeline clusters
are now all broken out into their own mutators.
To be implemented later:
* Allow variable references for non-string types.
* Surface diagnostics about the configuration provided by the user in
the validation output.
* Some mutators use a resource's configuration file path to resolve
related relative paths. These depend on `bundle/config/paths.Path` being
set and populated through `ConfigureConfigFilePath`. Instead, they
should interact with the dynamically typed configuration directly. Doing
this also unlocks being able to differentiate different base paths used
within a job (e.g. a task override with a relative path defined in a
directory other than the base job).
## Tests
* Existing unit tests pass (some have been modified to accommodate)
* Integration tests pass
2024-02-16 19:41:58 +00:00
|
|
|
require.Regexp(t,
|
|
|
|
regexp.MustCompile(path.Join("/Workspace", regexp.QuoteMeta(wsDir), `.internal/test\.whl`)),
|
|
|
|
b.Config.Resources.Jobs["test"].JobSettings.Tasks[0].Libraries[0].Whl,
|
|
|
|
)
|
2023-10-18 10:20:43 +00:00
|
|
|
}
|
2024-04-22 11:44:34 +00:00
|
|
|
|
2024-12-13 14:47:50 +00:00
|
|
|
func TestUploadArtifactFileToCorrectRemotePathWithEnvironments(t *testing.T) {
|
2024-04-22 11:44:34 +00:00
|
|
|
ctx, wt := acc.WorkspaceTest(t)
|
|
|
|
dir := t.TempDir()
|
|
|
|
whlPath := filepath.Join(dir, "dist", "test.whl")
|
|
|
|
touchEmptyFile(t, whlPath)
|
|
|
|
|
2024-12-12 21:28:04 +00:00
|
|
|
wsDir := acc.TemporaryWorkspaceDir(wt, "artifact-")
|
2024-04-22 11:44:34 +00:00
|
|
|
|
|
|
|
b := &bundle.Bundle{
|
2024-09-27 10:03:05 +00:00
|
|
|
BundleRootPath: dir,
|
|
|
|
SyncRootPath: dir,
|
2024-04-22 11:44:34 +00:00
|
|
|
Config: config.Root{
|
|
|
|
Bundle: config.Bundle{
|
|
|
|
Target: "whatever",
|
|
|
|
},
|
|
|
|
Workspace: config.Workspace{
|
|
|
|
ArtifactPath: wsDir,
|
|
|
|
},
|
|
|
|
Artifacts: config.Artifacts{
|
|
|
|
"test": &config.Artifact{
|
|
|
|
Type: "whl",
|
|
|
|
Files: []config.ArtifactFile{
|
|
|
|
{
|
|
|
|
Source: whlPath,
|
|
|
|
},
|
|
|
|
},
|
|
|
|
},
|
|
|
|
},
|
|
|
|
Resources: config.Resources{
|
|
|
|
Jobs: map[string]*resources.Job{
|
|
|
|
"test": {
|
|
|
|
JobSettings: &jobs.JobSettings{
|
|
|
|
Environments: []jobs.JobEnvironment{
|
|
|
|
{
|
|
|
|
Spec: &compute.Environment{
|
|
|
|
Dependencies: []string{
|
|
|
|
"dist/test.whl",
|
|
|
|
},
|
|
|
|
},
|
|
|
|
},
|
|
|
|
},
|
|
|
|
},
|
|
|
|
},
|
|
|
|
},
|
|
|
|
},
|
|
|
|
},
|
|
|
|
}
|
|
|
|
|
2024-08-14 09:03:44 +00:00
|
|
|
diags := bundle.Apply(ctx, b, bundle.Seq(libraries.ExpandGlobReferences(), libraries.Upload()))
|
2024-04-22 11:44:34 +00:00
|
|
|
require.NoError(t, diags.Error())
|
|
|
|
|
|
|
|
// The remote path attribute on the artifact file should have been set.
|
|
|
|
require.Regexp(t,
|
|
|
|
regexp.MustCompile(path.Join(regexp.QuoteMeta(wsDir), `.internal/test\.whl`)),
|
|
|
|
b.Config.Artifacts["test"].Files[0].RemotePath,
|
|
|
|
)
|
|
|
|
|
|
|
|
// The job environment deps path should have been updated to the remote path.
|
|
|
|
require.Regexp(t,
|
|
|
|
regexp.MustCompile(path.Join("/Workspace", regexp.QuoteMeta(wsDir), `.internal/test\.whl`)),
|
|
|
|
b.Config.Resources.Jobs["test"].JobSettings.Environments[0].Spec.Dependencies[0],
|
|
|
|
)
|
|
|
|
}
|
2024-07-16 08:57:04 +00:00
|
|
|
|
2024-12-13 14:47:50 +00:00
|
|
|
func TestUploadArtifactFileToCorrectRemotePathForVolumes(t *testing.T) {
|
2024-07-16 08:57:04 +00:00
|
|
|
ctx, wt := acc.WorkspaceTest(t)
|
|
|
|
|
|
|
|
if os.Getenv("TEST_METASTORE_ID") == "" {
|
|
|
|
t.Skip("Skipping tests that require a UC Volume when metastore id is not set.")
|
|
|
|
}
|
|
|
|
|
2024-12-12 21:28:04 +00:00
|
|
|
volumePath := acc.TemporaryVolume(wt)
|
2024-07-16 08:57:04 +00:00
|
|
|
|
|
|
|
dir := t.TempDir()
|
|
|
|
whlPath := filepath.Join(dir, "dist", "test.whl")
|
|
|
|
touchEmptyFile(t, whlPath)
|
|
|
|
|
|
|
|
b := &bundle.Bundle{
|
2024-09-27 10:03:05 +00:00
|
|
|
BundleRootPath: dir,
|
|
|
|
SyncRootPath: dir,
|
2024-07-16 08:57:04 +00:00
|
|
|
Config: config.Root{
|
|
|
|
Bundle: config.Bundle{
|
|
|
|
Target: "whatever",
|
|
|
|
},
|
|
|
|
Workspace: config.Workspace{
|
|
|
|
ArtifactPath: volumePath,
|
|
|
|
},
|
|
|
|
Artifacts: config.Artifacts{
|
|
|
|
"test": &config.Artifact{
|
|
|
|
Type: "whl",
|
|
|
|
Files: []config.ArtifactFile{
|
|
|
|
{
|
|
|
|
Source: whlPath,
|
|
|
|
},
|
|
|
|
},
|
|
|
|
},
|
|
|
|
},
|
|
|
|
Resources: config.Resources{
|
|
|
|
Jobs: map[string]*resources.Job{
|
|
|
|
"test": {
|
|
|
|
JobSettings: &jobs.JobSettings{
|
|
|
|
Tasks: []jobs.Task{
|
|
|
|
{
|
|
|
|
Libraries: []compute.Library{
|
|
|
|
{
|
|
|
|
Whl: "dist/test.whl",
|
|
|
|
},
|
|
|
|
},
|
|
|
|
},
|
|
|
|
},
|
|
|
|
},
|
|
|
|
},
|
|
|
|
},
|
|
|
|
},
|
|
|
|
},
|
|
|
|
}
|
|
|
|
|
2024-08-14 09:03:44 +00:00
|
|
|
diags := bundle.Apply(ctx, b, bundle.Seq(libraries.ExpandGlobReferences(), libraries.Upload()))
|
2024-07-16 08:57:04 +00:00
|
|
|
require.NoError(t, diags.Error())
|
|
|
|
|
|
|
|
// The remote path attribute on the artifact file should have been set.
|
|
|
|
require.Regexp(t,
|
|
|
|
regexp.MustCompile(path.Join(regexp.QuoteMeta(volumePath), `.internal/test\.whl`)),
|
|
|
|
b.Config.Artifacts["test"].Files[0].RemotePath,
|
|
|
|
)
|
|
|
|
|
|
|
|
// The task library path should have been updated to the remote path.
|
|
|
|
require.Regexp(t,
|
|
|
|
regexp.MustCompile(path.Join(regexp.QuoteMeta(volumePath), `.internal/test\.whl`)),
|
|
|
|
b.Config.Resources.Jobs["test"].JobSettings.Tasks[0].Libraries[0].Whl,
|
|
|
|
)
|
|
|
|
}
|
2024-12-02 21:18:07 +00:00
|
|
|
|
2024-12-13 14:47:50 +00:00
|
|
|
func TestUploadArtifactFileToVolumeThatDoesNotExist(t *testing.T) {
|
2024-12-02 21:18:07 +00:00
|
|
|
ctx, wt := acc.UcWorkspaceTest(t)
|
|
|
|
w := wt.W
|
|
|
|
|
2024-12-12 12:35:38 +00:00
|
|
|
schemaName := testutil.RandomName("schema-")
|
2024-12-02 21:18:07 +00:00
|
|
|
|
|
|
|
_, err := w.Schemas.Create(ctx, catalog.CreateSchema{
|
|
|
|
CatalogName: "main",
|
|
|
|
Comment: "test schema",
|
|
|
|
Name: schemaName,
|
|
|
|
})
|
|
|
|
require.NoError(t, err)
|
|
|
|
|
|
|
|
t.Cleanup(func() {
|
|
|
|
err = w.Schemas.DeleteByFullName(ctx, "main."+schemaName)
|
|
|
|
require.NoError(t, err)
|
|
|
|
})
|
|
|
|
|
2024-12-16 12:41:32 +00:00
|
|
|
bundleRoot := initTestTemplate(t, ctx, "artifact_path_with_volume", map[string]any{
|
2024-12-02 21:18:07 +00:00
|
|
|
"unique_id": uuid.New().String(),
|
|
|
|
"schema_name": schemaName,
|
|
|
|
"volume_name": "doesnotexist",
|
|
|
|
})
|
|
|
|
|
2024-12-16 11:34:37 +00:00
|
|
|
ctx = env.Set(ctx, "BUNDLE_ROOT", bundleRoot)
|
|
|
|
stdout, stderr, err := testcli.RequireErrorRun(t, ctx, "bundle", "deploy")
|
2024-12-02 21:18:07 +00:00
|
|
|
|
|
|
|
assert.Error(t, err)
|
|
|
|
assert.Equal(t, fmt.Sprintf(`Error: volume /Volumes/main/%s/doesnotexist does not exist: Not Found
|
|
|
|
at workspace.artifact_path
|
|
|
|
in databricks.yml:6:18
|
|
|
|
|
|
|
|
`, schemaName), stdout.String())
|
|
|
|
assert.Equal(t, "", stderr.String())
|
|
|
|
}
|
|
|
|
|
2024-12-13 14:47:50 +00:00
|
|
|
func TestUploadArtifactToVolumeNotYetDeployed(t *testing.T) {
|
2024-12-02 21:18:07 +00:00
|
|
|
ctx, wt := acc.UcWorkspaceTest(t)
|
|
|
|
w := wt.W
|
|
|
|
|
2024-12-12 12:35:38 +00:00
|
|
|
schemaName := testutil.RandomName("schema-")
|
2024-12-02 21:18:07 +00:00
|
|
|
|
|
|
|
_, err := w.Schemas.Create(ctx, catalog.CreateSchema{
|
|
|
|
CatalogName: "main",
|
|
|
|
Comment: "test schema",
|
|
|
|
Name: schemaName,
|
|
|
|
})
|
|
|
|
require.NoError(t, err)
|
|
|
|
|
|
|
|
t.Cleanup(func() {
|
|
|
|
err = w.Schemas.DeleteByFullName(ctx, "main."+schemaName)
|
|
|
|
require.NoError(t, err)
|
|
|
|
})
|
|
|
|
|
2024-12-16 12:41:32 +00:00
|
|
|
bundleRoot := initTestTemplate(t, ctx, "artifact_path_with_volume", map[string]any{
|
2024-12-02 21:18:07 +00:00
|
|
|
"unique_id": uuid.New().String(),
|
|
|
|
"schema_name": schemaName,
|
|
|
|
"volume_name": "my_volume",
|
|
|
|
})
|
|
|
|
|
2024-12-16 11:34:37 +00:00
|
|
|
ctx = env.Set(ctx, "BUNDLE_ROOT", bundleRoot)
|
|
|
|
stdout, stderr, err := testcli.RequireErrorRun(t, ctx, "bundle", "deploy")
|
2024-12-02 21:18:07 +00:00
|
|
|
|
|
|
|
assert.Error(t, err)
|
|
|
|
assert.Equal(t, fmt.Sprintf(`Error: volume /Volumes/main/%s/my_volume does not exist: Not Found
|
|
|
|
at workspace.artifact_path
|
|
|
|
resources.volumes.foo
|
|
|
|
in databricks.yml:6:18
|
|
|
|
databricks.yml:11:7
|
|
|
|
|
|
|
|
You are using a volume in your artifact_path that is managed by
|
|
|
|
this bundle but which has not been deployed yet. Please first deploy
|
|
|
|
the volume using 'bundle deploy' and then switch over to using it in
|
|
|
|
the artifact_path.
|
|
|
|
|
|
|
|
`, schemaName), stdout.String())
|
|
|
|
assert.Equal(t, "", stderr.String())
|
|
|
|
}
|