2024-12-13 14:38:58 +00:00
|
|
|
package bundle_test
|
2024-01-17 14:26:33 +00:00
|
|
|
|
|
|
|
import (
|
|
|
|
"context"
|
|
|
|
"os"
|
|
|
|
"path"
|
|
|
|
"path/filepath"
|
2025-01-07 10:49:23 +00:00
|
|
|
"strconv"
|
2024-01-17 14:26:33 +00:00
|
|
|
"strings"
|
|
|
|
"testing"
|
|
|
|
|
2024-12-17 07:45:58 +00:00
|
|
|
"github.com/databricks/cli/integration/internal/acc"
|
2024-12-12 16:48:51 +00:00
|
|
|
"github.com/databricks/cli/internal/testcli"
|
2024-01-17 14:26:33 +00:00
|
|
|
"github.com/databricks/cli/internal/testutil"
|
2024-12-16 11:34:37 +00:00
|
|
|
"github.com/databricks/cli/libs/env"
|
2024-01-17 14:26:33 +00:00
|
|
|
"github.com/databricks/cli/libs/filer"
|
|
|
|
"github.com/databricks/databricks-sdk-go"
|
|
|
|
"github.com/databricks/databricks-sdk-go/service/compute"
|
|
|
|
"github.com/databricks/databricks-sdk-go/service/jobs"
|
|
|
|
"github.com/google/uuid"
|
|
|
|
"github.com/stretchr/testify/require"
|
|
|
|
)
|
|
|
|
|
2024-12-13 14:47:50 +00:00
|
|
|
func TestGenerateFromExistingJobAndDeploy(t *testing.T) {
|
2024-02-07 11:18:56 +00:00
|
|
|
ctx, wt := acc.WorkspaceTest(t)
|
2024-12-12 21:28:04 +00:00
|
|
|
gt := &generateJobTest{T: wt, w: wt.W}
|
2024-01-17 14:26:33 +00:00
|
|
|
|
|
|
|
uniqueId := uuid.New().String()
|
2024-12-16 12:41:32 +00:00
|
|
|
bundleRoot := initTestTemplate(t, ctx, "with_includes", map[string]any{
|
2024-01-17 14:26:33 +00:00
|
|
|
"unique_id": uniqueId,
|
|
|
|
})
|
|
|
|
|
2024-02-07 11:18:56 +00:00
|
|
|
jobId := gt.createTestJob(ctx)
|
2024-01-17 14:26:33 +00:00
|
|
|
t.Cleanup(func() {
|
2024-02-07 11:18:56 +00:00
|
|
|
gt.destroyJob(ctx, jobId)
|
2024-01-17 14:26:33 +00:00
|
|
|
})
|
|
|
|
|
2024-12-16 11:34:37 +00:00
|
|
|
ctx = env.Set(ctx, "BUNDLE_ROOT", bundleRoot)
|
|
|
|
c := testcli.NewRunner(t, ctx, "bundle", "generate", "job",
|
2025-01-07 10:49:23 +00:00
|
|
|
"--existing-job-id", strconv.FormatInt(jobId, 10),
|
2024-01-17 14:26:33 +00:00
|
|
|
"--config-dir", filepath.Join(bundleRoot, "resources"),
|
|
|
|
"--source-dir", filepath.Join(bundleRoot, "src"))
|
2024-12-16 12:41:32 +00:00
|
|
|
_, _, err := c.Run()
|
2024-01-17 14:26:33 +00:00
|
|
|
require.NoError(t, err)
|
|
|
|
|
|
|
|
_, err = os.Stat(filepath.Join(bundleRoot, "src", "test.py"))
|
|
|
|
require.NoError(t, err)
|
|
|
|
|
2024-01-31 10:23:35 +00:00
|
|
|
matches, err := filepath.Glob(filepath.Join(bundleRoot, "resources", "generated_job_*.yml"))
|
2024-01-17 14:26:33 +00:00
|
|
|
require.NoError(t, err)
|
|
|
|
require.Len(t, matches, 1)
|
|
|
|
|
|
|
|
// check the content of generated yaml
|
|
|
|
data, err := os.ReadFile(matches[0])
|
|
|
|
require.NoError(t, err)
|
|
|
|
generatedYaml := string(data)
|
|
|
|
require.Contains(t, generatedYaml, "notebook_task:")
|
2025-01-07 10:49:23 +00:00
|
|
|
require.Contains(t, generatedYaml, "notebook_path: "+filepath.Join("..", "src", "test.py"))
|
2024-01-17 14:26:33 +00:00
|
|
|
require.Contains(t, generatedYaml, "task_key: test")
|
|
|
|
require.Contains(t, generatedYaml, "new_cluster:")
|
|
|
|
require.Contains(t, generatedYaml, "spark_version: 13.3.x-scala2.12")
|
|
|
|
require.Contains(t, generatedYaml, "num_workers: 1")
|
|
|
|
|
2024-12-16 12:41:32 +00:00
|
|
|
deployBundle(t, ctx, bundleRoot)
|
2024-01-17 14:26:33 +00:00
|
|
|
|
2024-12-16 12:41:32 +00:00
|
|
|
destroyBundle(t, ctx, bundleRoot)
|
2024-02-07 11:18:56 +00:00
|
|
|
}
|
2024-01-17 14:26:33 +00:00
|
|
|
|
2024-02-07 11:18:56 +00:00
|
|
|
type generateJobTest struct {
|
2024-12-12 21:28:04 +00:00
|
|
|
T *acc.WorkspaceT
|
2024-02-07 11:18:56 +00:00
|
|
|
w *databricks.WorkspaceClient
|
2024-01-17 14:26:33 +00:00
|
|
|
}
|
|
|
|
|
2024-02-07 11:18:56 +00:00
|
|
|
func (gt *generateJobTest) createTestJob(ctx context.Context) int64 {
|
|
|
|
t := gt.T
|
|
|
|
w := gt.w
|
|
|
|
|
2024-12-12 21:28:04 +00:00
|
|
|
tmpdir := acc.TemporaryWorkspaceDir(t, "generate-job-")
|
2024-01-17 14:26:33 +00:00
|
|
|
f, err := filer.NewWorkspaceFilesClient(w, tmpdir)
|
|
|
|
require.NoError(t, err)
|
|
|
|
|
|
|
|
err = f.Write(ctx, "test.py", strings.NewReader("# Databricks notebook source\nprint('Hello world!'))"))
|
|
|
|
require.NoError(t, err)
|
|
|
|
|
|
|
|
resp, err := w.Jobs.Create(ctx, jobs.CreateJob{
|
2024-12-12 12:35:38 +00:00
|
|
|
Name: testutil.RandomName("generated-job-"),
|
2024-01-17 14:26:33 +00:00
|
|
|
Tasks: []jobs.Task{
|
|
|
|
{
|
|
|
|
TaskKey: "test",
|
|
|
|
NewCluster: &compute.ClusterSpec{
|
|
|
|
SparkVersion: "13.3.x-scala2.12",
|
|
|
|
NumWorkers: 1,
|
2024-12-12 21:28:04 +00:00
|
|
|
NodeTypeId: testutil.GetCloud(t).NodeTypeID(),
|
2024-02-15 15:03:19 +00:00
|
|
|
SparkConf: map[string]string{
|
|
|
|
"spark.databricks.enableWsfs": "true",
|
|
|
|
"spark.databricks.hive.metastore.glueCatalog.enabled": "true",
|
|
|
|
"spark.databricks.pip.ignoreSSL": "true",
|
|
|
|
},
|
2024-01-17 14:26:33 +00:00
|
|
|
},
|
|
|
|
NotebookTask: &jobs.NotebookTask{
|
|
|
|
NotebookPath: path.Join(tmpdir, "test"),
|
|
|
|
},
|
|
|
|
},
|
|
|
|
},
|
|
|
|
})
|
|
|
|
require.NoError(t, err)
|
|
|
|
|
|
|
|
return resp.JobId
|
|
|
|
}
|
|
|
|
|
2024-02-07 11:18:56 +00:00
|
|
|
func (gt *generateJobTest) destroyJob(ctx context.Context, jobId int64) {
|
|
|
|
err := gt.w.Jobs.Delete(ctx, jobs.DeleteJob{
|
2024-01-17 14:26:33 +00:00
|
|
|
JobId: jobId,
|
|
|
|
})
|
2024-02-07 11:18:56 +00:00
|
|
|
require.NoError(gt.T, err)
|
2024-01-17 14:26:33 +00:00
|
|
|
}
|