2024-01-17 14:26:33 +00:00
|
|
|
package generate
|
|
|
|
|
|
|
|
import (
|
|
|
|
"context"
|
|
|
|
"fmt"
|
|
|
|
"io"
|
|
|
|
"os"
|
|
|
|
"path"
|
|
|
|
"path/filepath"
|
|
|
|
|
|
|
|
"github.com/databricks/cli/libs/cmdio"
|
|
|
|
"github.com/databricks/cli/libs/notebook"
|
|
|
|
"github.com/databricks/databricks-sdk-go"
|
|
|
|
"github.com/databricks/databricks-sdk-go/service/jobs"
|
2024-01-25 11:35:14 +00:00
|
|
|
"github.com/databricks/databricks-sdk-go/service/pipelines"
|
2025-01-13 16:43:48 +00:00
|
|
|
"github.com/databricks/databricks-sdk-go/service/workspace"
|
2024-01-17 14:26:33 +00:00
|
|
|
"golang.org/x/sync/errgroup"
|
|
|
|
)
|
|
|
|
|
2024-01-25 11:35:14 +00:00
|
|
|
type downloader struct {
|
|
|
|
files map[string]string
|
2024-01-17 14:26:33 +00:00
|
|
|
w *databricks.WorkspaceClient
|
|
|
|
sourceDir string
|
|
|
|
configDir string
|
|
|
|
}
|
|
|
|
|
2024-01-25 11:35:14 +00:00
|
|
|
func (n *downloader) MarkTaskForDownload(ctx context.Context, task *jobs.Task) error {
|
2024-01-17 14:26:33 +00:00
|
|
|
if task.NotebookTask == nil {
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2024-01-25 11:35:14 +00:00
|
|
|
return n.markNotebookForDownload(ctx, &task.NotebookTask.NotebookPath)
|
|
|
|
}
|
|
|
|
|
|
|
|
func (n *downloader) MarkPipelineLibraryForDownload(ctx context.Context, lib *pipelines.PipelineLibrary) error {
|
|
|
|
if lib.Notebook != nil {
|
|
|
|
return n.markNotebookForDownload(ctx, &lib.Notebook.Path)
|
|
|
|
}
|
|
|
|
|
|
|
|
if lib.File != nil {
|
|
|
|
return n.markFileForDownload(ctx, &lib.File.Path)
|
|
|
|
}
|
|
|
|
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func (n *downloader) markFileForDownload(ctx context.Context, filePath *string) error {
|
|
|
|
_, err := n.w.Workspace.GetStatusByPath(ctx, *filePath)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
filename := path.Base(*filePath)
|
|
|
|
targetPath := filepath.Join(n.sourceDir, filename)
|
|
|
|
|
|
|
|
n.files[targetPath] = *filePath
|
|
|
|
|
|
|
|
rel, err := filepath.Rel(n.configDir, targetPath)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
*filePath = rel
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2025-01-13 16:43:48 +00:00
|
|
|
func (n *downloader) markDirectoryForDownload(ctx context.Context, dirPath *string) error {
|
|
|
|
_, err := n.w.Workspace.GetStatusByPath(ctx, *dirPath)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
objects, err := n.w.Workspace.RecursiveList(ctx, *dirPath)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
for _, obj := range objects {
|
|
|
|
if obj.ObjectType == workspace.ObjectTypeDirectory {
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
|
|
|
|
err := n.markFileForDownload(ctx, &obj.Path)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
rel, err := filepath.Rel(n.configDir, n.sourceDir)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
*dirPath = rel
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2024-01-25 11:35:14 +00:00
|
|
|
func (n *downloader) markNotebookForDownload(ctx context.Context, notebookPath *string) error {
|
|
|
|
info, err := n.w.Workspace.GetStatusByPath(ctx, *notebookPath)
|
2024-01-17 14:26:33 +00:00
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
ext := notebook.GetExtensionByLanguage(info)
|
|
|
|
|
2024-01-25 11:35:14 +00:00
|
|
|
filename := path.Base(*notebookPath) + ext
|
2024-01-17 14:26:33 +00:00
|
|
|
targetPath := filepath.Join(n.sourceDir, filename)
|
|
|
|
|
2024-01-25 11:35:14 +00:00
|
|
|
n.files[targetPath] = *notebookPath
|
2024-01-17 14:26:33 +00:00
|
|
|
|
|
|
|
// Update the notebook path to be relative to the config dir
|
|
|
|
rel, err := filepath.Rel(n.configDir, targetPath)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
2024-01-25 11:35:14 +00:00
|
|
|
*notebookPath = rel
|
2024-01-17 14:26:33 +00:00
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2024-01-25 11:35:14 +00:00
|
|
|
func (n *downloader) FlushToDisk(ctx context.Context, force bool) error {
|
2024-01-17 14:26:33 +00:00
|
|
|
err := os.MkdirAll(n.sourceDir, 0o755)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
// First check that all files can be written
|
2024-01-25 11:35:14 +00:00
|
|
|
for targetPath := range n.files {
|
2024-01-17 14:26:33 +00:00
|
|
|
info, err := os.Stat(targetPath)
|
|
|
|
if err == nil {
|
|
|
|
if info.IsDir() {
|
|
|
|
return fmt.Errorf("%s is a directory", targetPath)
|
|
|
|
}
|
|
|
|
if !force {
|
|
|
|
return fmt.Errorf("%s already exists. Use --force to overwrite", targetPath)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
errs, errCtx := errgroup.WithContext(ctx)
|
2024-01-25 11:35:14 +00:00
|
|
|
for k, v := range n.files {
|
2024-01-17 14:26:33 +00:00
|
|
|
targetPath := k
|
2024-01-25 11:35:14 +00:00
|
|
|
filePath := v
|
2024-01-17 14:26:33 +00:00
|
|
|
errs.Go(func() error {
|
2024-01-25 11:35:14 +00:00
|
|
|
reader, err := n.w.Workspace.Download(errCtx, filePath)
|
2024-01-17 14:26:33 +00:00
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
file, err := os.Create(targetPath)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
defer file.Close()
|
|
|
|
|
|
|
|
_, err = io.Copy(file, reader)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
2025-01-07 10:49:23 +00:00
|
|
|
cmdio.LogString(errCtx, "File successfully saved to "+targetPath)
|
2024-01-17 14:26:33 +00:00
|
|
|
return reader.Close()
|
|
|
|
})
|
|
|
|
}
|
|
|
|
|
|
|
|
return errs.Wait()
|
|
|
|
}
|
|
|
|
|
2024-01-25 11:35:14 +00:00
|
|
|
func newDownloader(w *databricks.WorkspaceClient, sourceDir, configDir string) *downloader {
|
|
|
|
return &downloader{
|
|
|
|
files: make(map[string]string),
|
2024-01-17 14:26:33 +00:00
|
|
|
w: w,
|
|
|
|
sourceDir: sourceDir,
|
|
|
|
configDir: configDir,
|
|
|
|
}
|
|
|
|
}
|