2022-05-13 13:30:22 +00:00
|
|
|
package project
|
|
|
|
|
|
|
|
import (
|
|
|
|
"context"
|
|
|
|
"fmt"
|
2022-10-19 14:22:55 +00:00
|
|
|
"os"
|
|
|
|
"path/filepath"
|
2022-05-14 17:55:00 +00:00
|
|
|
"sync"
|
2022-05-13 13:30:22 +00:00
|
|
|
|
2022-10-19 14:22:55 +00:00
|
|
|
"github.com/databricks/bricks/git"
|
2022-11-24 20:41:57 +00:00
|
|
|
"github.com/databricks/databricks-sdk-go"
|
2022-09-07 09:55:59 +00:00
|
|
|
"github.com/databricks/databricks-sdk-go/service/commands"
|
2022-09-08 13:50:00 +00:00
|
|
|
"github.com/databricks/databricks-sdk-go/service/scim"
|
2022-09-16 09:06:58 +00:00
|
|
|
"github.com/spf13/cobra"
|
2022-05-13 13:30:22 +00:00
|
|
|
)
|
|
|
|
|
2022-10-19 14:22:55 +00:00
|
|
|
// CacheDirName is the name of the per-project cache directory. CacheDir
// joins it onto the project root and requires it to be git-ignored.
const CacheDirName = ".databricks"
|
|
|
|
|
2022-09-16 09:06:58 +00:00
|
|
|
type project struct {
|
|
|
|
mu sync.Mutex
|
2022-05-14 17:55:00 +00:00
|
|
|
|
2022-09-16 13:18:46 +00:00
|
|
|
root string
|
2022-09-22 11:40:11 +00:00
|
|
|
env string
|
2022-09-16 13:18:46 +00:00
|
|
|
|
2022-09-22 11:40:11 +00:00
|
|
|
config *Config
|
|
|
|
environment *Environment
|
2022-11-24 20:41:57 +00:00
|
|
|
wsc *databricks.WorkspaceClient
|
2022-09-22 11:40:11 +00:00
|
|
|
me *scim.User
|
2022-10-19 14:22:55 +00:00
|
|
|
fileSet *git.FileSet
|
2022-09-16 09:06:58 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// Configure is used as a PreRunE function for all commands that
|
|
|
|
// require a project to be configured. If a project could successfully
|
|
|
|
// be found and loaded, it is set on the command's context object.
|
|
|
|
func Configure(cmd *cobra.Command, args []string) error {
|
|
|
|
root, err := getRoot()
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
2022-05-14 17:55:00 +00:00
|
|
|
|
2022-09-22 11:40:11 +00:00
|
|
|
ctx, err := Initialize(cmd.Context(), root, getEnvironment(cmd))
|
2022-09-16 09:06:58 +00:00
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
cmd.SetContext(ctx)
|
|
|
|
return nil
|
2022-05-14 17:55:00 +00:00
|
|
|
}
|
|
|
|
|
2022-09-16 09:06:58 +00:00
|
|
|
// Placeholder to use as unique key in context.Context.
|
|
|
|
// Only the address of projectKey is used (as the context key in Initialize
// and Get); its value is never read.
var projectKey int
|
|
|
|
|
2022-09-22 11:40:11 +00:00
|
|
|
// Initialize loads a project configuration given a root and environment.
|
2022-09-16 09:06:58 +00:00
|
|
|
// It stores the project on a new context.
|
|
|
|
// The project is available through the `Get()` function.
|
2022-09-22 11:40:11 +00:00
|
|
|
func Initialize(ctx context.Context, root, env string) (context.Context, error) {
|
2022-09-16 09:06:58 +00:00
|
|
|
config, err := loadProjectConf(root)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
2022-09-22 11:40:11 +00:00
|
|
|
// Confirm that the specified environment is valid.
|
|
|
|
environment, ok := config.Environments[env]
|
|
|
|
if !ok {
|
|
|
|
return nil, fmt.Errorf("environment [%s] not defined", env)
|
2022-09-16 09:06:58 +00:00
|
|
|
}
|
|
|
|
|
2022-11-03 20:09:29 +00:00
|
|
|
fileSet := git.NewFileSet(root)
|
2022-11-08 12:51:08 +00:00
|
|
|
err = fileSet.EnsureValidGitIgnoreExists()
|
|
|
|
if err != nil {
|
|
|
|
return ctx, nil
|
|
|
|
}
|
2022-10-19 14:22:55 +00:00
|
|
|
|
2022-09-22 11:40:11 +00:00
|
|
|
p := project{
|
|
|
|
root: root,
|
|
|
|
env: env,
|
|
|
|
|
|
|
|
config: &config,
|
|
|
|
environment: &environment,
|
2022-11-08 12:51:08 +00:00
|
|
|
fileSet: fileSet,
|
2022-09-21 11:55:37 +00:00
|
|
|
}
|
|
|
|
|
2022-09-22 11:40:11 +00:00
|
|
|
p.initializeWorkspacesClient(ctx)
|
2022-09-16 09:06:58 +00:00
|
|
|
return context.WithValue(ctx, &projectKey, &p), nil
|
2022-05-14 17:55:00 +00:00
|
|
|
}
|
|
|
|
|
2022-09-22 11:40:11 +00:00
|
|
|
func (p *project) initializeWorkspacesClient(ctx context.Context) {
|
|
|
|
var config databricks.Config
|
|
|
|
|
|
|
|
// If the config specifies a profile, or other authentication related properties,
|
|
|
|
// pass them along to the SDK here. If nothing is defined, the SDK will figure
|
|
|
|
// out which autentication mechanism to use using enviroment variables.
|
|
|
|
if p.environment.Workspace.Profile != "" {
|
|
|
|
config.Profile = p.environment.Workspace.Profile
|
|
|
|
}
|
|
|
|
|
2022-11-24 20:41:57 +00:00
|
|
|
p.wsc = databricks.Must(databricks.NewWorkspaceClient(&config))
|
2022-09-22 11:40:11 +00:00
|
|
|
}
|
|
|
|
|
2022-09-16 09:06:58 +00:00
|
|
|
// Get returns the project as configured on the context.
|
|
|
|
// It panics if it isn't configured.
|
|
|
|
func Get(ctx context.Context) *project {
|
|
|
|
project, ok := ctx.Value(&projectKey).(*project)
|
|
|
|
if !ok {
|
|
|
|
panic(`context not configured with project`)
|
|
|
|
}
|
|
|
|
return project
|
2022-05-13 13:30:22 +00:00
|
|
|
}
|
|
|
|
|
2022-09-07 09:55:59 +00:00
|
|
|
// Make sure to initialize the workspaces client on project init
|
2022-11-24 20:41:57 +00:00
|
|
|
func (p *project) WorkspacesClient() *databricks.WorkspaceClient {
|
2022-09-16 09:06:58 +00:00
|
|
|
return p.wsc
|
2022-09-07 09:55:59 +00:00
|
|
|
}
|
|
|
|
|
2022-09-16 13:18:46 +00:00
|
|
|
func (p *project) Root() string {
|
|
|
|
return p.root
|
|
|
|
}
|
|
|
|
|
2022-10-19 14:22:55 +00:00
|
|
|
func (p *project) GetFileSet() *git.FileSet {
|
|
|
|
return p.fileSet
|
|
|
|
}
|
|
|
|
|
|
|
|
// This cache dir will contain any state, state overrides (per user overrides
|
|
|
|
// to the project config) or any generated artifacts (eg: sync snapshots)
|
|
|
|
// that should never be checked into Git.
|
|
|
|
//
|
|
|
|
// We enfore that cache dir (.databricks) is added to .gitignore
|
|
|
|
// because it contains per-user overrides that we do not want users to
|
|
|
|
// accidentally check into git
|
|
|
|
func (p *project) CacheDir() (string, error) {
|
|
|
|
// assert cache dir is present in git ignore
|
|
|
|
if !p.fileSet.IsGitIgnored(fmt.Sprintf("/%s/", CacheDirName)) {
|
|
|
|
return "", fmt.Errorf("please add /%s/ to .gitignore", CacheDirName)
|
|
|
|
}
|
|
|
|
|
|
|
|
cacheDirPath := filepath.Join(p.root, CacheDirName)
|
|
|
|
// create cache dir if it does not exist
|
|
|
|
if _, err := os.Stat(cacheDirPath); os.IsNotExist(err) {
|
|
|
|
err = os.Mkdir(cacheDirPath, os.ModeDir|os.ModePerm)
|
|
|
|
if err != nil {
|
|
|
|
return "", fmt.Errorf("failed to create cache directory %s with error: %s", cacheDirPath, err)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return cacheDirPath, nil
|
|
|
|
}
|
|
|
|
|
2022-09-22 11:40:11 +00:00
|
|
|
func (p *project) Config() Config {
|
|
|
|
return *p.config
|
|
|
|
}
|
|
|
|
|
|
|
|
func (p *project) Environment() Environment {
|
|
|
|
return *p.environment
|
|
|
|
}
|
|
|
|
|
2022-09-16 09:06:58 +00:00
|
|
|
func (p *project) Me() (*scim.User, error) {
|
|
|
|
p.mu.Lock()
|
|
|
|
defer p.mu.Unlock()
|
|
|
|
if p.me != nil {
|
|
|
|
return p.me, nil
|
2022-05-14 17:55:00 +00:00
|
|
|
}
|
2022-09-16 09:06:58 +00:00
|
|
|
me, err := p.wsc.CurrentUser.Me(context.Background())
|
2022-05-13 13:30:22 +00:00
|
|
|
if err != nil {
|
2022-09-14 15:50:29 +00:00
|
|
|
return nil, err
|
2022-05-14 17:55:00 +00:00
|
|
|
}
|
2022-09-16 09:06:58 +00:00
|
|
|
p.me = me
|
2022-09-14 15:50:29 +00:00
|
|
|
return me, nil
|
2022-05-14 17:55:00 +00:00
|
|
|
}
|
|
|
|
|
2022-09-16 09:06:58 +00:00
|
|
|
func (p *project) DeploymentIsolationPrefix() string {
|
|
|
|
if p.config.Isolation == None {
|
|
|
|
return p.config.Name
|
2022-05-21 13:23:37 +00:00
|
|
|
}
|
2022-09-16 09:06:58 +00:00
|
|
|
if p.config.Isolation == Soft {
|
|
|
|
me, err := p.Me()
|
2022-09-14 15:50:29 +00:00
|
|
|
if err != nil {
|
|
|
|
panic(err)
|
|
|
|
}
|
2022-09-16 09:06:58 +00:00
|
|
|
return fmt.Sprintf("%s/%s", p.config.Name, me.UserName)
|
2022-05-21 13:23:37 +00:00
|
|
|
}
|
2022-09-16 09:06:58 +00:00
|
|
|
panic(fmt.Errorf("unknow project isolation: %s", p.config.Isolation))
|
2022-05-21 13:23:37 +00:00
|
|
|
}
|
|
|
|
|
2022-09-07 09:55:59 +00:00
|
|
|
func getClusterIdFromClusterName(ctx context.Context,
|
2022-11-24 20:41:57 +00:00
|
|
|
wsc *databricks.WorkspaceClient,
|
2022-09-07 09:55:59 +00:00
|
|
|
clusterName string,
|
|
|
|
) (clusterId string, err error) {
|
2022-12-01 11:17:36 +00:00
|
|
|
clusterInfo, err := wsc.Clusters.GetByClusterName(ctx, clusterName)
|
2022-09-07 09:55:59 +00:00
|
|
|
if err != nil {
|
2022-11-24 20:41:57 +00:00
|
|
|
return "", err
|
2022-09-07 09:55:59 +00:00
|
|
|
}
|
2022-11-24 20:41:57 +00:00
|
|
|
return clusterInfo.ClusterId, nil
|
2022-09-07 09:55:59 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// Old version of getting development cluster details with isolation implemented.
|
|
|
|
// Kept just for reference. Remove once isolation is implemented properly
|
|
|
|
/*
|
2022-09-16 09:06:58 +00:00
|
|
|
func (p *project) DevelopmentCluster(ctx context.Context) (cluster clusters.ClusterInfo, err error) {
|
|
|
|
api := clusters.NewClustersAPI(ctx, p.Client()) // TODO: rewrite with normal SDK
|
|
|
|
if p.project.DevCluster == nil {
|
|
|
|
p.project.DevCluster = &clusters.Cluster{}
|
|
|
|
}
|
|
|
|
dc := p.project.DevCluster
|
|
|
|
if p.project.Isolation == Soft {
|
|
|
|
if p.project.IsDevClusterJustReference() {
|
2022-05-14 17:55:00 +00:00
|
|
|
err = fmt.Errorf("projects with soft isolation cannot have named clusters")
|
|
|
|
return
|
|
|
|
}
|
2022-09-16 09:06:58 +00:00
|
|
|
dc.ClusterName = fmt.Sprintf("dev/%s", p.DeploymentIsolationPrefix())
|
2022-05-14 17:55:00 +00:00
|
|
|
}
|
|
|
|
if dc.ClusterName == "" {
|
|
|
|
err = fmt.Errorf("please either pick `isolation: soft` or specify a shared cluster name")
|
2022-05-13 13:30:22 +00:00
|
|
|
return
|
|
|
|
}
|
2022-09-16 09:06:58 +00:00
|
|
|
return app.GetOrCreateRunningCluster(dc.ClusterName, *dc)
|
2022-05-13 13:30:22 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
func runCommandOnDev(ctx context.Context, language, command string) common.CommandResults {
|
2022-05-14 17:55:00 +00:00
|
|
|
cluster, err := Current.DevelopmentCluster(ctx)
|
|
|
|
exec := Current.Client().CommandExecutor(ctx)
|
2022-05-13 13:30:22 +00:00
|
|
|
if err != nil {
|
|
|
|
return common.CommandResults{
|
|
|
|
ResultType: "error",
|
2022-05-14 17:55:00 +00:00
|
|
|
Summary: err.Error(),
|
2022-05-13 13:30:22 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
return exec.Execute(cluster.ClusterID, language, command)
|
|
|
|
}
|
|
|
|
|
|
|
|
func RunPythonOnDev(ctx context.Context, command string) common.CommandResults {
|
|
|
|
return runCommandOnDev(ctx, "python", command)
|
2022-05-14 17:55:00 +00:00
|
|
|
}
|
2022-09-07 09:55:59 +00:00
|
|
|
*/
|
|
|
|
|
2022-09-16 09:06:58 +00:00
|
|
|
// TODO: Add safe access to p.project and p.project.DevCluster that throws errors if
|
2022-09-07 09:55:59 +00:00
|
|
|
// the fields are not defined properly
|
2022-09-16 09:06:58 +00:00
|
|
|
func (p *project) GetDevelopmentClusterId(ctx context.Context) (clusterId string, err error) {
|
|
|
|
clusterId = p.config.DevCluster.ClusterId
|
|
|
|
clusterName := p.config.DevCluster.ClusterName
|
2022-09-07 09:55:59 +00:00
|
|
|
if clusterId != "" {
|
|
|
|
return
|
|
|
|
} else if clusterName != "" {
|
|
|
|
// Add workspaces client on init
|
2022-09-16 09:06:58 +00:00
|
|
|
return getClusterIdFromClusterName(ctx, p.wsc, clusterName)
|
2022-09-07 09:55:59 +00:00
|
|
|
} else {
|
|
|
|
// TODO: Add the project config file location used to error message
|
|
|
|
err = fmt.Errorf("please define either development cluster's cluster_id or cluster_name in your project config")
|
|
|
|
return
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2022-09-27 16:58:55 +00:00
|
|
|
func runCommandOnDev(ctx context.Context, language, command string) commands.Results {
|
2022-09-16 09:06:58 +00:00
|
|
|
clusterId, err := Get(ctx).GetDevelopmentClusterId(ctx)
|
2022-09-07 09:55:59 +00:00
|
|
|
if err != nil {
|
2022-09-27 16:58:55 +00:00
|
|
|
return commands.Results{
|
2022-09-07 09:55:59 +00:00
|
|
|
ResultType: "error",
|
|
|
|
Summary: err.Error(),
|
|
|
|
}
|
|
|
|
}
|
2022-09-27 16:58:55 +00:00
|
|
|
return Get(ctx).wsc.CommandExecutor.Execute(ctx, clusterId, language, command)
|
2022-09-07 09:55:59 +00:00
|
|
|
}
|
|
|
|
|
2022-09-27 16:58:55 +00:00
|
|
|
func RunPythonOnDev(ctx context.Context, command string) commands.Results {
|
2022-09-07 09:55:59 +00:00
|
|
|
return runCommandOnDev(ctx, "python", command)
|
|
|
|
}
|