2024-10-15 13:22:41 +00:00
package libraries
import (
"context"
"fmt"
"path"
"strings"
"github.com/databricks/cli/bundle"
"github.com/databricks/cli/libs/diag"
"github.com/databricks/cli/libs/dyn"
"github.com/databricks/cli/libs/dyn/dynvar"
"github.com/databricks/cli/libs/filer"
)
2024-11-29 01:45:33 +00:00
func extractVolumeFromPath ( artifactPath string ) ( string , string , string , error ) {
if ! IsVolumesPath ( artifactPath ) {
return "" , "" , "" , fmt . Errorf ( "expected artifact_path to start with /Volumes/, got %s" , artifactPath )
}
parts := strings . Split ( artifactPath , "/" )
volumeFormatErr := fmt . Errorf ( "expected UC volume path to be in the format /Volumes/<catalog>/<schema>/<volume>/..., got %s" , artifactPath )
// Incorrect format.
if len ( parts ) < 5 {
return "" , "" , "" , volumeFormatErr
}
catalogName := parts [ 2 ]
schemaName := parts [ 3 ]
volumeName := parts [ 4 ]
// Incorrect format.
if catalogName == "" || schemaName == "" || volumeName == "" {
return "" , "" , "" , volumeFormatErr
}
return catalogName , schemaName , volumeName , nil
}
2024-10-15 13:22:41 +00:00
// This function returns a filer for ".internal" folder inside the directory configured
// at `workspace.artifact_path`.
// This function also checks if the UC volume exists in the workspace and then:
// 1. If the UC volume exists in the workspace:
// Returns a filer for the UC volume.
// 2. If the UC volume does not exist in the workspace but is (with high confidence) defined in
// the bundle configuration:
// Returns an error and a warning that instructs the user to deploy the
// UC volume before using it in the artifact path.
// 3. If the UC volume does not exist in the workspace and is not defined in the bundle configuration:
// Returns an error.
func filerForVolume ( ctx context . Context , b * bundle . Bundle ) ( filer . Filer , string , diag . Diagnostics ) {
artifactPath := b . Config . Workspace . ArtifactPath
w := b . WorkspaceClient ( )
2024-11-29 01:31:33 +00:00
if ! IsVolumesPath ( artifactPath ) {
2024-10-15 13:27:58 +00:00
return nil , "" , diag . Errorf ( "expected artifact_path to start with /Volumes/, got %s" , artifactPath )
}
2024-11-29 01:45:33 +00:00
catalogName , schemaName , volumeName , err := extractVolumeFromPath ( artifactPath )
if err != nil {
return nil , "" , diag . Diagnostics {
{
Severity : diag . Error ,
Summary : err . Error ( ) ,
Locations : b . Config . GetLocations ( "workspace.artifact_path" ) ,
Paths : [ ] dyn . Path { dyn . MustPathFromString ( "workspace.artifact_path" ) } ,
} ,
}
2024-10-15 13:22:41 +00:00
}
// Check if the UC volume exists in the workspace.
volumePath := fmt . Sprintf ( "/Volumes/%s/%s/%s" , catalogName , schemaName , volumeName )
2024-11-29 01:45:33 +00:00
err = w . Files . GetDirectoryMetadataByDirectoryPath ( ctx , volumePath )
2024-10-15 13:22:41 +00:00
// If the volume exists already, directly return the filer for the path to
// upload the artifacts to.
if err == nil {
uploadPath := path . Join ( artifactPath , ".internal" )
f , err := filer . NewFilesClient ( w , uploadPath )
return f , uploadPath , diag . FromErr ( err )
}
diags := diag . Errorf ( "failed to fetch metadata for the UC volume %s that is configured in the artifact_path: %s" , volumePath , err )
path , locations , ok := findVolumeInBundle ( b , catalogName , schemaName , volumeName )
if ! ok {
return nil , "" , diags
}
warning := diag . Diagnostic {
Severity : diag . Warning ,
Summary : ` You might be using a UC volume in your artifact_path that is managed by this bundle but which has not been deployed yet. Please deploy the UC volume in a separate bundle deploy before using it in the artifact_path. ` ,
Locations : locations ,
Paths : [ ] dyn . Path { path } ,
}
return nil , "" , diags . Append ( warning )
}
func findVolumeInBundle ( b * bundle . Bundle , catalogName , schemaName , volumeName string ) ( dyn . Path , [ ] dyn . Location , bool ) {
volumes := b . Config . Resources . Volumes
for k , v := range volumes {
if v . CatalogName != catalogName || v . Name != volumeName {
continue
}
// UC schemas can be defined in the bundle itself, and thus might be interpolated
// at runtime via the ${resources.schemas.<name>} syntax. Thus we match the volume
// definition if the schema name is the same as the one in the bundle, or if the
// schema name is interpolated.
2024-10-15 16:04:20 +00:00
// We only have to check for ${resources.schemas...} references because any
// other valid reference (like ${var.foo}) would have been interpolated by this point.
p , ok := dynvar . PureReferenceToPath ( v . SchemaName )
isSchemaDefinedInBundle := ok && p . HasPrefix ( dyn . Path { dyn . Key ( "resources" ) , dyn . Key ( "schemas" ) } )
if v . SchemaName != schemaName && ! isSchemaDefinedInBundle {
2024-10-15 13:22:41 +00:00
continue
}
pathString := fmt . Sprintf ( "resources.volumes.%s" , k )
return dyn . MustPathFromString ( pathString ) , b . Config . GetLocations ( pathString ) , true
}
return nil , nil , false
}