mirror of https://github.com/databricks/cli.git
119 lines
2.8 KiB
Go
119 lines
2.8 KiB
Go
package python
|
|
|
|
import (
	"fmt"
	"sort"
	"strconv"
	"strings"

	"github.com/databricks/cli/bundle"
	"github.com/databricks/cli/bundle/config/mutator"
	"github.com/databricks/cli/bundle/libraries"
	"github.com/databricks/databricks-sdk-go/service/jobs"
)
|
|
|
|
// NOTEBOOK_TEMPLATE is the text/template source of the Python notebook that
// stands in for a Python wheel task.
//
// Template fields consumed:
//   - .Libraries: iterated with range; each element's .Whl is installed with
//     `%pip install --force-reinstall`.
//   - .Params: inserted verbatim between the brackets of `sys.argv = [...]`,
//     so it must already be a comma-separated list of quoted string literals.
//   - .Task.PackageName / .Task.EntryPoint: the distribution and the entry
//     point name looked up through importlib metadata.
//
// The rendered notebook restarts Python after installing the wheels, runs the
// entry point with stdout redirected into a buffer, and passes the captured
// output to dbutils.notebook.exit. It raises ImportError when the entry point
// is not found.
//
// The Python block bodies below must stay indented: the text is emitted as
// Python source, where indentation is significant.
const NOTEBOOK_TEMPLATE = `# Databricks notebook source
%python
{{range .Libraries}}
%pip install --force-reinstall {{.Whl}}
{{end}}

dbutils.library.restartPython()

try:
	from importlib import metadata
except ImportError: # for Python<3.8
	import subprocess
	import sys

	subprocess.check_call([sys.executable, "-m", "pip", "install", "importlib-metadata"])
	import importlib_metadata as metadata

from contextlib import redirect_stdout
import io
import sys
sys.argv = [{{.Params}}]

entry = [ep for ep in metadata.distribution("{{.Task.PackageName}}").entry_points if ep.name == "{{.Task.EntryPoint}}"]

f = io.StringIO()
with redirect_stdout(f):
	if entry:
		entry[0].load()()
	else:
		raise ImportError("Entry point '{{.Task.EntryPoint}}' not found")
s = f.getvalue()
dbutils.notebook.exit(s)
`
|
|
|
|
// This mutator takes the wheel task and transforms it into notebook
|
|
// which installs uploaded wheels using %pip and then calling corresponding
|
|
// entry point.
|
|
func TransformWheelTask() bundle.Mutator {
|
|
return mutator.NewTrampoline(
|
|
"python_wheel",
|
|
&pythonTrampoline{},
|
|
NOTEBOOK_TEMPLATE,
|
|
)
|
|
}
|
|
|
|
// pythonTrampoline is the stateless value handed to mutator.NewTrampoline by
// TransformWheelTask. Its methods select the tasks to transform (GetTasks),
// build the data for the notebook template (GetTemplateData) and clear the
// wheel-specific fields of a task (CleanUp).
type pythonTrampoline struct{}
|
|
|
|
func (t *pythonTrampoline) CleanUp(task *jobs.Task) error {
|
|
task.PythonWheelTask = nil
|
|
task.Libraries = nil
|
|
|
|
return nil
|
|
}
|
|
|
|
func (t *pythonTrampoline) GetTasks(b *bundle.Bundle) []mutator.TaskWithJobKey {
|
|
r := b.Config.Resources
|
|
result := make([]mutator.TaskWithJobKey, 0)
|
|
for k := range b.Config.Resources.Jobs {
|
|
tasks := r.Jobs[k].JobSettings.Tasks
|
|
for i := range tasks {
|
|
task := &tasks[i]
|
|
|
|
// Keep only Python wheel tasks with local libraries referenced
|
|
if task.PythonWheelTask == nil || !libraries.IsTaskWithLocalLibraries(task) {
|
|
continue
|
|
}
|
|
|
|
result = append(result, mutator.TaskWithJobKey{
|
|
JobKey: k,
|
|
Task: task,
|
|
})
|
|
}
|
|
}
|
|
return result
|
|
}
|
|
|
|
func (t *pythonTrampoline) GetTemplateData(task *jobs.Task) (map[string]any, error) {
|
|
params, err := t.generateParameters(task.PythonWheelTask)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
data := map[string]any{
|
|
"Libraries": task.Libraries,
|
|
"Params": params,
|
|
"Task": task.PythonWheelTask,
|
|
}
|
|
|
|
return data, nil
|
|
}
|
|
|
|
func (t *pythonTrampoline) generateParameters(task *jobs.PythonWheelTask) (string, error) {
|
|
if task.Parameters != nil && task.NamedParameters != nil {
|
|
return "", fmt.Errorf("not allowed to pass both paramaters and named_parameters")
|
|
}
|
|
params := append([]string{"python"}, task.Parameters...)
|
|
for k, v := range task.NamedParameters {
|
|
params = append(params, fmt.Sprintf("%s=%s", k, v))
|
|
}
|
|
|
|
for i := range params {
|
|
params[i] = strconv.Quote(params[i])
|
|
}
|
|
return strings.Join(params, ", "), nil
|
|
}
|