databricks-cli/bundle/run/job_options.go

package run

import (
	"fmt"
	"strconv"

	"github.com/databricks/cli/bundle/config/resources"
	"github.com/databricks/databricks-sdk-go/service/jobs"
	flag "github.com/spf13/pflag"
)

// JobOptions defines options for running a job.
type JobOptions struct {
	// Task parameters are specific to the type of task.
	dbtCommands       []string
	jarParams         []string
	notebookParams    map[string]string
	pipelineParams    map[string]string
	pythonNamedParams map[string]string
	pythonParams      []string
	sparkSubmitParams []string
	sqlParams         map[string]string

	// Job parameters are a map of key-value pairs that are passed to the job.
	// If a job uses job parameters, it cannot use task parameters.
	// Also see https://docs.databricks.com/en/workflows/jobs/settings.html#add-parameters-for-all-job-tasks.
	jobParams map[string]string
}
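
// For illustration: the task parameters above correspond to the per-task-type
// flags such as --notebook-params, while jobParams corresponds to the
// job-level --params flag. A sketch of the two invocation styles ("my_job" is
// a hypothetical bundle resource key):
//
//	databricks bundle run my_job --notebook-params key=value  // task parameters
//	databricks bundle run my_job --params key=value            // job parameters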

func (o *JobOptions) DefineJobOptions(fs *flag.FlagSet) {
	fs.StringToStringVar(&o.jobParams, "params", nil, "comma separated k=v pairs for job parameters")
}

func (o *JobOptions) DefineTaskOptions(fs *flag.FlagSet) {
	fs.StringSliceVar(&o.dbtCommands, "dbt-commands", nil, "A list of commands to execute for jobs with DBT tasks.")
	fs.StringSliceVar(&o.jarParams, "jar-params", nil, "A list of parameters for jobs with Spark JAR tasks.")
	fs.StringToStringVar(&o.notebookParams, "notebook-params", nil, "A map from keys to values for jobs with notebook tasks.")
	fs.StringToStringVar(&o.pipelineParams, "pipeline-params", nil, "A map from keys to values for jobs with pipeline tasks.")
	fs.StringToStringVar(&o.pythonNamedParams, "python-named-params", nil, "A map from keys to values for jobs with Python wheel tasks.")
	fs.StringSliceVar(&o.pythonParams, "python-params", nil, "A list of parameters for jobs with Python tasks.")
	fs.StringSliceVar(&o.sparkSubmitParams, "spark-submit-params", nil, "A list of parameters for jobs with Spark submit tasks.")
	fs.StringToStringVar(&o.sqlParams, "sql-params", nil, "A map from keys to values for jobs with SQL tasks.")
}
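
// A minimal sketch of wiring these definitions onto a flag set (the actual
// command wiring lives elsewhere in the CLI; the flag set name here is a
// placeholder):
//
//	opts := &JobOptions{}
//	fs := flag.NewFlagSet("run", flag.ContinueOnError)
//	opts.DefineJobOptions(fs)
//	opts.DefineTaskOptions(fs)
//	if err := fs.Parse([]string{"--notebook-params", "key=value"}); err != nil {
//		// handle flag parsing errors
//	}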

func (o *JobOptions) hasTaskParametersConfigured() bool {
	return len(o.dbtCommands) > 0 ||
		len(o.jarParams) > 0 ||
		len(o.notebookParams) > 0 ||
		len(o.pipelineParams) > 0 ||
		len(o.pythonNamedParams) > 0 ||
		len(o.pythonParams) > 0 ||
		len(o.sparkSubmitParams) > 0 ||
		len(o.sqlParams) > 0
}

func (o *JobOptions) hasJobParametersConfigured() bool {
	return len(o.jobParams) > 0
}

// Validate returns an error if the combination of options is not valid for the given job.
func (o *JobOptions) Validate(job *resources.Job) error {
	if job == nil {
		return fmt.Errorf("job not defined")
	}

	// Ensure mutual exclusion on job parameters and task parameters.
	hasJobParams := len(job.Parameters) > 0
	if hasJobParams && o.hasTaskParametersConfigured() {
		return fmt.Errorf("the job to run defines job parameters; specifying task parameters is not allowed")
	}
	if !hasJobParams && o.hasJobParametersConfigured() {
		return fmt.Errorf("the job to run does not define job parameters; specifying job parameters is not allowed")
	}

	return nil
}
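
// For example (illustrative; jobWithParams stands for a job whose settings
// define job-level parameters):
//
//	opts := &JobOptions{notebookParams: map[string]string{"key": "value"}}
//	err := opts.Validate(jobWithParams) // error: task parameters on a job that defines job parameters
//
// The reverse combination, --params on a job without job-level parameters, is
// rejected by the second check.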

func (o *JobOptions) validatePipelineParams() (*jobs.PipelineParams, error) {
	if len(o.pipelineParams) == 0 {
		return nil, nil
	}

	var defaultErr = fmt.Errorf("job run argument --pipeline-params only supports `full_refresh=<bool>`")
	v, ok := o.pipelineParams["full_refresh"]
	if !ok {
		return nil, defaultErr
	}

	b, err := strconv.ParseBool(v)
	if err != nil {
		return nil, defaultErr
	}

	pipelineParams := &jobs.PipelineParams{
		FullRefresh: b,
	}

	return pipelineParams, nil
}
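
// Illustrative: only the full_refresh key is understood, e.g.
// --pipeline-params full_refresh=true on the command line:
//
//	opts := &JobOptions{pipelineParams: map[string]string{"full_refresh": "true"}}
//	pp, err := opts.validatePipelineParams() // pp.FullRefresh == true, err == nil
//
// Any other key, or a non-boolean value, yields the error above.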

func (o *JobOptions) toPayload(job *resources.Job, jobID int64) (*jobs.RunNow, error) {
	if err := o.Validate(job); err != nil {
		return nil, err
	}

	pipelineParams, err := o.validatePipelineParams()
	if err != nil {
		return nil, err
	}

	payload := &jobs.RunNow{
		JobId:             jobID,
		DbtCommands:       o.dbtCommands,
		JarParams:         o.jarParams,
		NotebookParams:    o.notebookParams,
		PipelineParams:    pipelineParams,
		PythonNamedParams: o.pythonNamedParams,
		PythonParams:      o.pythonParams,
		SparkSubmitParams: o.sparkSubmitParams,
		SqlParams:         o.sqlParams,
		JobParameters:     o.jobParams,
	}

	return payload, nil
}
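
// A sketch of how the payload might be used (123 is a hypothetical job ID; the
// actual call site is elsewhere in this package):
//
//	payload, err := opts.toPayload(job, 123)
//	if err != nil {
//		// invalid option combination or pipeline params
//	}
//	// payload is a jobs.RunNow request that can be passed to the Jobs RunNow API via the SDK.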