Retry app deployment if there is an active deployment in progress (#2153)

## Changes
If before running an app, the app was stopped with an active deployment,
then Apps backend start it and does the auto-deploy of the last active
deployment. In such cases StartApp API won't return any active or
pending deployments in its response but doing the deploy immediately
after the start might result in the error `Cannot deploy app *** as
there is an active deployment in progress`.

From DABs side, we have to do a new deployment on every `bundle run`
(command which start the app and does deployment) because local files in
bundle might have been changed and users expect to have the app running
with new code.

Thus this PR works around the error by catching “deployment in progress”
error, getting any active / pending deployments, waits for them to
finish and start the new deployment again. If 2nd attempts fails, the
whole command fails.

## Tests
Added unit test.
This commit is contained in:
Andrew Nester 2025-01-15 12:51:06 +01:00 committed by GitHub
parent 626045a17e
commit dd554412a6
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194
2 changed files with 106 additions and 10 deletions

View File

@ -10,6 +10,7 @@ import (
"github.com/databricks/cli/bundle/config/resources" "github.com/databricks/cli/bundle/config/resources"
"github.com/databricks/cli/bundle/run/output" "github.com/databricks/cli/bundle/run/output"
"github.com/databricks/cli/libs/cmdio" "github.com/databricks/cli/libs/cmdio"
"github.com/databricks/databricks-sdk-go"
"github.com/databricks/databricks-sdk-go/service/apps" "github.com/databricks/databricks-sdk-go/service/apps"
"github.com/spf13/cobra" "github.com/spf13/cobra"
) )
@ -111,11 +112,21 @@ func (a *appRunner) start(ctx context.Context) error {
// active and pending deployments fields (if any). If there are active or pending deployments, // active and pending deployments fields (if any). If there are active or pending deployments,
// we need to wait for them to complete before we can do the new deployment. // we need to wait for them to complete before we can do the new deployment.
// Otherwise, the new deployment will fail. // Otherwise, the new deployment will fail.
// Thus, we first wait for the active deployment to complete. err = waitForDeploymentToComplete(ctx, w, startedApp)
if startedApp.ActiveDeployment != nil && if err != nil {
startedApp.ActiveDeployment.Status.State == apps.AppDeploymentStateInProgress { return err
}
logProgress(ctx, "App is started!")
return nil
}
func waitForDeploymentToComplete(ctx context.Context, w *databricks.WorkspaceClient, app *apps.App) error {
// We first wait for the active deployment to complete.
if app.ActiveDeployment != nil &&
app.ActiveDeployment.Status.State == apps.AppDeploymentStateInProgress {
logProgress(ctx, "Waiting for the active deployment to complete...") logProgress(ctx, "Waiting for the active deployment to complete...")
_, err = w.Apps.WaitGetDeploymentAppSucceeded(ctx, app.Name, startedApp.ActiveDeployment.DeploymentId, 20*time.Minute, nil) _, err := w.Apps.WaitGetDeploymentAppSucceeded(ctx, app.Name, app.ActiveDeployment.DeploymentId, 20*time.Minute, nil)
if err != nil { if err != nil {
return err return err
} }
@ -123,17 +134,16 @@ func (a *appRunner) start(ctx context.Context) error {
} }
// Then, we wait for the pending deployment to complete. // Then, we wait for the pending deployment to complete.
if startedApp.PendingDeployment != nil && if app.PendingDeployment != nil &&
startedApp.PendingDeployment.Status.State == apps.AppDeploymentStateInProgress { app.PendingDeployment.Status.State == apps.AppDeploymentStateInProgress {
logProgress(ctx, "Waiting for the pending deployment to complete...") logProgress(ctx, "Waiting for the pending deployment to complete...")
_, err = w.Apps.WaitGetDeploymentAppSucceeded(ctx, app.Name, startedApp.PendingDeployment.DeploymentId, 20*time.Minute, nil) _, err := w.Apps.WaitGetDeploymentAppSucceeded(ctx, app.Name, app.PendingDeployment.DeploymentId, 20*time.Minute, nil)
if err != nil { if err != nil {
return err return err
} }
logProgress(ctx, "Pending deployment is completed!") logProgress(ctx, "Pending deployment is completed!")
} }
logProgress(ctx, "App is started!")
return nil return nil
} }
@ -142,18 +152,40 @@ func (a *appRunner) deploy(ctx context.Context) error {
b := a.bundle b := a.bundle
w := b.WorkspaceClient() w := b.WorkspaceClient()
sourceCodePath := app.SourceCodePath
wait, err := w.Apps.Deploy(ctx, apps.CreateAppDeploymentRequest{ wait, err := w.Apps.Deploy(ctx, apps.CreateAppDeploymentRequest{
AppName: app.Name, AppName: app.Name,
AppDeployment: &apps.AppDeployment{ AppDeployment: &apps.AppDeployment{
Mode: apps.AppDeploymentModeSnapshot, Mode: apps.AppDeploymentModeSnapshot,
SourceCodePath: app.SourceCodePath, SourceCodePath: sourceCodePath,
}, },
}) })
// If deploy returns an error, then there's an active deployment in progress, wait for it to complete. // If deploy returns an error, then there's an active deployment in progress, wait for it to complete.
// For this we first need to get an app and its acrive and pending deployments and then wait for them.
if err != nil {
app, err := w.Apps.Get(ctx, apps.GetAppRequest{Name: app.Name})
if err != nil {
return fmt.Errorf("failed to get app %s: %w", app.Name, err)
}
err = waitForDeploymentToComplete(ctx, w, app)
if err != nil { if err != nil {
return err return err
} }
// Now we can try to deploy the app again
wait, err = w.Apps.Deploy(ctx, apps.CreateAppDeploymentRequest{
AppName: app.Name,
AppDeployment: &apps.AppDeployment{
Mode: apps.AppDeploymentModeSnapshot,
SourceCodePath: sourceCodePath,
},
})
if err != nil {
return err
}
}
_, err = wait.OnProgress(func(ad *apps.AppDeployment) { _, err = wait.OnProgress(func(ad *apps.AppDeployment) {
if ad.Status == nil { if ad.Status == nil {
return return

View File

@ -3,6 +3,7 @@ package run
import ( import (
"bytes" "bytes"
"context" "context"
"errors"
"os" "os"
"path/filepath" "path/filepath"
"testing" "testing"
@ -189,6 +190,69 @@ func TestAppRunWithAnActiveDeploymentInProgress(t *testing.T) {
r.run(t) r.run(t)
} }
func TestAppDeployWithDeploymentInProgress(t *testing.T) {
ctx, b, mwc := setupBundle(t)
appApi := mwc.GetMockAppsAPI()
appApi.EXPECT().Get(mock.Anything, apps.GetAppRequest{
Name: "my_app",
}).Return(&apps.App{
Name: "my_app",
AppStatus: &apps.ApplicationStatus{
State: apps.ApplicationStateRunning,
},
ComputeStatus: &apps.ComputeStatus{
State: apps.ComputeStateActive,
},
}, nil).Once()
wait := &apps.WaitGetDeploymentAppSucceeded[apps.AppDeployment]{
Poll: func(_ time.Duration, _ func(*apps.AppDeployment)) (*apps.AppDeployment, error) {
return nil, nil
},
}
// First deployment fails
appApi.EXPECT().Deploy(mock.Anything, apps.CreateAppDeploymentRequest{
AppName: "my_app",
AppDeployment: &apps.AppDeployment{
Mode: apps.AppDeploymentModeSnapshot,
SourceCodePath: "/Workspace/Users/foo@bar.com/files/my_app",
},
}).Return(nil, errors.New("deployment in progress")).Once()
// After first deployment fails, we should get the app and wait for the deployment to complete
appApi.EXPECT().Get(mock.Anything, apps.GetAppRequest{
Name: "my_app",
}).Return(&apps.App{
Name: "my_app",
ActiveDeployment: &apps.AppDeployment{
DeploymentId: "active_deployment_id",
Status: &apps.AppDeploymentStatus{
State: apps.AppDeploymentStateInProgress,
},
},
}, nil).Once()
appApi.EXPECT().WaitGetDeploymentAppSucceeded(mock.Anything, "my_app", "active_deployment_id", mock.Anything, mock.Anything).Return(nil, nil)
// Second one should succeeed
appApi.EXPECT().Deploy(mock.Anything, apps.CreateAppDeploymentRequest{
AppName: "my_app",
AppDeployment: &apps.AppDeployment{
Mode: apps.AppDeploymentModeSnapshot,
SourceCodePath: "/Workspace/Users/foo@bar.com/files/my_app",
},
}).Return(wait, nil).Once()
r := &testAppRunner{
m: mwc,
b: b,
ctx: ctx,
}
r.run(t)
}
func TestStopApp(t *testing.T) { func TestStopApp(t *testing.T) {
ctx, b, mwc := setupBundle(t) ctx, b, mwc := setupBundle(t)
appsApi := mwc.GetMockAppsAPI() appsApi := mwc.GetMockAppsAPI()