package internal import ( "bytes" "context" "encoding/json" "errors" "io" "io/fs" "path" "regexp" "strings" "testing" "github.com/databricks/cli/libs/filer" "github.com/stretchr/testify/assert" "github.com/stretchr/testify/require" ) type filerTest struct { *testing.T filer.Filer } func (f filerTest) assertContents(ctx context.Context, name string, contents string) { reader, err := f.Read(ctx, name) if !assert.NoError(f, err) { return } defer reader.Close() var body bytes.Buffer _, err = io.Copy(&body, reader) if !assert.NoError(f, err) { return } assert.Equal(f, contents, body.String()) } func (f filerTest) assertContentsJupyter(ctx context.Context, name string, language string) { reader, err := f.Read(ctx, name) if !assert.NoError(f, err) { return } defer reader.Close() var body bytes.Buffer _, err = io.Copy(&body, reader) if !assert.NoError(f, err) { return } var actual map[string]any err = json.Unmarshal(body.Bytes(), &actual) if !assert.NoError(f, err) { return } // Since a roundtrip to the workspace changes a Jupyter notebook's payload, // the best we can do is assert that the nbformat is correct. assert.EqualValues(f, 4, actual["nbformat"]) assert.Equal(f, language, actual["metadata"].(map[string]any)["language_info"].(map[string]any)["name"]) } func (f filerTest) assertNotExists(ctx context.Context, name string) { _, err := f.Stat(ctx, name) assert.ErrorIs(f, err, fs.ErrNotExist) } func commonFilerRecursiveDeleteTest(t *testing.T, ctx context.Context, f filer.Filer) { var err error err = f.Write(ctx, "dir/file1", strings.NewReader("content1"), filer.CreateParentDirectories) require.NoError(t, err) filerTest{t, f}.assertContents(ctx, "dir/file1", `content1`) err = f.Write(ctx, "dir/file2", strings.NewReader("content2"), filer.CreateParentDirectories) require.NoError(t, err) filerTest{t, f}.assertContents(ctx, "dir/file2", `content2`) err = f.Write(ctx, "dir/subdir1/file3", strings.NewReader("content3"), filer.CreateParentDirectories) require.NoError(t, err) filerTest{t, f}.assertContents(ctx, "dir/subdir1/file3", `content3`) err = f.Write(ctx, "dir/subdir1/file4", strings.NewReader("content4"), filer.CreateParentDirectories) require.NoError(t, err) filerTest{t, f}.assertContents(ctx, "dir/subdir1/file4", `content4`) err = f.Write(ctx, "dir/subdir2/file5", strings.NewReader("content5"), filer.CreateParentDirectories) require.NoError(t, err) filerTest{t, f}.assertContents(ctx, "dir/subdir2/file5", `content5`) err = f.Write(ctx, "dir/subdir2/file6", strings.NewReader("content6"), filer.CreateParentDirectories) require.NoError(t, err) filerTest{t, f}.assertContents(ctx, "dir/subdir2/file6", `content6`) entriesBeforeDelete, err := f.ReadDir(ctx, "dir") require.NoError(t, err) assert.Len(t, entriesBeforeDelete, 4) names := []string{} for _, e := range entriesBeforeDelete { names = append(names, e.Name()) } assert.Equal(t, names, []string{"file1", "file2", "subdir1", "subdir2"}) err = f.Delete(ctx, "dir") assert.ErrorAs(t, err, &filer.DirectoryNotEmptyError{}) err = f.Delete(ctx, "dir", filer.DeleteRecursively) assert.NoError(t, err) _, err = f.ReadDir(ctx, "dir") assert.ErrorAs(t, err, &filer.NoSuchDirectoryError{}) } func TestFilerRecursiveDelete(t *testing.T) { t.Parallel() for _, testCase := range []struct { name string f func(t *testing.T) (filer.Filer, string) }{ {"local", setupLocalFiler}, {"workspace files", setupWsfsFiler}, {"dbfs", setupDbfsFiler}, {"files", setupUcVolumesFiler}, {"workspace files extensions", setupWsfsExtensionsFiler}, } { tc := testCase t.Run(testCase.name, func(t *testing.T) { t.Parallel() f, _ := tc.f(t) ctx := context.Background() // Common tests we run across all filers to ensure consistent behavior. commonFilerRecursiveDeleteTest(t, ctx, f) }) } } // Common tests we run across all filers to ensure consistent behavior. func commonFilerReadWriteTests(t *testing.T, ctx context.Context, f filer.Filer) { var err error // Write should fail because the intermediate directory doesn't exist. err = f.Write(ctx, "/foo/bar", strings.NewReader(`hello world`)) assert.True(t, errors.As(err, &filer.NoSuchDirectoryError{})) assert.True(t, errors.Is(err, fs.ErrNotExist)) // Read should fail because the intermediate directory doesn't yet exist. _, err = f.Read(ctx, "/foo/bar") assert.True(t, errors.As(err, &filer.FileDoesNotExistError{})) assert.True(t, errors.Is(err, fs.ErrNotExist)) // Read should fail because the path points to a directory err = f.Mkdir(ctx, "/dir") require.NoError(t, err) _, err = f.Read(ctx, "/dir") assert.ErrorIs(t, err, fs.ErrInvalid) // Write with CreateParentDirectories flag should succeed. err = f.Write(ctx, "/foo/bar", strings.NewReader(`hello world`), filer.CreateParentDirectories) assert.NoError(t, err) filerTest{t, f}.assertContents(ctx, "/foo/bar", `hello world`) // Write should fail because there is an existing file at the specified path. err = f.Write(ctx, "/foo/bar", strings.NewReader(`hello universe`)) assert.True(t, errors.As(err, &filer.FileAlreadyExistsError{})) assert.True(t, errors.Is(err, fs.ErrExist)) // Write with OverwriteIfExists should succeed. err = f.Write(ctx, "/foo/bar", strings.NewReader(`hello universe`), filer.OverwriteIfExists) assert.NoError(t, err) filerTest{t, f}.assertContents(ctx, "/foo/bar", `hello universe`) // Write should succeed if there is no existing file at the specified path. err = f.Write(ctx, "/foo/qux", strings.NewReader(`hello universe`)) assert.NoError(t, err) // Stat on a directory should succeed. // Note: size and modification time behave differently between backends. info, err := f.Stat(ctx, "/foo") require.NoError(t, err) assert.Equal(t, "foo", info.Name()) assert.True(t, info.Mode().IsDir()) assert.Equal(t, true, info.IsDir()) // Stat on a file should succeed. // Note: size and modification time behave differently between backends. info, err = f.Stat(ctx, "/foo/bar") require.NoError(t, err) assert.Equal(t, "bar", info.Name()) assert.True(t, info.Mode().IsRegular()) assert.Equal(t, false, info.IsDir()) // Delete should fail if the file doesn't exist. err = f.Delete(ctx, "/doesnt_exist") assert.ErrorAs(t, err, &filer.FileDoesNotExistError{}) assert.True(t, errors.Is(err, fs.ErrNotExist)) // Stat should fail if the file doesn't exist. _, err = f.Stat(ctx, "/doesnt_exist") assert.ErrorAs(t, err, &filer.FileDoesNotExistError{}) assert.True(t, errors.Is(err, fs.ErrNotExist)) // Delete should succeed for file that does exist. err = f.Delete(ctx, "/foo/bar") assert.NoError(t, err) // Delete should fail for a non-empty directory. err = f.Delete(ctx, "/foo") assert.ErrorAs(t, err, &filer.DirectoryNotEmptyError{}) assert.True(t, errors.Is(err, fs.ErrInvalid)) // Delete should succeed for a non-empty directory if the DeleteRecursively flag is set. err = f.Delete(ctx, "/foo", filer.DeleteRecursively) assert.NoError(t, err) // Delete of the filer root should ALWAYS fail, otherwise subsequent writes would fail. // It is not in the filer's purview to delete its root directory. err = f.Delete(ctx, "/") assert.True(t, errors.As(err, &filer.CannotDeleteRootError{})) assert.True(t, errors.Is(err, fs.ErrInvalid)) } func TestFilerReadWrite(t *testing.T) { t.Parallel() for _, testCase := range []struct { name string f func(t *testing.T) (filer.Filer, string) }{ {"local", setupLocalFiler}, {"workspace files", setupWsfsFiler}, {"dbfs", setupDbfsFiler}, {"files", setupUcVolumesFiler}, {"workspace files extensions", setupWsfsExtensionsFiler}, } { tc := testCase t.Run(testCase.name, func(t *testing.T) { t.Parallel() f, _ := tc.f(t) ctx := context.Background() // Common tests we run across all filers to ensure consistent behavior. commonFilerReadWriteTests(t, ctx, f) }) } } // Common tests we run across all filers to ensure consistent behavior. func commonFilerReadDirTest(t *testing.T, ctx context.Context, f filer.Filer) { var err error var info fs.FileInfo // We start with an empty directory. entries, err := f.ReadDir(ctx, ".") require.NoError(t, err) assert.Len(t, entries, 0) // Write a file. err = f.Write(ctx, "/hello.txt", strings.NewReader(`hello world`)) require.NoError(t, err) // Create a directory. err = f.Mkdir(ctx, "/dir") require.NoError(t, err) // Write a file. err = f.Write(ctx, "/dir/world.txt", strings.NewReader(`hello world`)) require.NoError(t, err) // Create a nested directory (check that it creates intermediate directories). err = f.Mkdir(ctx, "/dir/a/b/c") require.NoError(t, err) // Expect an error if the path doesn't exist. _, err = f.ReadDir(ctx, "/dir/a/b/c/d/e") assert.True(t, errors.As(err, &filer.NoSuchDirectoryError{}), err) assert.True(t, errors.Is(err, fs.ErrNotExist)) // Expect two entries in the root. entries, err = f.ReadDir(ctx, ".") require.NoError(t, err) assert.Len(t, entries, 2) assert.Equal(t, "dir", entries[0].Name()) assert.True(t, entries[0].IsDir()) assert.Equal(t, "hello.txt", entries[1].Name()) assert.False(t, entries[1].IsDir()) info, err = entries[1].Info() require.NoError(t, err) assert.Greater(t, info.ModTime().Unix(), int64(0)) // Expect two entries in the directory. entries, err = f.ReadDir(ctx, "/dir") require.NoError(t, err) assert.Len(t, entries, 2) assert.Equal(t, "a", entries[0].Name()) assert.True(t, entries[0].IsDir()) assert.Equal(t, "world.txt", entries[1].Name()) assert.False(t, entries[1].IsDir()) info, err = entries[1].Info() require.NoError(t, err) assert.Greater(t, info.ModTime().Unix(), int64(0)) // Expect a single entry in the nested path. entries, err = f.ReadDir(ctx, "/dir/a/b") require.NoError(t, err) assert.Len(t, entries, 1) assert.Equal(t, "c", entries[0].Name()) assert.True(t, entries[0].IsDir()) // Expect an error trying to call ReadDir on a file _, err = f.ReadDir(ctx, "/hello.txt") assert.ErrorIs(t, err, fs.ErrInvalid) // Expect 0 entries for an empty directory err = f.Mkdir(ctx, "empty-dir") require.NoError(t, err) entries, err = f.ReadDir(ctx, "empty-dir") assert.NoError(t, err) assert.Len(t, entries, 0) // Expect one entry for a directory with a file in it err = f.Write(ctx, "dir-with-one-file/my-file.txt", strings.NewReader("abc"), filer.CreateParentDirectories) require.NoError(t, err) entries, err = f.ReadDir(ctx, "dir-with-one-file") assert.NoError(t, err) assert.Len(t, entries, 1) assert.Equal(t, entries[0].Name(), "my-file.txt") assert.False(t, entries[0].IsDir()) } func TestFilerReadDir(t *testing.T) { t.Parallel() for _, testCase := range []struct { name string f func(t *testing.T) (filer.Filer, string) }{ {"local", setupLocalFiler}, {"workspace files", setupWsfsFiler}, {"dbfs", setupDbfsFiler}, {"files", setupUcVolumesFiler}, {"workspace files extensions", setupWsfsExtensionsFiler}, } { tc := testCase t.Run(testCase.name, func(t *testing.T) { t.Parallel() f, _ := tc.f(t) ctx := context.Background() commonFilerReadDirTest(t, ctx, f) }) } } func TestAccFilerWorkspaceNotebook(t *testing.T) { t.Parallel() for i := 0; i < 10; i++ { testAccFilerWorkspacenotebook(t) } } func testAccFilerWorkspacenotebook(t *testing.T) { ctx := context.Background() var err error tcases := []struct { name string nameWithoutExt string content1 string expected1 string content2 string expected2 string }{ { name: "pyNb.py", nameWithoutExt: "pyNb", content1: "# Databricks notebook source\nprint('first upload')", expected1: "# Databricks notebook source\nprint('first upload')", content2: "# Databricks notebook source\nprint('second upload')", expected2: "# Databricks notebook source\nprint('second upload')", }, { name: "rNb.r", nameWithoutExt: "rNb", content1: "# Databricks notebook source\nprint('first upload')", expected1: "# Databricks notebook source\nprint('first upload')", content2: "# Databricks notebook source\nprint('second upload')", expected2: "# Databricks notebook source\nprint('second upload')", }, { name: "sqlNb.sql", nameWithoutExt: "sqlNb", content1: "-- Databricks notebook source\n SELECT \"first upload\"", expected1: "-- Databricks notebook source\n SELECT \"first upload\"", content2: "-- Databricks notebook source\n SELECT \"second upload\"", expected2: "-- Databricks notebook source\n SELECT \"second upload\"", }, { name: "scalaNb.scala", nameWithoutExt: "scalaNb", content1: "// Databricks notebook source\n println(\"first upload\")", expected1: "// Databricks notebook source\n println(\"first upload\")", content2: "// Databricks notebook source\n println(\"second upload\")", expected2: "// Databricks notebook source\n println(\"second upload\")", }, { name: "pythonJupyterNb.ipynb", nameWithoutExt: "pythonJupyterNb", content1: readFile(t, "testdata/notebooks/py1.ipynb"), expected1: "# Databricks notebook source\nprint(1)", content2: readFile(t, "testdata/notebooks/py2.ipynb"), expected2: "# Databricks notebook source\nprint(2)", }, { name: "rJupyterNb.ipynb", nameWithoutExt: "rJupyterNb", content1: readFile(t, "testdata/notebooks/r1.ipynb"), expected1: "# Databricks notebook source\nprint(1)", content2: readFile(t, "testdata/notebooks/r2.ipynb"), expected2: "# Databricks notebook source\nprint(2)", }, { name: "scalaJupyterNb.ipynb", nameWithoutExt: "scalaJupyterNb", content1: readFile(t, "testdata/notebooks/scala1.ipynb"), expected1: "// Databricks notebook source\nprintln(1)", content2: readFile(t, "testdata/notebooks/scala2.ipynb"), expected2: "// Databricks notebook source\nprintln(2)", }, { name: "sqlJupyterNotebook.ipynb", nameWithoutExt: "sqlJupyterNotebook", content1: readFile(t, "testdata/notebooks/sql1.ipynb"), expected1: "-- Databricks notebook source\nselect 1", content2: readFile(t, "testdata/notebooks/sql2.ipynb"), expected2: "-- Databricks notebook source\nselect 2", }, } for _, tc := range tcases { f, _ := setupWsfsFiler(t) t.Run(tc.name, func(t *testing.T) { t.Parallel() // Upload the notebook err = f.Write(ctx, tc.name, strings.NewReader(tc.content1)) require.NoError(t, err) // Assert contents after initial upload. Note that we expect the content // for jupyter notebooks to be of type source because the workspace files // client always uses the source format to read notebooks from the workspace. filerTest{t, f}.assertContents(ctx, tc.nameWithoutExt, tc.expected1) // Assert uploading a second time fails due to overwrite mode missing err = f.Write(ctx, tc.name, strings.NewReader(tc.content2)) assert.ErrorIs(t, err, fs.ErrExist) assert.Regexp(t, regexp.MustCompile(`file already exists: .*/`+tc.nameWithoutExt+`$`), err.Error()) // Try uploading the notebook again with overwrite flag. This time it should succeed. err = f.Write(ctx, tc.name, strings.NewReader(tc.content2), filer.OverwriteIfExists) require.NoError(t, err) // Assert contents after second upload filerTest{t, f}.assertContents(ctx, tc.nameWithoutExt, tc.expected2) }) } } func TestFilerWorkspaceFilesExtensionsReadDir(t *testing.T) { t.Parallel() files := []struct { name string content string }{ {"dir1/dir2/dir3/file.txt", "file content"}, {"dir1/notebook.py", "# Databricks notebook source\nprint('first upload'))"}, {"foo.py", "print('foo')"}, {"foo.r", "print('foo')"}, {"foo.scala", "println('foo')"}, {"foo.sql", "SELECT 'foo'"}, {"py1.ipynb", readFile(t, "testdata/notebooks/py1.ipynb")}, {"pyNb.py", "# Databricks notebook source\nprint('first upload'))"}, {"r1.ipynb", readFile(t, "testdata/notebooks/r1.ipynb")}, {"rNb.r", "# Databricks notebook source\nprint('first upload'))"}, {"scala1.ipynb", readFile(t, "testdata/notebooks/scala1.ipynb")}, {"scalaNb.scala", "// Databricks notebook source\n println(\"first upload\"))"}, {"sql1.ipynb", readFile(t, "testdata/notebooks/sql1.ipynb")}, {"sqlNb.sql", "-- Databricks notebook source\n SELECT \"first upload\""}, } // Assert that every file has a unique basename basenames := map[string]struct{}{} for _, f := range files { basename := path.Base(f.name) if _, ok := basenames[basename]; ok { t.Fatalf("basename %s is not unique", basename) } basenames[basename] = struct{}{} } ctx := context.Background() wf, _ := setupWsfsExtensionsFiler(t) for _, f := range files { err := wf.Write(ctx, f.name, strings.NewReader(f.content), filer.CreateParentDirectories) require.NoError(t, err) } // Read entries entries, err := wf.ReadDir(ctx, ".") require.NoError(t, err) names := []string{} for _, e := range entries { names = append(names, e.Name()) } assert.Equal(t, []string{ "dir1", "foo.py", "foo.r", "foo.scala", "foo.sql", "py1.ipynb", "pyNb.py", "r1.ipynb", "rNb.r", "scala1.ipynb", "scalaNb.scala", "sql1.ipynb", "sqlNb.sql", }, names) // Read entries in subdirectory entries, err = wf.ReadDir(ctx, "dir1") require.NoError(t, err) names = []string{} for _, e := range entries { names = append(names, e.Name()) } assert.Equal(t, []string{ "dir2", "notebook.py", }, names) } func setupFilerWithExtensionsTest(t *testing.T) filer.Filer { files := []struct { name string content string }{ {"foo.py", "# Databricks notebook source\nprint('first upload'))"}, {"bar.py", "print('foo')"}, {"p1.ipynb", readFile(t, "testdata/notebooks/py1.ipynb")}, {"r1.ipynb", readFile(t, "testdata/notebooks/r1.ipynb")}, {"scala1.ipynb", readFile(t, "testdata/notebooks/scala1.ipynb")}, {"sql1.ipynb", readFile(t, "testdata/notebooks/sql1.ipynb")}, {"pretender", "not a notebook"}, {"dir/file.txt", "file content"}, {"scala-notebook.scala", "// Databricks notebook source\nprintln('first upload')"}, } ctx := context.Background() wf, _ := setupWsfsExtensionsFiler(t) for _, f := range files { err := wf.Write(ctx, f.name, strings.NewReader(f.content), filer.CreateParentDirectories) require.NoError(t, err) } return wf } func TestFilerWorkspaceFilesExtensionsRead(t *testing.T) { t.Parallel() ctx := context.Background() wf := setupFilerWithExtensionsTest(t) // Read contents of test fixtures as a sanity check. filerTest{t, wf}.assertContents(ctx, "foo.py", "# Databricks notebook source\nprint('first upload'))") filerTest{t, wf}.assertContents(ctx, "bar.py", "print('foo')") filerTest{t, wf}.assertContents(ctx, "dir/file.txt", "file content") filerTest{t, wf}.assertContents(ctx, "scala-notebook.scala", "// Databricks notebook source\nprintln('first upload')") filerTest{t, wf}.assertContents(ctx, "pretender", "not a notebook") filerTest{t, wf}.assertContentsJupyter(ctx, "p1.ipynb", "python") filerTest{t, wf}.assertContentsJupyter(ctx, "r1.ipynb", "r") filerTest{t, wf}.assertContentsJupyter(ctx, "scala1.ipynb", "scala") filerTest{t, wf}.assertContentsJupyter(ctx, "sql1.ipynb", "sql") // Read non-existent file _, err := wf.Read(ctx, "non-existent.py") assert.ErrorIs(t, err, fs.ErrNotExist) // Ensure we do not read a regular file as a notebook _, err = wf.Read(ctx, "pretender.py") assert.ErrorIs(t, err, fs.ErrNotExist) _, err = wf.Read(ctx, "pretender.ipynb") assert.ErrorIs(t, err, fs.ErrNotExist) // Read directory _, err = wf.Read(ctx, "dir") assert.ErrorIs(t, err, fs.ErrInvalid) // Ensure we do not read a Scala notebook as a Python notebook _, err = wf.Read(ctx, "scala-notebook.py") assert.ErrorIs(t, err, fs.ErrNotExist) } func testAccFilerWorkspaceFilesExtensionsDelete(t *testing.T) { ctx := context.Background() wf := setupFilerWithExtensionsTest(t) for _, fileName := range []string{ // notebook "foo.py", // file "bar.py", // python jupyter notebook "p1.ipynb", // R jupyter notebook "r1.ipynb", // Scala jupyter notebook "scala1.ipynb", // SQL jupyter notebook "sql1.ipynb", } { err := wf.Delete(ctx, fileName) require.NoError(t, err) filerTest{t, wf}.assertNotExists(ctx, fileName) } for _, fileName := range []string{ // do not delete non-existent file "non-existent.py", // do not delete a file assuming it is a notebook and stripping the extension "pretender.py", // do not delete a Scala notebook as a Python notebook "scala-notebook.py", // do not delete a file assuming it is a Jupyter notebook and stripping the extension "pretender.ipynb", } { err := wf.Delete(ctx, fileName) assert.ErrorIs(t, err, fs.ErrNotExist) } // Delete directory err := wf.Delete(ctx, "dir") assert.ErrorIs(t, err, fs.ErrInvalid) // Delete directory recursively err = wf.Delete(ctx, "dir", filer.DeleteRecursively) require.NoError(t, err) filerTest{t, wf}.assertNotExists(ctx, "dir") } func TestAccFilerWorkspaceFilesExtensionsDelete(t *testing.T) { t.Parallel() for i := 0; i < 10; i++ { testAccFilerWorkspaceFilesExtensionsDelete(t) } } func TestFilerWorkspaceFilesExtensionsStat(t *testing.T) { t.Parallel() ctx := context.Background() wf := setupFilerWithExtensionsTest(t) for _, fileName := range []string{ // notebook "foo.py", // file "bar.py", // python jupyter notebook "p1.ipynb", // R jupyter notebook "r1.ipynb", // Scala jupyter notebook "scala1.ipynb", // SQL jupyter notebook "sql1.ipynb", } { info, err := wf.Stat(ctx, fileName) require.NoError(t, err) assert.Equal(t, fileName, info.Name()) assert.False(t, info.IsDir()) } // Stat on a directory info, err := wf.Stat(ctx, "dir") require.NoError(t, err) assert.Equal(t, "dir", info.Name()) assert.True(t, info.IsDir()) for _, fileName := range []string{ // non-existent file "non-existent.py", // do not stat a file assuming it is a notebook and stripping the extension "pretender.py", // do not stat a Scala notebook as a Python notebook "scala-notebook.py", // do not read a regular file assuming it is a Jupyter notebook and stripping the extension "pretender.ipynb", } { _, err := wf.Stat(ctx, fileName) assert.ErrorIs(t, err, fs.ErrNotExist) } } func TestWorkspaceFilesExtensionsDirectoriesAreNotNotebooks(t *testing.T) { t.Parallel() ctx := context.Background() wf, _ := setupWsfsExtensionsFiler(t) // Create a directory with an extension err := wf.Mkdir(ctx, "foo") require.NoError(t, err) // Reading foo.py should fail. foo is a directory, not a notebook. _, err = wf.Read(ctx, "foo.py") assert.ErrorIs(t, err, fs.ErrNotExist) } func TestWorkspaceFilesExtensionsNotebooksAreNotReadAsFiles(t *testing.T) { t.Parallel() ctx := context.Background() wf, _ := setupWsfsExtensionsFiler(t) // Create a notebook err := wf.Write(ctx, "foo.ipynb", strings.NewReader(readFile(t, "testdata/notebooks/py1.ipynb"))) require.NoError(t, err) // Reading foo should fail. Even though the WSFS name for the notebook is foo // reading the notebook should only work with the .ipynb extension. _, err = wf.Read(ctx, "foo") assert.ErrorIs(t, err, fs.ErrNotExist) _, err = wf.Read(ctx, "foo.ipynb") assert.NoError(t, err) } func TestWorkspaceFilesExtensionsNotebooksAreNotStatAsFiles(t *testing.T) { t.Parallel() ctx := context.Background() wf, _ := setupWsfsExtensionsFiler(t) // Create a notebook err := wf.Write(ctx, "foo.ipynb", strings.NewReader(readFile(t, "testdata/notebooks/py1.ipynb"))) require.NoError(t, err) // Stating foo should fail. Even though the WSFS name for the notebook is foo // stating the notebook should only work with the .ipynb extension. _, err = wf.Stat(ctx, "foo") assert.ErrorIs(t, err, fs.ErrNotExist) _, err = wf.Stat(ctx, "foo.ipynb") assert.NoError(t, err) } func testAccWorkspaceFilesExtensionsNotebooksAreNotDeletedAsFiles(t *testing.T) { ctx := context.Background() wf, _ := setupWsfsExtensionsFiler(t) // Create a notebook err := wf.Write(ctx, "foo.ipynb", strings.NewReader(readFile(t, "testdata/notebooks/py1.ipynb"))) require.NoError(t, err) // Deleting foo should fail. Even though the WSFS name for the notebook is foo // deleting the notebook should only work with the .ipynb extension. err = wf.Delete(ctx, "foo") assert.ErrorIs(t, err, fs.ErrNotExist) err = wf.Delete(ctx, "foo.ipynb") assert.NoError(t, err) } func TestAccWorkspaceFilesExtensionsNotebooksAreNotDeletedAsFiles(t *testing.T) { t.Parallel() for i := 0; i < 10; i++ { testAccWorkspaceFilesExtensionsNotebooksAreNotDeletedAsFiles(t) } } func TestWorkspaceFilesExtensions_ExportFormatIsPreserved(t *testing.T) { t.Parallel() // Case 1: Writing source notebooks. for _, tc := range []struct { language string sourceName string sourceContent string jupyterName string jupyterContent string }{ { language: "python", sourceName: "foo.py", sourceContent: "# Databricks notebook source\nprint('foo')", jupyterName: "foo.ipynb", }, { language: "r", sourceName: "foo.r", sourceContent: "# Databricks notebook source\nprint('foo')", jupyterName: "foo.ipynb", }, { language: "scala", sourceName: "foo.scala", sourceContent: "// Databricks notebook source\nprintln('foo')", jupyterName: "foo.ipynb", }, { language: "sql", sourceName: "foo.sql", sourceContent: "-- Databricks notebook source\nselect 'foo'", jupyterName: "foo.ipynb", }, } { t.Run("source_"+tc.language, func(t *testing.T) { t.Parallel() ctx := context.Background() wf, _ := setupWsfsExtensionsFiler(t) err := wf.Write(ctx, tc.sourceName, strings.NewReader(tc.sourceContent)) require.NoError(t, err) // Assert on the content of the source notebook that's been written. filerTest{t, wf}.assertContents(ctx, tc.sourceName, tc.sourceContent) // Ensure that the source notebook is not read when the name contains // the .ipynb extension. _, err = wf.Stat(ctx, tc.jupyterName) assert.ErrorIs(t, err, fs.ErrNotExist) _, err = wf.Read(ctx, tc.jupyterName) assert.ErrorIs(t, err, fs.ErrNotExist) err = wf.Delete(ctx, tc.jupyterName) assert.ErrorIs(t, err, fs.ErrNotExist) }) } // Case 2: Writing Jupyter notebooks. for _, tc := range []struct { language string sourceName string jupyterName string jupyterContent string }{ { language: "python", sourceName: "foo.py", jupyterName: "foo.ipynb", jupyterContent: readFile(t, "testdata/notebooks/py1.ipynb"), }, { language: "r", sourceName: "foo.r", jupyterName: "foo.ipynb", jupyterContent: readFile(t, "testdata/notebooks/r1.ipynb"), }, { language: "scala", sourceName: "foo.scala", jupyterName: "foo.ipynb", jupyterContent: readFile(t, "testdata/notebooks/scala1.ipynb"), }, { language: "sql", sourceName: "foo.sql", jupyterName: "foo.ipynb", jupyterContent: readFile(t, "testdata/notebooks/sql1.ipynb"), }, } { t.Run("jupyter_"+tc.language, func(t *testing.T) { t.Parallel() ctx := context.Background() wf, _ := setupWsfsExtensionsFiler(t) err := wf.Write(ctx, tc.jupyterName, strings.NewReader(tc.jupyterContent)) require.NoError(t, err) // Assert that the written notebook is jupyter and has the correct // language_info metadata set. filerTest{t, wf}.assertContentsJupyter(ctx, tc.jupyterName, tc.language) // Ensure that the Jupyter notebook is not read when the name does not // contain the .ipynb extension. _, err = wf.Stat(ctx, tc.sourceName) assert.ErrorIs(t, err, fs.ErrNotExist) _, err = wf.Read(ctx, tc.sourceName) assert.ErrorIs(t, err, fs.ErrNotExist) err = wf.Delete(ctx, tc.sourceName) assert.ErrorIs(t, err, fs.ErrNotExist) }) } }