package notebook import ( "errors" "io/fs" "os" "path/filepath" "testing" "github.com/databricks/databricks-sdk-go/service/workspace" "github.com/stretchr/testify/assert" "github.com/stretchr/testify/require" ) func TestDetectSource(t *testing.T) { var nb bool var lang workspace.Language var err error nb, lang, err = Detect("./testdata/py_source.py") require.NoError(t, err) assert.True(t, nb) assert.Equal(t, workspace.LanguagePython, lang) nb, lang, err = Detect("./testdata/r_source.r") require.NoError(t, err) assert.True(t, nb) assert.Equal(t, workspace.LanguageR, lang) nb, lang, err = Detect("./testdata/scala_source.scala") require.NoError(t, err) assert.True(t, nb) assert.Equal(t, workspace.LanguageScala, lang) nb, lang, err = Detect("./testdata/sql_source.sql") require.NoError(t, err) assert.True(t, nb) assert.Equal(t, workspace.LanguageSql, lang) nb, lang, err = Detect("./testdata/txt.txt") require.NoError(t, err) assert.False(t, nb) assert.Equal(t, workspace.Language(""), lang) } func TestDetectCallsDetectJupyter(t *testing.T) { nb, lang, err := Detect("./testdata/py_ipynb.ipynb") require.NoError(t, err) assert.True(t, nb) assert.Equal(t, workspace.LanguagePython, lang) } func TestDetectUnknownExtension(t *testing.T) { _, _, err := Detect("./testdata/doesntexist.foobar") assert.True(t, errors.Is(err, fs.ErrNotExist)) nb, _, err := Detect("./testdata/unknown_extension.foobar") require.NoError(t, err) assert.False(t, nb) } func TestDetectNoExtension(t *testing.T) { _, _, err := Detect("./testdata/doesntexist") assert.True(t, errors.Is(err, fs.ErrNotExist)) nb, _, err := Detect("./testdata/no_extension") require.NoError(t, err) assert.False(t, nb) } func TestDetectFileDoesNotExists(t *testing.T) { _, _, err := Detect("./testdata/doesntexist.py") require.Error(t, err) } func TestDetectEmptyFile(t *testing.T) { // Create empty file. dir := t.TempDir() path := filepath.Join(dir, "file.py") err := os.WriteFile(path, nil, 0644) require.NoError(t, err) // No contents means not a notebook. nb, _, err := Detect(path) require.NoError(t, err) assert.False(t, nb) } func TestDetectFileWithLongHeader(t *testing.T) { // Create 128kb garbage file. dir := t.TempDir() path := filepath.Join(dir, "file.py") buf := make([]byte, 128*1024) err := os.WriteFile(path, buf, 0644) require.NoError(t, err) // Garbage contents means not a notebook. nb, _, err := Detect(path) require.NoError(t, err) assert.False(t, nb) } func TestDetectWithObjectInfo(t *testing.T) { fakeFS := &fakeFS{ fakeFile{ fakeFileInfo{ workspace.ObjectInfo{ ObjectType: workspace.ObjectTypeNotebook, Language: workspace.LanguagePython, }, }, }, } nb, lang, err := DetectWithFS(fakeFS, "doesntmatter") require.NoError(t, err) assert.True(t, nb) assert.Equal(t, workspace.LanguagePython, lang) } func TestInMemoryFiles(t *testing.T) { isNotebook, language, err := DetectWithContent("hello.py", []byte("# Databricks notebook source\n print('hello')")) assert.True(t, isNotebook) assert.Equal(t, workspace.LanguagePython, language) require.NoError(t, err) isNotebook, language, err = DetectWithContent("hello.py", []byte("print('hello')")) assert.False(t, isNotebook) assert.Equal(t, workspace.Language(""), language) require.NoError(t, err) fileContent, err := os.ReadFile("./testdata/py_ipynb.ipynb") require.NoError(t, err) isNotebook, language, err = DetectWithContent("py_ipynb.ipynb", fileContent) assert.True(t, isNotebook) assert.Equal(t, workspace.LanguagePython, language) require.NoError(t, err) }