databricks-cli/libs/notebook/detect_test.go

139 lines
3.5 KiB
Go

package notebook
import (
"errors"
"io/fs"
"os"
"path/filepath"
"testing"
"github.com/databricks/databricks-sdk-go/service/workspace"
"github.com/stretchr/testify/assert"
"github.com/stretchr/testify/require"
)
func TestDetectSource(t *testing.T) {
var nb bool
var lang workspace.Language
var err error
nb, lang, err = Detect("./testdata/py_source.py")
require.NoError(t, err)
assert.True(t, nb)
assert.Equal(t, workspace.LanguagePython, lang)
nb, lang, err = Detect("./testdata/r_source.r")
require.NoError(t, err)
assert.True(t, nb)
assert.Equal(t, workspace.LanguageR, lang)
nb, lang, err = Detect("./testdata/scala_source.scala")
require.NoError(t, err)
assert.True(t, nb)
assert.Equal(t, workspace.LanguageScala, lang)
nb, lang, err = Detect("./testdata/sql_source.sql")
require.NoError(t, err)
assert.True(t, nb)
assert.Equal(t, workspace.LanguageSql, lang)
nb, lang, err = Detect("./testdata/txt.txt")
require.NoError(t, err)
assert.False(t, nb)
assert.Equal(t, workspace.Language(""), lang)
}
func TestDetectCallsDetectJupyter(t *testing.T) {
nb, lang, err := Detect("./testdata/py_ipynb.ipynb")
require.NoError(t, err)
assert.True(t, nb)
assert.Equal(t, workspace.LanguagePython, lang)
}
func TestDetectUnknownExtension(t *testing.T) {
_, _, err := Detect("./testdata/doesntexist.foobar")
assert.True(t, errors.Is(err, fs.ErrNotExist))
nb, _, err := Detect("./testdata/unknown_extension.foobar")
require.NoError(t, err)
assert.False(t, nb)
}
func TestDetectNoExtension(t *testing.T) {
_, _, err := Detect("./testdata/doesntexist")
assert.True(t, errors.Is(err, fs.ErrNotExist))
nb, _, err := Detect("./testdata/no_extension")
require.NoError(t, err)
assert.False(t, nb)
}
func TestDetectFileDoesNotExists(t *testing.T) {
_, _, err := Detect("./testdata/doesntexist.py")
require.Error(t, err)
}
func TestDetectEmptyFile(t *testing.T) {
// Create empty file.
dir := t.TempDir()
path := filepath.Join(dir, "file.py")
err := os.WriteFile(path, nil, 0644)
require.NoError(t, err)
// No contents means not a notebook.
nb, _, err := Detect(path)
require.NoError(t, err)
assert.False(t, nb)
}
func TestDetectFileWithLongHeader(t *testing.T) {
// Create 128kb garbage file.
dir := t.TempDir()
path := filepath.Join(dir, "file.py")
buf := make([]byte, 128*1024)
err := os.WriteFile(path, buf, 0644)
require.NoError(t, err)
// Garbage contents means not a notebook.
nb, _, err := Detect(path)
require.NoError(t, err)
assert.False(t, nb)
}
func TestDetectWithObjectInfo(t *testing.T) {
fakeFS := &fakeFS{
fakeFile{
fakeFileInfo{
workspace.ObjectInfo{
ObjectType: workspace.ObjectTypeNotebook,
Language: workspace.LanguagePython,
},
},
},
}
nb, lang, err := DetectWithFS(fakeFS, "doesntmatter")
require.NoError(t, err)
assert.True(t, nb)
assert.Equal(t, workspace.LanguagePython, lang)
}
func TestInMemoryFiles(t *testing.T) {
isNotebook, language, err := DetectWithContent("hello.py", []byte("# Databricks notebook source\n print('hello')"))
assert.True(t, isNotebook)
assert.Equal(t, workspace.LanguagePython, language)
require.NoError(t, err)
isNotebook, language, err = DetectWithContent("hello.py", []byte("print('hello')"))
assert.False(t, isNotebook)
assert.Equal(t, workspace.Language(""), language)
require.NoError(t, err)
fileContent, err := os.ReadFile("./testdata/py_ipynb.ipynb")
require.NoError(t, err)
isNotebook, language, err = DetectWithContent("py_ipynb.ipynb", fileContent)
assert.True(t, isNotebook)
assert.Equal(t, workspace.LanguagePython, language)
require.NoError(t, err)
}