From 37d677c079bc86d55f188e0ae1a659837fcbeca8 Mon Sep 17 00:00:00 2001 From: Gleb Kanterov Date: Wed, 25 Sep 2024 16:11:58 +0200 Subject: [PATCH 1/5] PythonMutator: Add tests for import --- .../dataclass_no_wheel/databricks.yml | 15 +++ .../notebooks/my_notebook.py | 2 + .../dataclass_no_wheel/src/my_job.py | 22 +++++ bundle/tests/python_import_test.go | 95 +++++++++++++++++++ 4 files changed, 134 insertions(+) create mode 100644 bundle/tests/python_import/dataclass_no_wheel/databricks.yml create mode 100644 bundle/tests/python_import/dataclass_no_wheel/notebooks/my_notebook.py create mode 100644 bundle/tests/python_import/dataclass_no_wheel/src/my_job.py create mode 100644 bundle/tests/python_import_test.go diff --git a/bundle/tests/python_import/dataclass_no_wheel/databricks.yml b/bundle/tests/python_import/dataclass_no_wheel/databricks.yml new file mode 100644 index 0000000000..a2531e1228 --- /dev/null +++ b/bundle/tests/python_import/dataclass_no_wheel/databricks.yml @@ -0,0 +1,15 @@ +bundle: + name: python-import-dataclass-no-wheel + +experimental: + pydabs: + enabled: true + import: + - "my_job" + +variables: + default_cluster_spec: + type: complex + value: + num_workers: 1 + spark_version: "15.4.x-scala2.12" diff --git a/bundle/tests/python_import/dataclass_no_wheel/notebooks/my_notebook.py b/bundle/tests/python_import/dataclass_no_wheel/notebooks/my_notebook.py new file mode 100644 index 0000000000..8d8fcd56f7 --- /dev/null +++ b/bundle/tests/python_import/dataclass_no_wheel/notebooks/my_notebook.py @@ -0,0 +1,2 @@ +# Databricks Notebook Source +1+1 diff --git a/bundle/tests/python_import/dataclass_no_wheel/src/my_job.py b/bundle/tests/python_import/dataclass_no_wheel/src/my_job.py new file mode 100644 index 0000000000..15896296ad --- /dev/null +++ b/bundle/tests/python_import/dataclass_no_wheel/src/my_job.py @@ -0,0 +1,22 @@ +from databricks.bundles.jobs import Job, Task, NotebookTask, JobCluster +from databricks.bundles.variables import Bundle + +my_job = Job( + name="Test Job", + resource_name="my_job", + job_clusters=[ + JobCluster( + job_cluster_key="my_cluster", + new_cluster=Bundle.variables.default_cluster_spec, + ), + ], + tasks=[ + Task( + task_key="my_notebook_task", + job_cluster_key="my_cluster", + notebook_task=NotebookTask( + notebook_path="notebooks/my_notebook.py", + ), + ), + ], +) diff --git a/bundle/tests/python_import_test.go b/bundle/tests/python_import_test.go new file mode 100644 index 0000000000..d99991d1d4 --- /dev/null +++ b/bundle/tests/python_import_test.go @@ -0,0 +1,95 @@ +package config_tests + +import ( + "os" + "os/exec" + pathlib "path" + "runtime" + "testing" + + "github.com/databricks/cli/bundle/config/resources" + "github.com/databricks/cli/libs/dyn" + "github.com/databricks/databricks-sdk-go/service/jobs" + "github.com/stretchr/testify/require" + "golang.org/x/exp/maps" + + "github.com/stretchr/testify/assert" +) + +func TestDataclassNoWheel(t *testing.T) { + activateVEnv(t) + setPythonPath(t, "python_import/dataclass_no_wheel/src") + + expected := &resources.Job{ + JobSettings: &jobs.JobSettings{ + Name: "Test Job", + JobClusters: []jobs.JobCluster{ + { + JobClusterKey: "my_cluster", + }, + }, + Tasks: []jobs.Task{ + { + NotebookTask: &jobs.NotebookTask{ + NotebookPath: "notebooks/my_notebook.py", + }, + JobClusterKey: "my_cluster", + TaskKey: "my_notebook_task", + }, + }, + }, + } + + b := load(t, "./python_import/dataclass_no_wheel") + + assert.Equal(t, []string{"my_job"}, maps.Keys(b.Config.Resources.Jobs)) + + myJob := b.Config.Resources.Jobs["my_job"] + assert.Equal(t, expected, myJob) + + // NewCluster is reference to a variable and needs to be checked separately + err := b.Config.Mutate(func(value dyn.Value) (dyn.Value, error) { + path := dyn.MustPathFromString("resources.jobs.my_job.job_clusters[0].new_cluster") + value, err := dyn.GetByPath(value, path) + if err != nil { + return dyn.InvalidValue, err + } + + assert.Equal(t, "${var.default_cluster_spec}", value.AsAny()) + + return value, nil + }) + require.NoError(t, err) +} + +func setPythonPath(t *testing.T, path string) { + wd, err := os.Getwd() + require.NoError(t, err) + t.Setenv("PYTHONPATH", pathlib.Join(wd, path)) +} + +func activateVEnv(t *testing.T) { + dir := t.TempDir() + venvDir := pathlib.Join(dir, "venv") + + err := exec.Command("python3", "-m", "venv", venvDir).Run() + require.NoError(t, err) + + // we don't have shell to activate venv, updating PATH is enough + + var venvBinDir string + if runtime.GOOS == "Windows" { + venvBinDir = pathlib.Join(venvDir, "Scripts") + t.Setenv("PATH", venvBinDir+";"+os.Getenv("PATH")) + } else { + venvBinDir = pathlib.Join(venvDir, "bin") + t.Setenv("PATH", venvBinDir+":"+os.Getenv("PATH")) + } + + err = exec.Command( + pathlib.Join(venvBinDir, "pip"), + "install", + "databricks-pydabs==0.5.1", + ).Run() + require.NoError(t, err) +} From 6fd701ec849dbfc6ee9ca9fad787f208c5674d60 Mon Sep 17 00:00:00 2001 From: Gleb Kanterov Date: Wed, 25 Sep 2024 16:24:59 +0200 Subject: [PATCH 2/5] Bump python version --- .github/workflows/push.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/push.yml b/.github/workflows/push.yml index 02bf73784d..b9859508e8 100644 --- a/.github/workflows/push.yml +++ b/.github/workflows/push.yml @@ -38,7 +38,7 @@ jobs: - name: Setup Python uses: actions/setup-python@v5 with: - python-version: '3.9' + python-version: '3.10' - name: Set go env run: | From 55c36bc2fac28b475e7cab170e11efeb3749884e Mon Sep 17 00:00:00 2001 From: Gleb Kanterov Date: Wed, 25 Sep 2024 16:25:52 +0200 Subject: [PATCH 3/5] Better error messages --- bundle/tests/python_import_test.go | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/bundle/tests/python_import_test.go b/bundle/tests/python_import_test.go index d99991d1d4..f2093cebee 100644 --- a/bundle/tests/python_import_test.go +++ b/bundle/tests/python_import_test.go @@ -73,7 +73,7 @@ func activateVEnv(t *testing.T) { venvDir := pathlib.Join(dir, "venv") err := exec.Command("python3", "-m", "venv", venvDir).Run() - require.NoError(t, err) + require.NoError(t, err, "failed to create venv") // we don't have shell to activate venv, updating PATH is enough @@ -91,5 +91,5 @@ func activateVEnv(t *testing.T) { "install", "databricks-pydabs==0.5.1", ).Run() - require.NoError(t, err) + require.NoError(t, err, "failed to install databricks-pydabs") } From 6b4641c53032f1b54fd949aaceeddb903626965b Mon Sep 17 00:00:00 2001 From: Gleb Kanterov Date: Wed, 25 Sep 2024 16:28:13 +0200 Subject: [PATCH 4/5] Fix test name --- bundle/tests/python_import_test.go | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/bundle/tests/python_import_test.go b/bundle/tests/python_import_test.go index f2093cebee..e7ac54596f 100644 --- a/bundle/tests/python_import_test.go +++ b/bundle/tests/python_import_test.go @@ -16,7 +16,7 @@ import ( "github.com/stretchr/testify/assert" ) -func TestDataclassNoWheel(t *testing.T) { +func TestPythonImport_dataclass_no_wheel(t *testing.T) { activateVEnv(t) setPythonPath(t, "python_import/dataclass_no_wheel/src") From bbcbffd7f4104b126a60fb80964773189b603f8c Mon Sep 17 00:00:00 2001 From: Gleb Kanterov Date: Wed, 25 Sep 2024 16:35:28 +0200 Subject: [PATCH 5/5] Fix windows --- bundle/tests/python_import_test.go | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/bundle/tests/python_import_test.go b/bundle/tests/python_import_test.go index e7ac54596f..ff6dd632d4 100644 --- a/bundle/tests/python_import_test.go +++ b/bundle/tests/python_import_test.go @@ -78,7 +78,7 @@ func activateVEnv(t *testing.T) { // we don't have shell to activate venv, updating PATH is enough var venvBinDir string - if runtime.GOOS == "Windows" { + if runtime.GOOS == "windows" { venvBinDir = pathlib.Join(venvDir, "Scripts") t.Setenv("PATH", venvBinDir+";"+os.Getenv("PATH")) } else {