You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@dolphinscheduler.apache.org by zh...@apache.org on 2022/01/04 02:09:48 UTC
[dolphinscheduler] branch dev updated: [python] Add test for examples (#7759)
This is an automated email from the ASF dual-hosted git repository.
zhongjiajie pushed a commit to branch dev
in repository https://gitbox.apache.org/repos/asf/dolphinscheduler.git
The following commit(s) were added to refs/heads/dev by this push:
new f324b2f [python] Add test for examples (#7759)
f324b2f is described below
commit f324b2f88408d8a8b348fbd5ef3bd5686508c5e3
Author: Jiajie Zhong <zh...@hotmail.com>
AuthorDate: Tue Jan 4 10:09:38 2022 +0800
[python] Add test for examples (#7759)
* Make sure all files have the `.py` extension and all file names
end with "_example"
* Make sure all examples have `__doc__`
* Make sure there are no duplicate process definition names
* Make sure each process definition name is the same as its filename
close: #7729
---
.../{bulk_create.py => bulk_create_example.py} | 0
.../examples/task_datax_example.py | 2 +-
.../examples/task_dependent_example.py | 2 +-
.../examples/task_switch_example.py | 2 +-
.../pydolphinscheduler/tests/example/__init__.py | 18 +++
.../tests/example/test_example.py | 159 +++++++++++++++++++++
6 files changed, 180 insertions(+), 3 deletions(-)
diff --git a/dolphinscheduler-python/pydolphinscheduler/examples/bulk_create.py b/dolphinscheduler-python/pydolphinscheduler/examples/bulk_create_example.py
similarity index 100%
rename from dolphinscheduler-python/pydolphinscheduler/examples/bulk_create.py
rename to dolphinscheduler-python/pydolphinscheduler/examples/bulk_create_example.py
diff --git a/dolphinscheduler-python/pydolphinscheduler/examples/task_datax_example.py b/dolphinscheduler-python/pydolphinscheduler/examples/task_datax_example.py
index c9ca80c..1832921 100644
--- a/dolphinscheduler-python/pydolphinscheduler/examples/task_datax_example.py
+++ b/dolphinscheduler-python/pydolphinscheduler/examples/task_datax_example.py
@@ -32,7 +32,7 @@ from pydolphinscheduler.tasks.datax import CustomDataX, DataX
JSON_TEMPLATE = ""
with ProcessDefinition(
- name="task_datax",
+ name="task_datax_example",
tenant="tenant_exists",
) as pd:
# This task synchronizes the data in `t_ds_project`
diff --git a/dolphinscheduler-python/pydolphinscheduler/examples/task_dependent_example.py b/dolphinscheduler-python/pydolphinscheduler/examples/task_dependent_example.py
index 68f2a57..73b91aa 100644
--- a/dolphinscheduler-python/pydolphinscheduler/examples/task_dependent_example.py
+++ b/dolphinscheduler-python/pydolphinscheduler/examples/task_dependent_example.py
@@ -49,7 +49,7 @@ with ProcessDefinition(
pd.submit()
with ProcessDefinition(
- name="task_dependent",
+ name="task_dependent_example",
tenant="tenant_exists",
) as pd:
task = Dependent(
diff --git a/dolphinscheduler-python/pydolphinscheduler/examples/task_switch_example.py b/dolphinscheduler-python/pydolphinscheduler/examples/task_switch_example.py
index 5ab2aa5..b47b8e3 100644
--- a/dolphinscheduler-python/pydolphinscheduler/examples/task_switch_example.py
+++ b/dolphinscheduler-python/pydolphinscheduler/examples/task_switch_example.py
@@ -34,7 +34,7 @@ from pydolphinscheduler.tasks.shell import Shell
from pydolphinscheduler.tasks.switch import Branch, Default, Switch, SwitchCondition
with ProcessDefinition(
- name="task_dependent_external",
+ name="task_switch_example",
tenant="tenant_exists",
) as pd:
parent = Shell(name="parent", command="echo parent")
diff --git a/dolphinscheduler-python/pydolphinscheduler/tests/example/__init__.py b/dolphinscheduler-python/pydolphinscheduler/tests/example/__init__.py
new file mode 100644
index 0000000..49323e7
--- /dev/null
+++ b/dolphinscheduler-python/pydolphinscheduler/tests/example/__init__.py
@@ -0,0 +1,18 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements. See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership. The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License. You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied. See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+"""Init example package tests."""
diff --git a/dolphinscheduler-python/pydolphinscheduler/tests/example/test_example.py b/dolphinscheduler-python/pydolphinscheduler/tests/example/test_example.py
new file mode 100644
index 0000000..bf980ed
--- /dev/null
+++ b/dolphinscheduler-python/pydolphinscheduler/tests/example/test_example.py
@@ -0,0 +1,159 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements. See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership. The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License. You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied. See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+"""Test example."""
+
+import ast
+import importlib
+
+# import os
+# import os
+from pathlib import Path
+from unittest.mock import patch
+
+import pytest
+
+from tests.testing.task import Task
+
+# Names of the process definitions recorded by the mocked ``submit`` side effects below.
+process_definition_name = set()
+
+
+def get_all_example_define():
+    """Return a lazy iterable over the regular files of the ``examples`` directory.
+
+    The directory is resolved relative to this test file: three levels up, then
+    ``examples``. Entries for which ``is_file()`` is false are skipped.
+    """
+    base_dir = Path(__file__).parent.parent.parent
+    examples_dir = base_dir / "examples"
+    return (entry for entry in examples_dir.iterdir() if entry.is_file())
+
+
+def import_module(script_name, script_path):
+    """Import and run an example module from the examples directory.
+
+    :param script_name: name given to the created module object.
+    :param script_path: file system path of the python script to execute.
+    :return: the module object after its top-level code has been executed.
+    :raises ImportError: if no import spec or loader can be built for ``script_path``.
+    """
+    # ``import importlib`` alone does not guarantee that the ``importlib.util`` submodule
+    # is loaded, so import it explicitly instead of relying on another package doing so.
+    import importlib.util
+
+    spec = importlib.util.spec_from_file_location(script_name, script_path)
+    if spec is None or spec.loader is None:
+        # Fail with a clear message instead of an AttributeError on ``None`` further down.
+        raise ImportError(
+            f"Can not load example {script_name} from path {script_path}."
+        )
+    module = importlib.util.module_from_spec(spec)
+    spec.loader.exec_module(module)
+    return module
+
+
+@pytest.fixture(autouse=True)
+def setup_and_teardown_for_stuff():
+    """Reset the recorded process definition names after every test in this module.
+
+    The fixture is ``autouse`` because no test in this module requests it by name;
+    without that the teardown below would never run and the names recorded by one
+    test would leak into the next one.
+    """
+    yield
+    # Teardown: empty the module-level set in place, so no ``global`` rebinding is needed.
+    process_definition_name.clear()
+
+
+def submit_check_without_same_name(self):
+    """Side effect for the mocked ``submit`` which rejects duplicate names.
+
+    The name is recorded in ``process_definition_name`` when it has not been seen before.
+
+    :param self: the object whose ``submit`` is mocked; only its ``name`` attribute is read.
+    :raises ValueError: if ``self.name`` is already in ``process_definition_name``.
+    """
+    if self.name in process_definition_name:
+        # Format the message eagerly: unlike logging calls, exceptions do not apply
+        # ``%s`` placeholders to additional positional arguments.
+        raise ValueError(
+            "Example process definition should not have same name, "
+            f"but get duplicate name: {self.name}"
+        )
+    submit_add_process_definition(self)
+
+
+def submit_add_process_definition(self):
+    """Record ``self.name`` in the module-level ``process_definition_name`` set."""
+    submitted_name = self.name
+    process_definition_name.add(submitted_name)
+
+
+def test_example_basic():
+    """Test example basic information.
+
+    Which including:
+    * File extension name is `.py`
+    * All examples except `tutorial.py` end with keyword "_example"
+    * All examples must have a non-empty `__doc__`.
+    """
+    for ex in get_all_example_define():
+        # All files in the examples directory are python scripts
+        assert (
+            ex.suffix == ".py"
+        ), f"We expect all examples is python script, but get {ex.name}."
+
+        # All except tutorial end with keyword "_example"
+        if ex.stem != "tutorial":
+            assert ex.stem.endswith(
+                "_example"
+            ), f"We expect all examples script end with keyword '_example', but get {ex.stem}."
+
+        # Read with an explicit encoding so parsing does not depend on the platform default
+        tree = ast.parse(ex.read_text(encoding="utf-8"))
+        example_doc = ast.get_docstring(tree, clean=False)
+        # ``ast.get_docstring`` returns ``None`` when the docstring is missing; an empty
+        # or blank docstring must be rejected as well to match the rule stated above
+        assert (
+            example_doc is not None and example_doc.strip()
+        ), f"We expect all examples have __doc__, but {ex.name} do not."
+
+
+@patch("pydolphinscheduler.core.process_definition.ProcessDefinition.start")
+@patch(
+    "pydolphinscheduler.core.process_definition.ProcessDefinition.submit",
+    side_effect=submit_check_without_same_name,
+    autospec=True,
+)
+@patch(
+    "pydolphinscheduler.core.task.Task.gen_code_and_version",
+    # Example bulk_create_example.py would create workflow dynamic by :func:`get_one_task_by_name`
+    # and would raise error in :func:`get_one_task_by_name` if we return constant value
+    # using :arg:`return_value`
+    side_effect=Task("test_example", "test_example").gen_code_and_version,
+)
+def test_example_process_definition_without_same_name(
+    mock_code_version, mock_submit, mock_start
+):
+    """Test all examples file without same process definition's name.
+
+    Our process definition would compete with others if we have same process definition name. It will make
+    different between actually workflow and our workflow-as-code file which make users feel strange.
+
+    The test passes when every example can be imported without the mocked ``submit``
+    raising ``ValueError`` for a duplicate name.
+    """
+    # Start from an empty record, so names left behind by a previously executed test
+    # can not be reported as duplicates and the result does not depend on test order
+    process_definition_name.clear()
+    for ex in get_all_example_define():
+        # We use side_effect `submit_check_without_same_name` overwrite :func:`submit`
+        # and check whether it have duplicate name or not
+        import_module(ex.name, str(ex))
+
+
+@patch("pydolphinscheduler.core.process_definition.ProcessDefinition.start")
+@patch(
+    "pydolphinscheduler.core.process_definition.ProcessDefinition.submit",
+    side_effect=submit_add_process_definition,
+    autospec=True,
+)
+@patch(
+    "pydolphinscheduler.core.task.Task.gen_code_and_version",
+    # Example bulk_create_example.py would create workflow dynamic by :func:`get_one_task_by_name`
+    # and would raise error in :func:`get_one_task_by_name` if we return constant value
+    # using :arg:`return_value`
+    side_effect=Task("test_example", "test_example").gen_code_and_version,
+)
+def test_file_name_in_process_definition(mock_code_version, mock_submit, mock_start):
+    """Test example file name in example definition name.
+
+    We should not directly assert equal, because some of the examples contain
+    more than one process definition.
+    """
+    try:
+        for ex in get_all_example_define():
+            # Skip bulk_create_example check, cause it contain multiple workflow and
+            # without one named bulk_create_example
+            if ex.stem == "bulk_create_example":
+                continue
+            # Forget the names recorded for the previous example, so the assertion
+            # only sees the names submitted by the example imported right now
+            process_definition_name.clear()
+            import_module(ex.name, str(ex))
+            assert ex.stem in process_definition_name, (
+                f"We expect example {ex.name} submit a process definition named {ex.stem}, "
+                f"but get {sorted(process_definition_name)}."
+            )
+    finally:
+        # Do not leave the names of the last example behind for tests running afterwards
+        process_definition_name.clear()