Files
data-platform/tests/test_ops.py
2026-03-12 13:36:06 +00:00

139 lines
4.7 KiB
Python

"""Tests for Dagster ops — elementary and source freshness."""
from unittest.mock import patch
import pytest
from dagster import build_op_context
from data_platform.ops.check_source_freshness import (
SourceFreshnessConfig,
)
from data_platform.ops.elementary import (
_elementary_schema_exists,
elementary_generate_report,
elementary_run_models,
)
# SourceFreshnessConfig
class TestSourceFreshnessConfig:
def test_accepts_source_name(self):
cfg = SourceFreshnessConfig(source_name="raw_funda")
assert cfg.source_name == "raw_funda"
# _elementary_schema_exists
class TestElementarySchemaExists:
@patch("data_platform.resources._retry_on_operational_error")
@patch("data_platform.ops.elementary.create_engine")
def test_returns_true_when_schema_present(self, mock_create_engine, mock_retry):
mock_retry.return_value = True
with patch.dict(
"os.environ",
{
"POSTGRES_USER": "u",
"POSTGRES_PASSWORD": "p",
"POSTGRES_HOST": "localhost",
"POSTGRES_PORT": "5432",
"POSTGRES_DB": "db",
},
):
result = _elementary_schema_exists()
assert result is True
mock_create_engine.assert_called_once()
@patch("data_platform.resources._retry_on_operational_error")
@patch("data_platform.ops.elementary.create_engine")
def test_returns_false_when_schema_absent(self, mock_create_engine, mock_retry):
mock_retry.return_value = False
with patch.dict(
"os.environ",
{
"POSTGRES_USER": "u",
"POSTGRES_PASSWORD": "p",
"POSTGRES_HOST": "localhost",
"POSTGRES_PORT": "5432",
"POSTGRES_DB": "db",
},
):
result = _elementary_schema_exists()
assert result is False
# elementary_run_models
def _mock_popen(returncode=0, stdout_lines=None):
"""Create a mock Popen instance with streaming stdout."""
from unittest.mock import MagicMock
proc = MagicMock()
proc.stdout = iter(stdout_lines or [])
proc.wait.return_value = returncode
return proc
class TestElementaryRunModels:
@patch("data_platform.ops.elementary._elementary_schema_exists", return_value=True)
def test_skips_when_schema_exists(self, mock_exists):
context = build_op_context()
elementary_run_models(context)
mock_exists.assert_called_once()
@patch("data_platform.ops.elementary.subprocess.Popen")
@patch("data_platform.ops.elementary._elementary_schema_exists", return_value=False)
def test_runs_dbt_when_schema_missing(self, mock_exists, mock_popen):
mock_popen.return_value = _mock_popen(returncode=0, stdout_lines=["ok\n"])
context = build_op_context()
elementary_run_models(context)
mock_popen.assert_called_once()
args = mock_popen.call_args[0][0]
assert "dbt" in args
assert "run" in args
assert "elementary" in args
@patch("data_platform.ops.elementary.subprocess.Popen")
@patch("data_platform.ops.elementary._elementary_schema_exists", return_value=False)
def test_raises_on_dbt_failure(self, mock_exists, mock_popen):
mock_popen.return_value = _mock_popen(returncode=1, stdout_lines=["error\n"])
context = build_op_context()
with pytest.raises(Exception, match="dbt run elementary failed"):
elementary_run_models(context)
# elementary_generate_report
class TestElementaryGenerateReport:
@patch("data_platform.ops.elementary.subprocess.Popen")
def test_calls_edr_report(self, mock_popen):
mock_popen.return_value = _mock_popen(
returncode=0, stdout_lines=["report generated\n"]
)
context = build_op_context()
elementary_generate_report(context)
mock_popen.assert_called_once()
args = mock_popen.call_args[0][0]
assert "edr" in args
assert "report" in args
@patch("data_platform.ops.elementary.subprocess.Popen")
def test_raises_on_failure(self, mock_popen):
mock_popen.return_value = _mock_popen(
returncode=1, stdout_lines=["fatal error\n"]
)
context = build_op_context()
with pytest.raises(Exception, match="edr report failed"):
elementary_generate_report(context)
@patch("data_platform.ops.elementary.subprocess.Popen")
def test_success_returns_none(self, mock_popen):
mock_popen.return_value = _mock_popen(returncode=0, stdout_lines=["done\n"])
context = build_op_context()
result = elementary_generate_report(context)
assert result is None