ehrql / Git / [e988c2] /tests/integration/query_engines/test

Models:
philipB/
ehrql
Downloads: 1
[e988c2]: / tests / integration / query_engines / test_mssql.py
History
Download this file
89 lines (76 with data), 3.0 kB

import contextlib
from unittest import mock

import pytest
import sqlalchemy.sql
from sqlalchemy.engine import Connection
from sqlalchemy.exc import OperationalError, ProgrammingError

from ehrql.query_model.nodes import (
    AggregateByPatient,
    Column,
    Dataset,
    SelectColumn,
    SelectPatientTable,
    TableSchema,
)


def test_get_results_with_retries(mssql_engine):
    # Define a simple query and load some test data
    patient_table = SelectPatientTable("patients", TableSchema(i=Column(int)))
    dataset = Dataset(
        population=AggregateByPatient.Exists(patient_table),
        variables={"i": SelectColumn(patient_table, "i")},
        events={},
        measures=None,
    )
    mssql_engine.populate(
        {
            patient_table: [
                dict(patient_id=1, i=10),
                dict(patient_id=2, i=20),
            ]
        }
    )

    with wrap_select_queries() as select, mock.patch("time.sleep") as sleep:
        # We want the first two SELECT queries to fail but the third to succeed
        select.side_effect = [
            OperationalError("fail", None, None),
            OperationalError("fail again", None, None),
            None,
        ]

        results = mssql_engine.extract(dataset)

        assert results == [
            {"patient_id": 1, "i": 10},
            {"patient_id": 2, "i": 20},
        ]
        assert select.call_count == 3
        # We expect to sleep after each failure
        assert sleep.call_count == 2
        # Grab a reference to the SELECT query so we can use it later
        query = select.call_args[0][0]

    # Check that the table we were querying has now been cleaned up
    with mssql_engine.sqlalchemy_engine().connect() as conn:
        with pytest.raises(ProgrammingError, match="Invalid object name"):
            conn.execute(query)


@contextlib.contextmanager
def wrap_select_queries():
    """
    Intercept SELECT queries so we can track them, and optionally raise exceptions,
    while still calling the original database methods and passing the result through
    """
    original = Connection.execute
    mocked = mock.Mock()

    def wrapper(self, *args, **kwargs):
        if args and isinstance(args[0], sqlalchemy.sql.Select):
            try:
                mocked(*args, **kwargs)
            except Exception:
                # Simulate hitting a low-level error from the database driver which
                # causes SQLAlchemy to invalidate the connection. Ideally we would be
                # able to trigger a lower level error which causes SQLAlchemy to do this
                # itself. But I've tried and failed to do so, partly because the
                # `pymssql` driver we use is a compiled library and so less amenable to
                # monkey patching.
                self.invalidate()
                raise
        return original(self, *args, **kwargs)

    with mock.patch.object(Connection, "execute", wrapper):
        yield mocked