Test Tools > Validators

`TestValidateSublists`

Source code in tests/tools/test_validators.py

class TestValidateSublists:
    """Test cases exercising ``validate_sublists``."""

    def test_equal_elements_and_order(
        self,
        list_with_equal_elements_equal_order,
    ):
        """Accept sublists whose elements and ordering are identical.

        Parameters
        ----------
        list_with_equal_elements_equal_order : list
            Sublists supplied by the fixture of the same name.

        Asserts
        -------
        ``validate_sublists`` returns a truthy value for the input.
        """
        outcome = validate_sublists(list_with_equal_elements_equal_order)
        assert outcome

    def test_equal_elements_and_different_order(
        self,
        list_with_equal_elements_different_order,
    ):
        """Accept sublists whose elements match but are ordered differently.

        Parameters
        ----------
        list_with_equal_elements_different_order : list
            Sublists supplied by the fixture of the same name.

        Asserts
        -------
        ``validate_sublists`` returns a truthy value even though the
        sublists are not in the same order.
        """
        outcome = validate_sublists(list_with_equal_elements_different_order)
        assert outcome

    def test_unequal_elements(self, list_with_unequal_elements):
        """Reject sublists that do not contain the same elements.

        Parameters
        ----------
        list_with_unequal_elements : list
            Sublists supplied by the fixture of the same name.

        Asserts
        -------
        ``validate_sublists`` raises ``ValueError`` and the error text
        contains the expected message.
        """
        expected_fragment = "Sublists do not have the same elements."

        with pytest.raises(ValueError) as raised:
            validate_sublists(list_with_unequal_elements)

        assert expected_fragment in str(raised.value)

    def test_unequal_elements_and_unbalance(
        self,
        list_with_unequal_elements_and_unbalance,
    ):
        """Reject sublists that differ in both elements and length.

        Parameters
        ----------
        list_with_unequal_elements_and_unbalance : list
            Sublists supplied by the fixture of the same name.

        Asserts
        -------
        ``validate_sublists`` raises ``ValueError`` and the error text
        contains the expected message.
        """
        expected_fragment = "Sublists do not have the same elements."

        with pytest.raises(ValueError) as raised:
            validate_sublists(list_with_unequal_elements_and_unbalance)

        assert expected_fragment in str(raised.value)

`test_equal_elements_and_different_order(list_with_equal_elements_different_order)`

Verify validate_sublists function with lists having identical elements in different orders.

Parameters

list_with_equal_elements_different_order : list — Input provided by a fixture.

Asserts

The function returns True for lists with identical elements regardless of their order.

Source code in tests/tools/test_validators.py

def test_equal_elements_and_different_order(
    self,
    list_with_equal_elements_different_order,
):
    """Accept sublists whose elements match but are ordered differently.

    Parameters
    ----------
    list_with_equal_elements_different_order : list
        Input provided by a fixture.

    Asserts
    -------
    ``validate_sublists`` returns a truthy value even though the
    sublists are not in the same order.
    """
    outcome = validate_sublists(list_with_equal_elements_different_order)
    assert outcome

`test_equal_elements_and_order(list_with_equal_elements_equal_order)`

Verify validate_sublists function with lists having identical elements in the same order.

Parameters

list_with_equal_elements_equal_order : list — Input provided by a fixture.

Asserts

The function returns True for lists with identical elements and order.

Source code in tests/tools/test_validators.py

def test_equal_elements_and_order(
    self,
    list_with_equal_elements_equal_order,
):
    """Accept sublists whose elements and ordering are identical.

    Parameters
    ----------
    list_with_equal_elements_equal_order : list
        Input provided by a fixture.

    Asserts
    -------
    ``validate_sublists`` returns a truthy value for the input.
    """
    outcome = validate_sublists(list_with_equal_elements_equal_order)
    assert outcome

`test_unequal_elements(list_with_unequal_elements)`

Verify validate_sublists function with lists having different elements.

Parameters

list_with_unequal_elements : list — Input provided by a fixture.

Asserts

The function raises a ValueError for lists with differing elements.

Source code in tests/tools/test_validators.py

def test_unequal_elements(self, list_with_unequal_elements):
    """Reject sublists that do not contain the same elements.

    Parameters
    ----------
    list_with_unequal_elements : list
        Input provided by a fixture.

    Asserts
    -------
    ``validate_sublists`` raises ``ValueError`` and the error text
    contains the expected message.
    """
    expected_fragment = "Sublists do not have the same elements."

    with pytest.raises(ValueError) as raised:
        validate_sublists(list_with_unequal_elements)

    assert expected_fragment in str(raised.value)

`test_unequal_elements_and_unbalance(list_with_unequal_elements_and_unbalance)`

Verify validate_sublists function with lists having different elements and lengths.

Parameters

list_with_unequal_elements_and_unbalance : list — Input provided by a fixture.

Asserts

The function raises a ValueError for lists with differing elements and lengths.

Source code in tests/tools/test_validators.py

def test_unequal_elements_and_unbalance(
    self,
    list_with_unequal_elements_and_unbalance,
):
    """Reject sublists that differ in both elements and length.

    Parameters
    ----------
    list_with_unequal_elements_and_unbalance : list
        Input provided by a fixture.

    Asserts
    -------
    ``validate_sublists`` raises ``ValueError`` and the error text
    contains the expected message.
    """
    expected_fragment = "Sublists do not have the same elements."

    with pytest.raises(ValueError) as raised:
        validate_sublists(list_with_unequal_elements_and_unbalance)

    assert expected_fragment in str(raised.value)

`list_with_equal_elements_different_order()`

Provide a list where sublists have identical elements in different orders.

Returns

list — A list of sublists with equal elements in varying order.

Source code in tests/tools/test_validators.py

@pytest.fixture()
def list_with_equal_elements_different_order():
    """Build two sublists holding the same elements in reversed order.

    Returns
    -------
    list
        ``[["A", "B"], ["B", "A"]]``.
    """
    forward = ["A", "B"]
    backward = ["B", "A"]
    return [forward, backward]

`list_with_equal_elements_equal_order()`

Provide a list where sublists have identical elements in the same order.

Returns

list — A list of sublists with equal elements in identical order.

Source code in tests/tools/test_validators.py

@pytest.fixture()
def list_with_equal_elements_equal_order():
    """Build two sublists holding the same elements in the same order.

    Returns
    -------
    list
        ``[["A", "B"], ["A", "B"]]``.
    """
    # Two separate literals so the sublists are distinct objects.
    first = ["A", "B"]
    second = ["A", "B"]
    return [first, second]

`list_with_unequal_elements()`

Provide a list where sublists have different elements.

Returns

list — A list of sublists with unequal elements.

Source code in tests/tools/test_validators.py

@pytest.fixture()
def list_with_unequal_elements():
    """Build two equally long sublists whose elements differ.

    Returns
    -------
    list
        ``[["A", "B"], ["C", "A"]]``.
    """
    first = ["A", "B"]
    second = ["C", "A"]
    return [first, second]

`list_with_unequal_elements_and_unbalance()`

Provide a list where sublists have different elements and lengths.

Returns

list — A list of sublists with unequal elements and varying lengths.

Source code in tests/tools/test_validators.py

@pytest.fixture()
def list_with_unequal_elements_and_unbalance():
    """Build two sublists that differ in both elements and length.

    Returns
    -------
    list
        ``[["A", "B", "C"], ["C", "A"]]``.
    """
    longer = ["A", "B", "C"]
    shorter = ["C", "A"]
    return [longer, shorter]

`test_data_validation(tmp_path_factory, data_raw, file_name_log, data_schema, data_clean)`

Validate the functionality of validate_data_quality.

This test iterates through a series of predefined datasets, including both valid and invalid data, to verify the data quality validation process. It checks whether the function correctly processes valid data, identifies invalid data, and logs errors as expected.

Parameters

- tmp_path_factory : _pytest.tmpdir.TempPathFactory — A fixture provided by pytest to create temporary directories.
- data_raw : dict — The raw data dictionary to be validated. Represents a single row of data intended for processing by the validate_data_quality function.
- file_name_log : str — The name of the log file used to record validation errors.
- data_schema : BaseModel — The Pydantic model that the raw data is validated against.
- data_clean : list — The expected processed data outcome from the validation function, for comparison with the actual result.

Asserts

Asserts that the processed data matches the expected data_clean list. Additionally, it checks if the log file's existence aligns with the presence of invalid data, ensuring that logs are created only when there are validation errors.

Source code in tests/tools/test_validators.py

@pytest.mark.parametrize(
    "data_raw, file_name_log, data_schema, data_clean",
    data_for_validation_parameters,
)
def test_data_validation(
    tmp_path_factory,
    data_raw,
    file_name_log,
    data_schema,
    data_clean,
):
    """Run validate_data_quality on one row and check records and log file.

    Each parametrized case wraps ``data_raw`` in a single-row string
    DataFrame, passes it through ``validate_data_quality`` and compares
    the values of the first yielded record with ``data_clean``. A case
    that yields no record is treated as invalid data, and only then is
    the log file expected to exist.

    Parameters
    ----------
    tmp_path_factory : _pytest.tmpdir.TempPathFactory
        Pytest fixture used to create the temporary output directory.
    data_raw : dict
        Raw values for a single row, used to build the input DataFrame.
    file_name_log : str
        Log file name forwarded to ``validate_data_quality``.
    data_schema : BaseModel
        Schema forwarded to ``validate_data_quality``.
    data_clean : list
        Expected values of the first validated record; an empty list when
        no record is expected.

    Asserts
    -------
    The values of the first yielded record (or an empty list) equal
    ``data_clean``, and ``test_invalid_records.log`` exists in the output
    directory exactly when no record was yielded.
    """
    frame = pd.DataFrame(data_raw, index=[0], dtype=str)
    workdir = tmp_path_factory.mktemp("data_validation")

    # Materialise the result so it can be checked for emptiness and indexed.
    records = list(
        validate_data_quality(frame, str(workdir), file_name_log, data_schema),
    )

    # No yielded record means the row was rejected as invalid.
    is_bad_data = not records
    first_record_values = [] if is_bad_data else list(records[0].values())

    # NOTE(review): the log name is hard-coded rather than taken from
    # file_name_log; presumably every parametrized case uses this same
    # name -- confirm against data_for_validation_parameters.
    log_path = workdir / "test_invalid_records.log"

    assert first_record_values == data_clean
    assert os.path.exists(log_path) == is_bad_data