From bfed446a98ea3d8af4702d349315b465602e51fb Mon Sep 17 00:00:00 2001 From: Andrew Montanez Date: Fri, 28 Jul 2023 15:05:01 -0500 Subject: [PATCH 1/4] reorganizing tests and adding integration test --- tests/integration/single_table/test_base.py | 750 ---------------- .../single_table/test_constraints.py | 810 ++++++++++++++++++ 2 files changed, 810 insertions(+), 750 deletions(-) create mode 100644 tests/integration/single_table/test_constraints.py diff --git a/tests/integration/single_table/test_base.py b/tests/integration/single_table/test_base.py index 8e1b3706b..0176e477a 100644 --- a/tests/integration/single_table/test_base.py +++ b/tests/integration/single_table/test_base.py @@ -1,20 +1,15 @@ import datetime -from unittest.mock import patch -import numpy as np import pandas as pd import pkg_resources import pytest -from copulas.multivariate.gaussian import GaussianMultivariate from rdt.transformers import AnonymizedFaker, FloatFormatter, LabelEncoder, RegexGenerator -from sdv.datasets.demo import download_demo from sdv.metadata import SingleTableMetadata from sdv.sampling import Condition from sdv.single_table import ( CopulaGANSynthesizer, CTGANSynthesizer, GaussianCopulaSynthesizer, TVAESynthesizer) from sdv.single_table.base import BaseSingleTableSynthesizer -from tests.integration.single_table.custom_constraints import MyConstraint METADATA = SingleTableMetadata.load_from_dict({ 'METADATA_SPEC_VERSION': 'SINGLE_TABLE_V1', @@ -39,13 +34,6 @@ ] -def _isinstance_side_effect(*args, **kwargs): - if isinstance(args[0], GaussianMultivariate): - return True - else: - return isinstance(args[0], args[1]) - - @pytest.mark.parametrize('synthesizer', SYNTHESIZERS) def test_conditional_sampling_graceful_reject_sampling_true_dict(synthesizer): data = pd.DataFrame({ @@ -86,265 +74,6 @@ def test_conditional_sampling_graceful_reject_sampling_true_dataframe(synthesize synthesizer.sample_remaining_columns(conditions) -def test_fit_with_unique_constraint_on_data_with_only_index_column(): - """Test that the ``fit`` method runs without error when metadata specifies unique constraint, - ``fit`` is called on data containing a column named index. - - The ``fit`` method is expected to fit the model to data, - taking into account the metadata and the ``Unique`` constraint. - - Setup: - - The model is passed the unique constraint and - the primary key column. - - Input: - - Data, Unique constraint - - Github Issue: - - Tests that https://github.com/sdv-dev/SDV/issues/616 does not occur - """ - # Setup - test_df = pd.DataFrame({ - 'key': [ - 1, - 2, - 3, - 4, - 5, - ], - 'index': [ - 'A', - 'B', - 'C', - 'D', - 'E', - ] - }) - - metadata = SingleTableMetadata() - metadata.add_column('key', sdtype='id') - metadata.add_column('index', sdtype='categorical') - metadata.set_primary_key('key') - - model = GaussianCopulaSynthesizer(metadata) - constraint = { - 'constraint_class': 'Unique', - 'constraint_parameters': { - 'column_names': ['index'] - } - } - model.add_constraints([constraint]) - - # Run - model.fit(test_df) - samples = model.sample(2) - - # Assert - assert len(samples) == 2 - assert samples['index'].is_unique - - -def test_fit_with_unique_constraint_on_data_which_has_index_column(): - """Test that the ``fit`` method runs without error when metadata specifies unique constraint, - ``fit`` is called on data containing a column named index and other columns. - - The ``fit`` method is expected to fit the model to data, - taking into account the metadata and the ``Unique`` constraint. 
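For readers skimming the patch, the end-to-end workflow this test (and its copy in the new module) exercises boils down to a few lines. This is a distilled sketch using the same toy columns from the test body, not additional test code:

    import pandas as pd

    from sdv.metadata import SingleTableMetadata
    from sdv.single_table import GaussianCopulaSynthesizer

    # Describe the table: 'key' is the primary key, 'index' is categorical.
    metadata = SingleTableMetadata()
    metadata.add_column('key', sdtype='id')
    metadata.add_column('index', sdtype='categorical')
    metadata.set_primary_key('key')

    # Constraints are plain dicts naming a constraint class and its parameters.
    model = GaussianCopulaSynthesizer(metadata)
    model.add_constraints([{
        'constraint_class': 'Unique',
        'constraint_parameters': {'column_names': ['index']}
    }])

    model.fit(pd.DataFrame({'key': [1, 2, 3, 4, 5],
                            'index': ['A', 'B', 'C', 'D', 'E']}))
    samples = model.sample(2)
    assert samples['index'].is_unique  # the Unique constraint holds in samples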
- - Setup: - - The model is passed the unique constraint and - the primary key column. - - The unique constraint is set on the ``test_column`` - - Input: - - Data, Unique constraint - - Github Issue: - - Tests that https://github.com/sdv-dev/SDV/issues/616 does not occur - """ - # Setup - test_df = pd.DataFrame({ - 'key': [ - 1, - 2, - 3, - 4, - 5, - ], - 'index': [ - 'A', - 'B', - 'C', - 'D', - 'E', - ], - 'test_column': [ - 'A1', - 'B2', - 'C3', - 'D4', - 'E5', - ] - }) - - metadata = SingleTableMetadata() - metadata.add_column('key', sdtype='id') - metadata.add_column('index', sdtype='categorical') - metadata.add_column('test_column', sdtype='categorical') - metadata.set_primary_key('key') - - model = GaussianCopulaSynthesizer(metadata) - constraint = { - 'constraint_class': 'Unique', - 'constraint_parameters': { - 'column_names': ['test_column'] - } - } - model.add_constraints([constraint]) - - # Run - model.fit(test_df) - samples = model.sample(2) - - # Assert - assert len(samples) == 2 - assert samples['test_column'].is_unique - - -def test_fit_with_unique_constraint_on_data_subset(): - """Test that the ``fit`` method runs without error when metadata specifies unique constraint, - ``fit`` is called on a subset of the original data. - - The ``fit`` method is expected to fit the model to the subset of data, - taking into account the metadata and the ``Unique`` constraint. - - Setup: - - The model is passed a ``Unique`` constraint and is - matched to a subset of the specified data. - Subdividing the data results in missing indexes in the subset contained in the original data. - - Input: - - Subset of data, unique constraint - - Github Issue: - - Tests that https://github.com/sdv-dev/SDV/issues/610 does not occur - """ - # Setup - test_df = pd.DataFrame({ - 'key': [ - 1, - 2, - 3, - 4, - 5, - ], - 'test_column': [ - 'A', - 'B', - 'C', - 'D', - 'E', - ] - }) - - metadata = SingleTableMetadata() - metadata.add_column('key', sdtype='id') - metadata.add_column('test_column', sdtype='categorical') - metadata.set_primary_key('key') - - test_df = test_df.iloc[[1, 3, 4]] - constraint = { - 'constraint_class': 'Unique', - 'constraint_parameters': { - 'column_names': ['test_column'] - } - } - model = GaussianCopulaSynthesizer(metadata) - model.add_constraints([constraint]) - - # Run - model.fit(test_df) - samples = model.sample(2) - - # Assert - assert len(samples) == 2 - assert samples['test_column'].is_unique - - -@patch('sdv.single_table.base.isinstance') -@patch('sdv.single_table.copulas.multivariate.GaussianMultivariate', - spec_set=GaussianMultivariate) -def test_conditional_sampling_constraint_uses_reject_sampling(gm_mock, isinstance_mock): - """Test that the ``sample`` method handles constraints with conditions. - - The ``sample`` method is expected to properly apply constraint - transformations by dropping columns that cannot be conditonally sampled - on due to them being part of a constraint. - - Setup: - - The model is being passed a ``UniqueCombination`` constraint and then - asked to sample with two conditions, one of which the constraint depends on. - The constraint is expected to skip its transformations since only some of - the columns are provided by the conditions and the model will use reject - sampling to meet the constraint instead. 
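Stripped of the mocks, the user-facing call pattern under test looks like the sketch below, built from the same toy data as the test. Without mocking, reject sampling may need several batches before the condition is satisfied:

    import pandas as pd

    from sdv.metadata import SingleTableMetadata
    from sdv.sampling import Condition
    from sdv.single_table import GaussianCopulaSynthesizer

    data = pd.DataFrame({
        'city': ['LA', 'SF', 'CHI', 'LA', 'LA'],
        'state': ['CA', 'CA', 'IL', 'CA', 'CA'],
        'age': [27, 28, 26, 21, 30]
    })

    metadata = SingleTableMetadata()
    metadata.detect_from_dataframe(data)

    model = GaussianCopulaSynthesizer(metadata)
    model.add_constraints([{
        'constraint_class': 'FixedCombinations',
        'constraint_parameters': {'column_names': ['city', 'state']}
    }])
    model.fit(data)

    # 'state' is part of the FixedCombinations constraint, so it cannot be fed
    # directly to the underlying model; the synthesizer conditions on 'age'
    # alone and reject-samples until the (city, state) pairs match 'CA'.
    conditions = [Condition({'age': 30, 'state': 'CA'}, num_rows=5)]
    sampled = model.sample_from_conditions(conditions=conditions)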
- - Input: - - Conditions - Side Effects: - - Correct columns to condition on are passed to underlying sample method - """ - # Setup - isinstance_mock.side_effect = _isinstance_side_effect - data = pd.DataFrame({ - 'city': ['LA', 'SF', 'CHI', 'LA', 'LA'], - 'state': ['CA', 'CA', 'IL', 'CA', 'CA'], - 'age': [27, 28, 26, 21, 30] - }) - - metadata = SingleTableMetadata() - metadata.add_column('city', sdtype='categorical') - metadata.add_column('state', sdtype='categorical') - metadata.add_column('age', sdtype='numerical') - - model = GaussianCopulaSynthesizer(metadata) - - constraint = { - 'constraint_class': 'FixedCombinations', - 'constraint_parameters': { - 'column_names': ['city', 'state'] - } - } - model.add_constraints([constraint]) - sampled_numeric_data = [ - pd.DataFrame({ - 'city#state': [0, 1, 2, 0, 0], - 'age': [30, 30, 30, 30, 30] - }), - pd.DataFrame({ - 'city#state': [1], - 'age': [30] - }) - ] - gm_mock.return_value.sample.side_effect = sampled_numeric_data - model.fit(data) - - # Run - conditions = [Condition({'age': 30, 'state': 'CA'}, num_rows=5)] - sampled_data = model.sample_from_conditions(conditions=conditions) - - # Assert - expected_transformed_conditions = {'age': 30} - expected_data = pd.DataFrame({ - 'city': ['LA', 'SF', 'LA', 'LA', 'SF'], - 'state': ['CA', 'CA', 'CA', 'CA', 'CA'], - 'age': [30, 30, 30, 30, 30] - }) - sample_calls = model._model.sample.mock_calls - assert len(sample_calls) == 2 - model._model.sample.assert_any_call(5, conditions=expected_transformed_conditions) - pd.testing.assert_frame_equal(sampled_data, expected_data) - - def test_sample_from_conditions_with_batch_size(): """Test the ``sample_from_conditions`` method with a different ``batch_size``. @@ -584,101 +313,6 @@ def test_modeling_with_complex_datetimes(): synth.validate(sampled) -def test_custom_constraints_from_file(tmpdir): - """Ensure the correct loading for a custom constraint class defined in another file.""" - data = pd.DataFrame({ - 'primary_key': ['user-000', 'user-001', 'user-002'], - 'pii_col': ['223 Williams Rd', '75 Waltham St', '77 Mass Ave'], - 'numerical_col': [2, 3, 4], - 'categorical_col': ['a', 'b', 'a'], - }) - - metadata = SingleTableMetadata() - metadata.detect_from_dataframe(data) - metadata.update_column(column_name='pii_col', sdtype='address', pii=True) - synthesizer = GaussianCopulaSynthesizer( - metadata, - enforce_min_max_values=False, - enforce_rounding=False - ) - synthesizer.load_custom_constraint_classes( - 'tests/integration/single_table/custom_constraints.py', - ['MyConstraint'] - ) - constraint = { - 'constraint_class': 'MyConstraint', - 'constraint_parameters': { - 'column_names': ['numerical_col'] - } - } - - # Run - synthesizer.add_constraints([constraint]) - processed_data = synthesizer.preprocess(data) - - # Assert Processed Data - assert all(processed_data['numerical_col'] == data['numerical_col'] ** 2) - - # Run - Fit the model - synthesizer.fit_processed_data(processed_data) - - # Run - sample - sampled = synthesizer.sample(10) - assert all(sampled['numerical_col'] > 1) - - # Run - Save and Sample - synthesizer.save(tmpdir / 'test.pkl') - loaded_instance = synthesizer.load(tmpdir / 'test.pkl') - loaded_sampled = loaded_instance.sample(10) - assert all(loaded_sampled['numerical_col'] > 1) - - -def test_custom_constraints_from_object(tmpdir): - """Ensure the correct loading for a custom constraint class passed as an object.""" - data = pd.DataFrame({ - 'primary_key': ['user-000', 'user-001', 'user-002'], - 'pii_col': ['223 Williams Rd', '75 
Waltham St', '77 Mass Ave'], - 'numerical_col': [2, 3, 4], - 'categorical_col': ['a', 'b', 'a'], - }) - - metadata = SingleTableMetadata() - metadata.detect_from_dataframe(data) - metadata.update_column(column_name='pii_col', sdtype='address', pii=True) - synthesizer = GaussianCopulaSynthesizer( - metadata, - enforce_min_max_values=False, - enforce_rounding=False - ) - synthesizer.add_custom_constraint_class(MyConstraint, 'MyConstraint') - constraint = { - 'constraint_class': 'MyConstraint', - 'constraint_parameters': { - 'column_names': ['numerical_col'] - } - } - - # Run - synthesizer.add_constraints([constraint]) - processed_data = synthesizer.preprocess(data) - - # Assert Processed Data - assert all(processed_data['numerical_col'] == data['numerical_col'] ** 2) - - # Run - Fit the model - synthesizer.fit_processed_data(processed_data) - - # Run - sample - sampled = synthesizer.sample(10) - assert all(sampled['numerical_col'] > 1) - - # Run - Save and Sample - synthesizer.save(tmpdir / 'test.pkl') - loaded_instance = synthesizer.load(tmpdir / 'test.pkl') - loaded_sampled = loaded_instance.sample(10) - assert all(loaded_sampled['numerical_col'] > 1) - - def test_auto_assign_transformers_and_update_with_pii(): """Ensure the ability to update a transformer with any given ``pii`` sdtype. @@ -782,390 +416,6 @@ def test_get_info(): } -def test_synthesizer_with_inequality_constraint(): - """Ensure that the ``Inequality`` constraint can sample from the model.""" - # Setup - real_data, metadata = download_demo( - modality='single_table', - dataset_name='fake_hotel_guests' - ) - synthesizer = GaussianCopulaSynthesizer(metadata) - checkin_lessthan_checkout = { - 'constraint_class': 'Inequality', - 'constraint_parameters': { - 'low_column_name': 'checkin_date', - 'high_column_name': 'checkout_date' - } - } - - synthesizer.add_constraints([checkin_lessthan_checkout]) - synthesizer.fit(real_data) - - # Run and Assert - sampled = synthesizer.sample(num_rows=500) - synthesizer.validate(sampled) - _sampled = sampled[~sampled['checkout_date'].isna()] - assert all( - pd.to_datetime(_sampled['checkin_date']) < pd.to_datetime(_sampled['checkout_date']) - ) - - -def test_inequality_constraint_with_datetimes_and_nones(): - """Test that the ``Inequality`` constraint works with ``None`` and ``datetime``.""" - # Setup - data = pd.DataFrame(data={ - 'A': [None, None, '2020-01-02', '2020-03-04'] * 2, - 'B': [None, '2021-03-04', '2021-12-31', None] * 2 - }) - - metadata = SingleTableMetadata.load_from_dict({ - 'columns': { - 'A': {'sdtype': 'datetime', 'datetime_format': '%Y-%m-%d'}, - 'B': {'sdtype': 'datetime', 'datetime_format': '%Y-%m-%d'} - } - }) - - metadata.validate() - synth = GaussianCopulaSynthesizer(metadata) - synth.add_constraints([ - { - 'constraint_class': 'Inequality', - 'constraint_parameters': { - 'low_column_name': 'A', - 'high_column_name': 'B' - } - } - ]) - synth.validate(data) - - # Run - synth.fit(data) - sampled = synth.sample(10) - - # Assert - expected_sampled = pd.DataFrame({ - 'A': { - 0: '2020-01-02', - 1: '2019-10-30', - 2: np.nan, - 3: np.nan, - 4: '2020-01-02', - 5: np.nan, - 6: '2019-10-30', - 7: np.nan, - 8: '2020-01-02', - 9: np.nan - }, - 'B': { - 0: '2021-12-30', - 1: '2021-10-27', - 2: '2021-10-27', - 3: '2021-10-27', - 4: np.nan, - 5: '2021-10-27', - 6: '2021-10-27', - 7: '2021-12-30', - 8: np.nan, - 9: '2021-10-27' - } - }) - pd.testing.assert_frame_equal(expected_sampled, sampled) - - -def test_scalar_inequality_constraint_with_datetimes_and_nones(): - """Test that the 
``ScalarInequality`` constraint works with ``None`` and ``datetime``.""" - # Setup - data = pd.DataFrame(data={ - 'A': [None, None, '2020-01-02', '2020-03-04'], - 'B': [None, '2021-03-04', '2021-12-31', None] - }) - - metadata = SingleTableMetadata.load_from_dict({ - 'columns': { - 'A': {'sdtype': 'datetime', 'datetime_format': '%Y-%m-%d'}, - 'B': {'sdtype': 'datetime', 'datetime_format': '%Y-%m-%d'} - } - }) - - metadata.validate() - synth = GaussianCopulaSynthesizer(metadata) - synth.add_constraints([ - { - 'constraint_class': 'ScalarInequality', - 'constraint_parameters': { - 'column_name': 'A', - 'relation': '>=', - 'value': '2019-01-01' - } - } - ]) - synth.validate(data) - - # Run - synth.fit(data) - sampled = synth.sample(5) - - # Assert - expected_sampled = pd.DataFrame({ - 'A': { - 0: np.nan, - 1: '2020-01-19', - 2: np.nan, - 3: '2020-01-29', - 4: '2020-01-31', - }, - 'B': { - 0: '2021-07-28', - 1: '2021-07-14', - 2: '2021-07-26', - 3: '2021-07-02', - 4: '2021-06-06', - } - }) - pd.testing.assert_frame_equal(expected_sampled, sampled) - - -def test_scalar_range_constraint_with_datetimes_and_nones(): - """Test that the ``ScalarRange`` constraint works with ``None`` and ``datetime``.""" - # Setup - data = pd.DataFrame(data={ - 'A': [None, None, '2020-01-02', '2020-03-04'], - 'B': [None, '2021-03-04', '2021-12-31', None] - }) - - metadata = SingleTableMetadata.load_from_dict({ - 'columns': { - 'A': {'sdtype': 'datetime', 'datetime_format': '%Y-%m-%d'}, - 'B': {'sdtype': 'datetime', 'datetime_format': '%Y-%m-%d'} - } - }) - - metadata.validate() - synth = GaussianCopulaSynthesizer(metadata) - synth.add_constraints([ - { - 'constraint_class': 'ScalarRange', - 'constraint_parameters': { - 'column_name': 'A', - 'low_value': '2019-10-30', - 'high_value': '2020-03-04', - 'strict_boundaries': False - } - } - ]) - synth.validate(data) - - # Run - synth.fit(data) - sampled = synth.sample(10) - - # Assert - expected_sampled = pd.DataFrame({ - 'A': { - 0: '2020-03-03', - 1: np.nan, - 2: '2020-03-03', - 3: np.nan, - 4: np.nan, - 5: '2020-03-03', - 6: np.nan, - 7: np.nan, - 8: np.nan, - 9: '2020-02-27', - }, - 'B': { - 0: np.nan, - 1: np.nan, - 2: np.nan, - 3: np.nan, - 4: np.nan, - 5: '2021-04-14', - 6: np.nan, - 7: '2021-05-21', - 8: np.nan, - 9: np.nan, - } - }) - pd.testing.assert_frame_equal(expected_sampled, sampled) - - -def test_range_constraint_with_datetimes_and_nones(): - """Test that the ``Range`` constraint works with ``None`` and ``datetime``.""" - # Setup - data = pd.DataFrame(data={ - 'A': [None, None, '2020-01-02', '2020-03-04'], - 'B': [None, '2021-03-04', '2021-12-31', None], - 'C': [None, '2022-03-04', '2022-12-31', None], - }) - - metadata = SingleTableMetadata.load_from_dict({ - 'columns': { - 'A': {'sdtype': 'datetime', 'datetime_format': '%Y-%m-%d'}, - 'B': {'sdtype': 'datetime', 'datetime_format': '%Y-%m-%d'}, - 'C': {'sdtype': 'datetime', 'datetime_format': '%Y-%m-%d'} - } - }) - - metadata.validate() - synth = GaussianCopulaSynthesizer(metadata) - synth.add_constraints([ - { - 'constraint_class': 'Range', - 'constraint_parameters': { - 'low_column_name': 'A', - 'middle_column_name': 'B', - 'high_column_name': 'C', - 'strict_boundaries': False - } - } - ]) - synth.validate(data) - - # Run - synth.fit(data) - sampled = synth.sample(10) - - # Assert - expected_sampled = pd.DataFrame({ - 'A': { - 0: '2020-01-02', - 1: '2020-01-02', - 2: np.nan, - 3: '2020-01-02', - 4: '2019-10-30', - 5: np.nan, - 6: '2020-01-02', - 7: '2019-10-30', - 8: '2019-10-30', - 9: np.nan - }, - 'B': 
{ - 0: '2021-12-30', - 1: '2021-12-30', - 2: '2021-10-27', - 3: np.nan, - 4: '2021-10-27', - 5: '2021-10-27', - 6: np.nan, - 7: '2021-10-27', - 8: np.nan, - 9: '2021-10-27' - }, - 'C': { - 0: '2022-12-30', - 1: '2022-12-30', - 2: '2022-10-27', - 3: np.nan, - 4: '2022-10-27', - 5: '2022-10-27', - 6: np.nan, - 7: '2022-10-27', - 8: np.nan, - 9: '2022-10-27' - } - }) - pd.testing.assert_frame_equal(expected_sampled, sampled) - - -def test_inequality_constraint_all_possible_nans_configurations(): - """Test that the inequality constraint works with all possible NaN configurations.""" - # Setup - data = pd.DataFrame(data={ - 'A': [0, 1, np.nan, np.nan, 2], - 'B': [2, np.nan, 3, np.nan, 3] - }) - - metadata = SingleTableMetadata.load_from_dict({ - 'columns': { - 'A': {'sdtype': 'numerical'}, - 'B': {'sdtype': 'numerical'}, - } - }) - - synthesizer = GaussianCopulaSynthesizer(metadata) - synthesizer.add_constraints( - [ - { - 'constraint_class': 'Inequality', - 'constraint_parameters': { - 'low_column_name': 'A', - 'high_column_name': 'B' - } - } - ] - ) - - # Run - synthesizer.fit(data) - synthetic_data = synthesizer.sample(10000) - - # Assert - assert (~(pd.isna(synthetic_data['A'])) & ~(pd.isna(synthetic_data['B']))).any() - assert ((pd.isna(synthetic_data['A'])) & ~(pd.isna(synthetic_data['B']))).any() - assert (~(pd.isna(synthetic_data['A'])) & (pd.isna(synthetic_data['B']))).any() - assert (~(pd.isna(synthetic_data['A'])) & ~(pd.isna(synthetic_data['B']))).any() - - -def test_range_constraint_all_possible_nans_configurations(): - """Test that the range constraint works with all possible NaN configurations.""" - # Setup - data = pd.DataFrame(data={ - 'low': [1, 4, np.nan, 0, 4, np.nan, np.nan, 5, np.nan], - 'middle': [2, 5, 3, np.nan, 5, np.nan, 5, np.nan, np.nan], - 'high': [3, 7, 8, 4, np.nan, 9, np.nan, np.nan, np.nan] - }) - - metadata_dict = { - 'columns': { - 'low': {'sdtype': 'numerical'}, - 'middle': {'sdtype': 'numerical'}, - 'high': {'sdtype': 'numerical'} - } - } - - metadata = SingleTableMetadata.load_from_dict(metadata_dict) - synthesizer = GaussianCopulaSynthesizer(metadata) - - my_constraint = { - 'constraint_class': 'Range', - 'constraint_parameters': { - 'low_column_name': 'low', - 'middle_column_name': 'middle', - 'high_column_name': 'high' - } - } - - # Run - synthesizer.add_constraints(constraints=[my_constraint]) - synthesizer.fit(data) - - s_data = synthesizer.sample(2000) - - # Assert - synt_data_not_nan_low_middle = s_data[~(pd.isna(s_data['low'])) & ~(pd.isna(s_data['middle']))] - synt_data_not_nan_middle_high = s_data[ - ~(pd.isna(s_data['middle'])) & ~(pd.isna(s_data['high'])) - ] - synt_data_not_nan_low_high = s_data[~(pd.isna(s_data['low'])) & ~(pd.isna(s_data['high']))] - - is_nan_low = pd.isna(s_data['low']) - is_nan_middle = pd.isna(s_data['middle']) - is_nan_high = pd.isna(s_data['high']) - - assert all(synt_data_not_nan_low_middle['low'] <= synt_data_not_nan_low_middle['middle']) - assert all(synt_data_not_nan_middle_high['middle'] <= synt_data_not_nan_middle_high['high']) - assert all(synt_data_not_nan_low_high['low'] <= synt_data_not_nan_low_high['high']) - - assert any(is_nan_low & is_nan_middle & is_nan_high) - assert any(is_nan_low & is_nan_middle & ~is_nan_high) - assert any(is_nan_low & ~is_nan_middle & is_nan_high) - assert any(is_nan_low & ~is_nan_middle & ~is_nan_high) - assert any(~is_nan_low & is_nan_middle & is_nan_high) - assert any(~is_nan_low & is_nan_middle & ~is_nan_high) - assert any(~is_nan_low & ~is_nan_middle & is_nan_high) - assert 
any(~is_nan_low & ~is_nan_middle & ~is_nan_high) - - def test_save_and_load(tmp_path): """Test that synthesizers can be saved and loaded properly.""" # Setup diff --git a/tests/integration/single_table/test_constraints.py b/tests/integration/single_table/test_constraints.py new file mode 100644 index 000000000..4a1b51fd3 --- /dev/null +++ b/tests/integration/single_table/test_constraints.py @@ -0,0 +1,810 @@ +"""Module for testing single table synthesizers with constraints.""" + +from unittest.mock import patch + +import numpy as np +import pandas as pd +from copulas.multivariate.gaussian import GaussianMultivariate + +from sdv.constraints import create_custom_constraint_class +from sdv.datasets.demo import download_demo +from sdv.metadata import SingleTableMetadata +from sdv.sampling import Condition +from sdv.single_table import GaussianCopulaSynthesizer +from tests.integration.single_table.custom_constraints import MyConstraint + + +def _isinstance_side_effect(*args, **kwargs): + if isinstance(args[0], GaussianMultivariate): + return True + else: + return isinstance(args[0], args[1]) + + +def test_fit_with_unique_constraint_on_data_with_only_index_column(): + """Test that the ``fit`` method runs without error when metadata specifies unique constraint, + ``fit`` is called on data containing a column named index. + + The ``fit`` method is expected to fit the model to data, + taking into account the metadata and the ``Unique`` constraint. + + Setup: + - The model is passed the unique constraint and + the primary key column. + + Input: + - Data, Unique constraint + + Github Issue: + - Tests that https://github.com/sdv-dev/SDV/issues/616 does not occur + """ + # Setup + test_df = pd.DataFrame({ + 'key': [ + 1, + 2, + 3, + 4, + 5, + ], + 'index': [ + 'A', + 'B', + 'C', + 'D', + 'E', + ] + }) + + metadata = SingleTableMetadata() + metadata.add_column('key', sdtype='id') + metadata.add_column('index', sdtype='categorical') + metadata.set_primary_key('key') + + model = GaussianCopulaSynthesizer(metadata) + constraint = { + 'constraint_class': 'Unique', + 'constraint_parameters': { + 'column_names': ['index'] + } + } + model.add_constraints([constraint]) + + # Run + model.fit(test_df) + samples = model.sample(2) + + # Assert + assert len(samples) == 2 + assert samples['index'].is_unique + + +def test_fit_with_unique_constraint_on_data_which_has_index_column(): + """Test that the ``fit`` method runs without error when metadata specifies unique constraint, + ``fit`` is called on data containing a column named index and other columns. + + The ``fit`` method is expected to fit the model to data, + taking into account the metadata and the ``Unique`` constraint. + + Setup: + - The model is passed the unique constraint and + the primary key column. 
+        - The unique constraint is set on the ``test_column``
+
+    Input:
+        - Data, Unique constraint
+
+    GitHub Issue:
+        - Tests that https://github.com/sdv-dev/SDV/issues/616 does not occur
+    """
+    # Setup
+    test_df = pd.DataFrame({
+        'key': [
+            1,
+            2,
+            3,
+            4,
+            5,
+        ],
+        'index': [
+            'A',
+            'B',
+            'C',
+            'D',
+            'E',
+        ],
+        'test_column': [
+            'A1',
+            'B2',
+            'C3',
+            'D4',
+            'E5',
+        ]
+    })
+
+    metadata = SingleTableMetadata()
+    metadata.add_column('key', sdtype='id')
+    metadata.add_column('index', sdtype='categorical')
+    metadata.add_column('test_column', sdtype='categorical')
+    metadata.set_primary_key('key')
+
+    model = GaussianCopulaSynthesizer(metadata)
+    constraint = {
+        'constraint_class': 'Unique',
+        'constraint_parameters': {
+            'column_names': ['test_column']
+        }
+    }
+    model.add_constraints([constraint])
+
+    # Run
+    model.fit(test_df)
+    samples = model.sample(2)
+
+    # Assert
+    assert len(samples) == 2
+    assert samples['test_column'].is_unique
+
+
+def test_fit_with_unique_constraint_on_data_subset():
+    """Test that the ``fit`` method runs without error when the metadata specifies a unique
+    constraint and ``fit`` is called on a subset of the original data.
+
+    The ``fit`` method is expected to fit the model to the subset of data,
+    taking into account the metadata and the ``Unique`` constraint.
+
+    Setup:
+        - The model is passed a ``Unique`` constraint and is
+          matched to a subset of the specified data.
+          Subdividing the data results in index values that are present in the
+          original data but missing from the subset.
+
+    Input:
+        - Subset of data, unique constraint
+
+    GitHub Issue:
+        - Tests that https://github.com/sdv-dev/SDV/issues/610 does not occur
+    """
+    # Setup
+    test_df = pd.DataFrame({
+        'key': [
+            1,
+            2,
+            3,
+            4,
+            5,
+        ],
+        'test_column': [
+            'A',
+            'B',
+            'C',
+            'D',
+            'E',
+        ]
+    })
+
+    metadata = SingleTableMetadata()
+    metadata.add_column('key', sdtype='id')
+    metadata.add_column('test_column', sdtype='categorical')
+    metadata.set_primary_key('key')
+
+    test_df = test_df.iloc[[1, 3, 4]]
+    constraint = {
+        'constraint_class': 'Unique',
+        'constraint_parameters': {
+            'column_names': ['test_column']
+        }
+    }
+    model = GaussianCopulaSynthesizer(metadata)
+    model.add_constraints([constraint])
+
+    # Run
+    model.fit(test_df)
+    samples = model.sample(2)
+
+    # Assert
+    assert len(samples) == 2
+    assert samples['test_column'].is_unique
+
+
+@patch('sdv.single_table.base.isinstance')
+@patch('sdv.single_table.copulas.multivariate.GaussianMultivariate',
+       spec_set=GaussianMultivariate)
+def test_conditional_sampling_constraint_uses_reject_sampling(gm_mock, isinstance_mock):
+    """Test that the ``sample`` method handles constraints with conditions.
+
+    The ``sample`` method is expected to properly apply constraint
+    transformations by dropping columns that cannot be conditionally sampled
+    on due to them being part of a constraint.
+
+    Setup:
+        - The model is being passed a ``FixedCombinations`` constraint and then
+          asked to sample with two conditions, one of which the constraint depends on.
+          The constraint is expected to skip its transformations since only some of
+          the columns are provided by the conditions and the model will use reject
+          sampling to meet the constraint instead.
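Conceptually, the fallback this test pins down is a reject-sampling loop. A simplified stand-alone sketch of the idea follows; it is not SDV's actual implementation, and the names and retry policy are illustrative:

    import pandas as pd

    def reject_sample(sample_fn, is_valid_fn, num_rows, max_tries=100):
        # Draw batches, keep only the rows that satisfy the constraint, and
        # stop once enough valid rows have been collected (or tries run out).
        collected = []
        valid_count = 0
        for _ in range(max_tries):
            batch = sample_fn(num_rows)
            valid = batch[is_valid_fn(batch)]
            collected.append(valid)
            valid_count += len(valid)
            if valid_count >= num_rows:
                break
        return pd.concat(collected, ignore_index=True).head(num_rows)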
+ + Input: + - Conditions + Side Effects: + - Correct columns to condition on are passed to underlying sample method + """ + # Setup + isinstance_mock.side_effect = _isinstance_side_effect + data = pd.DataFrame({ + 'city': ['LA', 'SF', 'CHI', 'LA', 'LA'], + 'state': ['CA', 'CA', 'IL', 'CA', 'CA'], + 'age': [27, 28, 26, 21, 30] + }) + + metadata = SingleTableMetadata() + metadata.add_column('city', sdtype='categorical') + metadata.add_column('state', sdtype='categorical') + metadata.add_column('age', sdtype='numerical') + + model = GaussianCopulaSynthesizer(metadata) + + constraint = { + 'constraint_class': 'FixedCombinations', + 'constraint_parameters': { + 'column_names': ['city', 'state'] + } + } + model.add_constraints([constraint]) + sampled_numeric_data = [ + pd.DataFrame({ + 'city#state': [0, 1, 2, 0, 0], + 'age': [30, 30, 30, 30, 30] + }), + pd.DataFrame({ + 'city#state': [1], + 'age': [30] + }) + ] + gm_mock.return_value.sample.side_effect = sampled_numeric_data + model.fit(data) + + # Run + conditions = [Condition({'age': 30, 'state': 'CA'}, num_rows=5)] + sampled_data = model.sample_from_conditions(conditions=conditions) + + # Assert + expected_transformed_conditions = {'age': 30} + expected_data = pd.DataFrame({ + 'city': ['LA', 'SF', 'LA', 'LA', 'SF'], + 'state': ['CA', 'CA', 'CA', 'CA', 'CA'], + 'age': [30, 30, 30, 30, 30] + }) + sample_calls = model._model.sample.mock_calls + assert len(sample_calls) == 2 + model._model.sample.assert_any_call(5, conditions=expected_transformed_conditions) + pd.testing.assert_frame_equal(sampled_data, expected_data) + + +def test_custom_constraints_from_file(tmpdir): + """Ensure the correct loading for a custom constraint class defined in another file.""" + data = pd.DataFrame({ + 'primary_key': ['user-000', 'user-001', 'user-002'], + 'pii_col': ['223 Williams Rd', '75 Waltham St', '77 Mass Ave'], + 'numerical_col': [2, 3, 4], + 'categorical_col': ['a', 'b', 'a'], + }) + + metadata = SingleTableMetadata() + metadata.detect_from_dataframe(data) + metadata.update_column(column_name='pii_col', sdtype='address', pii=True) + synthesizer = GaussianCopulaSynthesizer( + metadata, + enforce_min_max_values=False, + enforce_rounding=False + ) + synthesizer.load_custom_constraint_classes( + 'tests/integration/single_table/custom_constraints.py', + ['MyConstraint'] + ) + constraint = { + 'constraint_class': 'MyConstraint', + 'constraint_parameters': { + 'column_names': ['numerical_col'] + } + } + + # Run + synthesizer.add_constraints([constraint]) + processed_data = synthesizer.preprocess(data) + + # Assert Processed Data + assert all(processed_data['numerical_col'] == data['numerical_col'] ** 2) + + # Run - Fit the model + synthesizer.fit_processed_data(processed_data) + + # Run - sample + sampled = synthesizer.sample(10) + assert all(sampled['numerical_col'] > 1) + + # Run - Save and Sample + synthesizer.save(tmpdir / 'test.pkl') + loaded_instance = synthesizer.load(tmpdir / 'test.pkl') + loaded_sampled = loaded_instance.sample(10) + assert all(loaded_sampled['numerical_col'] > 1) + + +def test_custom_constraints_from_object(tmpdir): + """Ensure the correct loading for a custom constraint class passed as an object.""" + data = pd.DataFrame({ + 'primary_key': ['user-000', 'user-001', 'user-002'], + 'pii_col': ['223 Williams Rd', '75 Waltham St', '77 Mass Ave'], + 'numerical_col': [2, 3, 4], + 'categorical_col': ['a', 'b', 'a'], + }) + + metadata = SingleTableMetadata() + metadata.detect_from_dataframe(data) + metadata.update_column(column_name='pii_col', 
sdtype='address', pii=True) + synthesizer = GaussianCopulaSynthesizer( + metadata, + enforce_min_max_values=False, + enforce_rounding=False + ) + synthesizer.add_custom_constraint_class(MyConstraint, 'MyConstraint') + constraint = { + 'constraint_class': 'MyConstraint', + 'constraint_parameters': { + 'column_names': ['numerical_col'] + } + } + + # Run + synthesizer.add_constraints([constraint]) + processed_data = synthesizer.preprocess(data) + + # Assert Processed Data + assert all(processed_data['numerical_col'] == data['numerical_col'] ** 2) + + # Run - Fit the model + synthesizer.fit_processed_data(processed_data) + + # Run - sample + sampled = synthesizer.sample(10) + assert all(sampled['numerical_col'] > 1) + + # Run - Save and Sample + synthesizer.save(tmpdir / 'test.pkl') + loaded_instance = synthesizer.load(tmpdir / 'test.pkl') + loaded_sampled = loaded_instance.sample(10) + assert all(loaded_sampled['numerical_col'] > 1) + + +def test_synthesizer_with_inequality_constraint(): + """Ensure that the ``Inequality`` constraint can sample from the model.""" + # Setup + real_data, metadata = download_demo( + modality='single_table', + dataset_name='fake_hotel_guests' + ) + synthesizer = GaussianCopulaSynthesizer(metadata) + checkin_lessthan_checkout = { + 'constraint_class': 'Inequality', + 'constraint_parameters': { + 'low_column_name': 'checkin_date', + 'high_column_name': 'checkout_date' + } + } + + synthesizer.add_constraints([checkin_lessthan_checkout]) + synthesizer.fit(real_data) + + # Run and Assert + sampled = synthesizer.sample(num_rows=500) + synthesizer.validate(sampled) + _sampled = sampled[~sampled['checkout_date'].isna()] + assert all( + pd.to_datetime(_sampled['checkin_date']) < pd.to_datetime(_sampled['checkout_date']) + ) + + +def test_inequality_constraint_with_datetimes_and_nones(): + """Test that the ``Inequality`` constraint works with ``None`` and ``datetime``.""" + # Setup + data = pd.DataFrame(data={ + 'A': [None, None, '2020-01-02', '2020-03-04'] * 2, + 'B': [None, '2021-03-04', '2021-12-31', None] * 2 + }) + + metadata = SingleTableMetadata.load_from_dict({ + 'columns': { + 'A': {'sdtype': 'datetime', 'datetime_format': '%Y-%m-%d'}, + 'B': {'sdtype': 'datetime', 'datetime_format': '%Y-%m-%d'} + } + }) + + metadata.validate() + synth = GaussianCopulaSynthesizer(metadata) + synth.add_constraints([ + { + 'constraint_class': 'Inequality', + 'constraint_parameters': { + 'low_column_name': 'A', + 'high_column_name': 'B' + } + } + ]) + synth.validate(data) + + # Run + synth.fit(data) + sampled = synth.sample(10) + + # Assert + expected_sampled = pd.DataFrame({ + 'A': { + 0: '2020-01-02', + 1: '2019-10-30', + 2: np.nan, + 3: np.nan, + 4: '2020-01-02', + 5: np.nan, + 6: '2019-10-30', + 7: np.nan, + 8: '2020-01-02', + 9: np.nan + }, + 'B': { + 0: '2021-12-30', + 1: '2021-10-27', + 2: '2021-10-27', + 3: '2021-10-27', + 4: np.nan, + 5: '2021-10-27', + 6: '2021-10-27', + 7: '2021-12-30', + 8: np.nan, + 9: '2021-10-27' + } + }) + pd.testing.assert_frame_equal(expected_sampled, sampled) + + +def test_scalar_inequality_constraint_with_datetimes_and_nones(): + """Test that the ``ScalarInequality`` constraint works with ``None`` and ``datetime``.""" + # Setup + data = pd.DataFrame(data={ + 'A': [None, None, '2020-01-02', '2020-03-04'], + 'B': [None, '2021-03-04', '2021-12-31', None] + }) + + metadata = SingleTableMetadata.load_from_dict({ + 'columns': { + 'A': {'sdtype': 'datetime', 'datetime_format': '%Y-%m-%d'}, + 'B': {'sdtype': 'datetime', 'datetime_format': '%Y-%m-%d'} + } 
+ }) + + metadata.validate() + synth = GaussianCopulaSynthesizer(metadata) + synth.add_constraints([ + { + 'constraint_class': 'ScalarInequality', + 'constraint_parameters': { + 'column_name': 'A', + 'relation': '>=', + 'value': '2019-01-01' + } + } + ]) + synth.validate(data) + + # Run + synth.fit(data) + sampled = synth.sample(5) + + # Assert + expected_sampled = pd.DataFrame({ + 'A': { + 0: np.nan, + 1: '2020-01-19', + 2: np.nan, + 3: '2020-01-29', + 4: '2020-01-31', + }, + 'B': { + 0: '2021-07-28', + 1: '2021-07-14', + 2: '2021-07-26', + 3: '2021-07-02', + 4: '2021-06-06', + } + }) + pd.testing.assert_frame_equal(expected_sampled, sampled) + + +def test_scalar_range_constraint_with_datetimes_and_nones(): + """Test that the ``ScalarRange`` constraint works with ``None`` and ``datetime``.""" + # Setup + data = pd.DataFrame(data={ + 'A': [None, None, '2020-01-02', '2020-03-04'], + 'B': [None, '2021-03-04', '2021-12-31', None] + }) + + metadata = SingleTableMetadata.load_from_dict({ + 'columns': { + 'A': {'sdtype': 'datetime', 'datetime_format': '%Y-%m-%d'}, + 'B': {'sdtype': 'datetime', 'datetime_format': '%Y-%m-%d'} + } + }) + + metadata.validate() + synth = GaussianCopulaSynthesizer(metadata) + synth.add_constraints([ + { + 'constraint_class': 'ScalarRange', + 'constraint_parameters': { + 'column_name': 'A', + 'low_value': '2019-10-30', + 'high_value': '2020-03-04', + 'strict_boundaries': False + } + } + ]) + synth.validate(data) + + # Run + synth.fit(data) + sampled = synth.sample(10) + + # Assert + expected_sampled = pd.DataFrame({ + 'A': { + 0: '2020-03-03', + 1: np.nan, + 2: '2020-03-03', + 3: np.nan, + 4: np.nan, + 5: '2020-03-03', + 6: np.nan, + 7: np.nan, + 8: np.nan, + 9: '2020-02-27', + }, + 'B': { + 0: np.nan, + 1: np.nan, + 2: np.nan, + 3: np.nan, + 4: np.nan, + 5: '2021-04-14', + 6: np.nan, + 7: '2021-05-21', + 8: np.nan, + 9: np.nan, + } + }) + pd.testing.assert_frame_equal(expected_sampled, sampled) + + +def test_range_constraint_with_datetimes_and_nones(): + """Test that the ``Range`` constraint works with ``None`` and ``datetime``.""" + # Setup + data = pd.DataFrame(data={ + 'A': [None, None, '2020-01-02', '2020-03-04'], + 'B': [None, '2021-03-04', '2021-12-31', None], + 'C': [None, '2022-03-04', '2022-12-31', None], + }) + + metadata = SingleTableMetadata.load_from_dict({ + 'columns': { + 'A': {'sdtype': 'datetime', 'datetime_format': '%Y-%m-%d'}, + 'B': {'sdtype': 'datetime', 'datetime_format': '%Y-%m-%d'}, + 'C': {'sdtype': 'datetime', 'datetime_format': '%Y-%m-%d'} + } + }) + + metadata.validate() + synth = GaussianCopulaSynthesizer(metadata) + synth.add_constraints([ + { + 'constraint_class': 'Range', + 'constraint_parameters': { + 'low_column_name': 'A', + 'middle_column_name': 'B', + 'high_column_name': 'C', + 'strict_boundaries': False + } + } + ]) + synth.validate(data) + + # Run + synth.fit(data) + sampled = synth.sample(10) + + # Assert + expected_sampled = pd.DataFrame({ + 'A': { + 0: '2020-01-02', + 1: '2020-01-02', + 2: np.nan, + 3: '2020-01-02', + 4: '2019-10-30', + 5: np.nan, + 6: '2020-01-02', + 7: '2019-10-30', + 8: '2019-10-30', + 9: np.nan + }, + 'B': { + 0: '2021-12-30', + 1: '2021-12-30', + 2: '2021-10-27', + 3: np.nan, + 4: '2021-10-27', + 5: '2021-10-27', + 6: np.nan, + 7: '2021-10-27', + 8: np.nan, + 9: '2021-10-27' + }, + 'C': { + 0: '2022-12-30', + 1: '2022-12-30', + 2: '2022-10-27', + 3: np.nan, + 4: '2022-10-27', + 5: '2022-10-27', + 6: np.nan, + 7: '2022-10-27', + 8: np.nan, + 9: '2022-10-27' + } + }) + 
pd.testing.assert_frame_equal(expected_sampled, sampled) + + +def test_inequality_constraint_all_possible_nans_configurations(): + """Test that the inequality constraint works with all possible NaN configurations.""" + # Setup + data = pd.DataFrame(data={ + 'A': [0, 1, np.nan, np.nan, 2], + 'B': [2, np.nan, 3, np.nan, 3] + }) + + metadata = SingleTableMetadata.load_from_dict({ + 'columns': { + 'A': {'sdtype': 'numerical'}, + 'B': {'sdtype': 'numerical'}, + } + }) + + synthesizer = GaussianCopulaSynthesizer(metadata) + synthesizer.add_constraints( + [ + { + 'constraint_class': 'Inequality', + 'constraint_parameters': { + 'low_column_name': 'A', + 'high_column_name': 'B' + } + } + ] + ) + + # Run + synthesizer.fit(data) + synthetic_data = synthesizer.sample(10000) + + # Assert + assert (~(pd.isna(synthetic_data['A'])) & ~(pd.isna(synthetic_data['B']))).any() + assert ((pd.isna(synthetic_data['A'])) & ~(pd.isna(synthetic_data['B']))).any() + assert (~(pd.isna(synthetic_data['A'])) & (pd.isna(synthetic_data['B']))).any() + assert (~(pd.isna(synthetic_data['A'])) & ~(pd.isna(synthetic_data['B']))).any() + + +def test_range_constraint_all_possible_nans_configurations(): + """Test that the range constraint works with all possible NaN configurations.""" + # Setup + data = pd.DataFrame(data={ + 'low': [1, 4, np.nan, 0, 4, np.nan, np.nan, 5, np.nan], + 'middle': [2, 5, 3, np.nan, 5, np.nan, 5, np.nan, np.nan], + 'high': [3, 7, 8, 4, np.nan, 9, np.nan, np.nan, np.nan] + }) + + metadata_dict = { + 'columns': { + 'low': {'sdtype': 'numerical'}, + 'middle': {'sdtype': 'numerical'}, + 'high': {'sdtype': 'numerical'} + } + } + + metadata = SingleTableMetadata.load_from_dict(metadata_dict) + synthesizer = GaussianCopulaSynthesizer(metadata) + + my_constraint = { + 'constraint_class': 'Range', + 'constraint_parameters': { + 'low_column_name': 'low', + 'middle_column_name': 'middle', + 'high_column_name': 'high' + } + } + + # Run + synthesizer.add_constraints(constraints=[my_constraint]) + synthesizer.fit(data) + + s_data = synthesizer.sample(2000) + + # Assert + synt_data_not_nan_low_middle = s_data[~(pd.isna(s_data['low'])) & ~(pd.isna(s_data['middle']))] + synt_data_not_nan_middle_high = s_data[ + ~(pd.isna(s_data['middle'])) & ~(pd.isna(s_data['high'])) + ] + synt_data_not_nan_low_high = s_data[~(pd.isna(s_data['low'])) & ~(pd.isna(s_data['high']))] + + is_nan_low = pd.isna(s_data['low']) + is_nan_middle = pd.isna(s_data['middle']) + is_nan_high = pd.isna(s_data['high']) + + assert all(synt_data_not_nan_low_middle['low'] <= synt_data_not_nan_low_middle['middle']) + assert all(synt_data_not_nan_middle_high['middle'] <= synt_data_not_nan_middle_high['high']) + assert all(synt_data_not_nan_low_high['low'] <= synt_data_not_nan_low_high['high']) + + assert any(is_nan_low & is_nan_middle & is_nan_high) + assert any(is_nan_low & is_nan_middle & ~is_nan_high) + assert any(is_nan_low & ~is_nan_middle & is_nan_high) + assert any(is_nan_low & ~is_nan_middle & ~is_nan_high) + assert any(~is_nan_low & is_nan_middle & is_nan_high) + assert any(~is_nan_low & is_nan_middle & ~is_nan_high) + assert any(~is_nan_low & ~is_nan_middle & is_nan_high) + assert any(~is_nan_low & ~is_nan_middle & ~is_nan_high) + + +def test_custom_constraint_with_key(): + """Test that a custom constraint can work with a primary key.""" + # Setup + def is_valid(column_names, data): + return data['key'] == data['letter'] + '_' + data['number'] + + def transform(column_names, data): + new_data = data.drop(['letter', 'number'], axis=1) + return 
new_data + + def reverse_transform(column_names, data): + columns = data['key'].str.split('_', expand=True) + data['letter'] = columns[0] + data['number'] = columns[1] + return data + + custom_constraint = create_custom_constraint_class( + is_valid_fn=is_valid, + transform_fn=transform, + reverse_transform_fn=reverse_transform + ) + + data = pd.DataFrame({ + 'key': ['a_1', 'b_2', 'c_3'], + 'letter': ['a', 'b', 'c'], + 'number': ['1', '2', '3'], + 'other': [7, 8, 9] + }) + metadata = SingleTableMetadata() + metadata.detect_from_dataframe(data) + metadata.update_column('key', sdtype='id', regex_format=r'\w_\d') + metadata.set_primary_key('key') + synth = GaussianCopulaSynthesizer(metadata) + synth.add_custom_constraint_class(custom_constraint, 'custom') + + id_must_match = { + 'constraint_class': 'custom', + 'constraint_parameters': { + 'column_names': ['letter', 'number'], + } + } + synth.add_constraints([id_must_match]) + + # Run + synth.fit(data) + sampled = synth.sample(100) + + # Assert + synth.validate(sampled) From 794c5e5fa4c6626ebd3934c7d50f975213943723 Mon Sep 17 00:00:00 2001 From: Andrew Montanez Date: Fri, 28 Jul 2023 15:42:00 -0500 Subject: [PATCH 2/4] adding key columns before reversing constraints --- sdv/data_processing/data_processor.py | 1 + 1 file changed, 1 insertion(+) diff --git a/sdv/data_processing/data_processor.py b/sdv/data_processing/data_processor.py index 563c9aa81..46b45c762 100644 --- a/sdv/data_processing/data_processor.py +++ b/sdv/data_processing/data_processor.py @@ -716,6 +716,7 @@ def reverse_transform(self, data, reset_keys=False): if self._keys and num_rows: generated_keys = self.generate_keys(num_rows, reset_keys) sampled_columns.extend(self._keys) + reversed_data[generated_keys.columns] = generated_keys[generated_keys.notna()] for constraint in reversed(self._constraints_to_reverse): reversed_data = constraint.reverse_transform(reversed_data) From 8cc966cdb341ad393ace7dd519e5674f16a846cf Mon Sep 17 00:00:00 2001 From: Andrew Montanez Date: Fri, 28 Jul 2023 16:57:29 -0500 Subject: [PATCH 3/4] adding unit tests --- sdv/data_processing/data_processor.py | 1 + .../data_processing/test_data_processor.py | 41 +++++++++++++------ 2 files changed, 29 insertions(+), 13 deletions(-) diff --git a/sdv/data_processing/data_processor.py b/sdv/data_processing/data_processor.py index 46b45c762..badc9a5a4 100644 --- a/sdv/data_processing/data_processor.py +++ b/sdv/data_processing/data_processor.py @@ -712,6 +712,7 @@ def reverse_transform(self, data, reset_keys=False): column_names=missing_columns ) sampled_columns.extend(missing_columns) + reversed_data[anonymized_data.columns] = anonymized_data[anonymized_data.notna()] if self._keys and num_rows: generated_keys = self.generate_keys(num_rows, reset_keys) diff --git a/tests/unit/data_processing/test_data_processor.py b/tests/unit/data_processing/test_data_processor.py index abc39732b..35a589a46 100644 --- a/tests/unit/data_processing/test_data_processor.py +++ b/tests/unit/data_processing/test_data_processor.py @@ -17,6 +17,7 @@ from sdv.errors import SynthesizerInputError from sdv.metadata.single_table import SingleTableMetadata from sdv.single_table.base import BaseSynthesizer +from tests.utils import DataFrameMatcher class TestDataProcessor: @@ -1821,7 +1822,7 @@ def test__transform_constraints_is_condition_false_returns_data(self): assert result.equals(expected_result) assert dp._constraints_to_reverse == [] - def test_reverse_transform(self): + def test_reverse_transform_blah(self): """Test the 
``reverse_transform`` method. This method should attempt to reverse transform all the columns using the @@ -1846,21 +1847,26 @@ def test_reverse_transform(self): dp = DataProcessor(SingleTableMetadata()) dp.fitted = True dp.metadata = Mock() - dp.metadata.columns = {'a': None, 'b': None, 'c': None, 'd': None} + dp.metadata.columns = {'a': None, 'b': None, 'c': None, 'key': None, 'd': None} data = pd.DataFrame({ 'a': [1, 2, 3], 'b': [True, True, False], 'c': ['d', 'e', 'f'], + }) + dp._keys = ['key'] dp._hyper_transformer = Mock() - dp._hyper_transformer.create_anonymized_columns.return_value = pd.DataFrame({ - 'd': ['a@gmail.com', 'b@gmail.com', 'c@gmail.com'] - }) + dp._hyper_transformer.create_anonymized_columns.side_effect = [ + pd.DataFrame({'d': ['a@gmail.com', 'b@gmail.com', 'c@gmail.com']}), + pd.DataFrame({'key': ['sdv_0', 'sdv_1', 'sdv_2']}) + ] dp._constraints_to_reverse = [constraint_mock] - dp._hyper_transformer.reverse_transform_subset.return_value = data + dp._hyper_transformer.reverse_transform_subset.return_value = data.copy() dp._hyper_transformer._output_columns = ['a', 'b', 'c'] dp._dtypes = pd.Series( - [np.float64, np.bool_, np.object_, np.object_], index=['a', 'b', 'c', 'd']) + [np.float64, np.bool_, np.object_, np.object_, np.object_], + index=['a', 'b', 'c', 'd', 'key'] + ) constraint_mock.reverse_transform.return_value = data # Run @@ -1872,20 +1878,29 @@ def test_reverse_transform(self): 'b': [True, True, False], 'c': ['d', 'e', 'f'] }) - constraint_mock.reverse_transform.assert_called_once_with(data) + expected_constraint_input = pd.DataFrame({ + 'a': [1, 2, 3], + 'b': [True, True, False], + 'c': ['d', 'e', 'f'], + 'd': ['a@gmail.com', 'b@gmail.com', 'c@gmail.com'], + 'key': ['sdv_0', 'sdv_1', 'sdv_2'] + }) + constraint_mock.reverse_transform.assert_called_once_with( + DataFrameMatcher(expected_constraint_input)) data_from_call = dp._hyper_transformer.reverse_transform_subset.mock_calls[0][1][0] pd.testing.assert_frame_equal(input_data, data_from_call) dp._hyper_transformer.reverse_transform_subset.assert_called_once() + dp._hyper_transformer.create_anonymized_columns.has_calls( + call(num_rows=3, column_names=['d']), + call(num_rows=3, column_names=['key']) + ) expected_output = pd.DataFrame({ 'a': [1., 2., 3.], 'b': [True, True, False], 'c': ['d', 'e', 'f'], - 'd': ['a@gmail.com', 'b@gmail.com', 'c@gmail.com'] + 'key': ['sdv_0', 'sdv_1', 'sdv_2'], + 'd': ['a@gmail.com', 'b@gmail.com', 'c@gmail.com'], }) - dp._hyper_transformer.create_anonymized_columns.assert_called_once_with( - num_rows=3, - column_names=['d'] - ) pd.testing.assert_frame_equal(reverse_transformed, expected_output) @patch('sdv.data_processing.data_processor.LOGGER') From ed4e9914ee3606aa2f71acc8c886430feeb6aeec Mon Sep 17 00:00:00 2001 From: Andrew Montanez Date: Mon, 31 Jul 2023 11:34:40 -0500 Subject: [PATCH 4/4] renaming test --- tests/unit/data_processing/test_data_processor.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/tests/unit/data_processing/test_data_processor.py b/tests/unit/data_processing/test_data_processor.py index 35a589a46..9f8994323 100644 --- a/tests/unit/data_processing/test_data_processor.py +++ b/tests/unit/data_processing/test_data_processor.py @@ -1822,7 +1822,7 @@ def test__transform_constraints_is_condition_false_returns_data(self): assert result.equals(expected_result) assert dp._constraints_to_reverse == [] - def test_reverse_transform_blah(self): + def test_reverse_transform(self): """Test the ``reverse_transform`` method. 
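A note on the helper introduced in patch 3: ``DataFrameMatcher`` comes from ``tests.utils``. Its implementation is not shown in this series, but given how it is passed to ``assert_called_once_with``, it is presumably an equality wrapper along these lines (an assumption, not the checked-in code):

    import pandas as pd

    class DataFrameMatcher:
        # Wraps an expected frame so that Mock's ``==`` argument comparison
        # delegates to pandas' strict DataFrame equality check.
        def __init__(self, expected):
            self.expected = expected

        def __eq__(self, other):
            try:
                pd.testing.assert_frame_equal(self.expected, other)
            except AssertionError:
                return False
            return True

Relatedly, ``create_anonymized_columns.has_calls(...)`` in the updated test is not a real ``Mock`` assertion (an arbitrary attribute access on a ``Mock`` silently succeeds), so ``assert_has_calls([call(...), call(...)])`` is the form that would actually verify those calls.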
This method should attempt to reverse transform all the columns using the
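Taken together, patches 2 and 3 reorder ``DataProcessor.reverse_transform`` so that anonymized columns and freshly generated keys are written back into the frame before the constraints are reversed, which is what lets a custom constraint (like the key-splitting one in the new integration test) read the ``key`` column. A condensed sketch of the resulting flow: the two ``reversed_data[...] = ...`` lines are the ones added in this series, while everything around them is heavily simplified:

    def reverse_transform(self, data, reset_keys=False):
        num_rows = len(data)
        reversed_data = self._hyper_transformer.reverse_transform_subset(data)

        # Anonymized (e.g. pii) columns are regenerated, then written back
        # into the frame right away (added in patch 3).
        if missing_columns and num_rows:  # 'missing_columns' is computed earlier (omitted here)
            anonymized_data = self._hyper_transformer.create_anonymized_columns(
                num_rows=num_rows, column_names=missing_columns)
            reversed_data[anonymized_data.columns] = anonymized_data[anonymized_data.notna()]

        # Key columns are generated and written back as well (added in patch 2) ...
        if self._keys and num_rows:
            generated_keys = self.generate_keys(num_rows, reset_keys)
            reversed_data[generated_keys.columns] = generated_keys[generated_keys.notna()]

        # ... so that by the time the constraints are reversed, they can
        # reference keys and anonymized columns, not just modeled columns.
        for constraint in reversed(self._constraints_to_reverse):
            reversed_data = constraint.reverse_transform(reversed_data)

        return reversed_data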