Source code for evalml.demos.fraud
"""Load the credit card fraud dataset, which can be used for binary classification problems."""
import evalml
from evalml.preprocessing import load_data
[docs]def load_fraud(n_rows=None, verbose=True):
    """Load credit card fraud dataset.
    The fraud dataset can be used for binary classification problems.
    Args:
        n_rows (int): Number of rows from the dataset to return
        verbose (bool): Whether to print information about features and labels
    Returns:
        (pd.Dataframe, pd.Series): X and y
    """
    fraud_data_path = (
        "https://oss.alteryx.com/datasets/fraud_transactions.csv.gz?library=evalml&version="
        + evalml.__version__
    )
    X, y = load_data(
        path=fraud_data_path,
        index="id",
        target="fraud",
        compression="gzip",
        n_rows=n_rows,
        verbose=verbose,
    )
    X.ww.set_types(logical_types={"provider": "Categorical", "region": "Categorical"})
    return X, y