ML for Developers

This commit is contained in:
GokuMohandas
2023-07-26 04:53:11 -07:00
commit 776a75b010
54 changed files with 55464 additions and 0 deletions

13
tests/code/conftest.py Normal file
View File

@@ -0,0 +1,13 @@
import pytest
from madewithml.data import CustomPreprocessor
@pytest.fixture
def dataset_loc():
    """Location of the raw projects dataset used across the code tests."""
    url = "https://raw.githubusercontent.com/GokuMohandas/Made-With-ML/main/datasets/dataset.csv"
    return url
@pytest.fixture
def preprocessor():
    """Fresh (unfitted) CustomPreprocessor instance per test."""
    instance = CustomPreprocessor()
    return instance

58
tests/code/test_data.py Normal file
View File

@@ -0,0 +1,58 @@
import pandas as pd
import pytest
import ray
from madewithml import data
@pytest.fixture(scope="module")
def df():
    """Minimal one-row DataFrame with the columns preprocess() expects.

    Fix: the original bound the row list to a local named ``data``, which
    shadowed the imported ``madewithml.data`` module inside the fixture;
    renamed it to ``rows``.
    """
    rows = [{"title": "a0", "description": "b0", "tag": "c0"}]
    return pd.DataFrame(rows)
@pytest.fixture(scope="module")
def class_to_index():
    """Static label-to-index mapping shared by this module's tests."""
    return {"c0": 0, "c1": 1}
def test_load_data(dataset_loc):
    """load_data should return exactly the requested number of samples."""
    expected = 10
    ds = data.load_data(dataset_loc=dataset_loc, num_samples=expected)
    assert ds.count() == expected
def test_stratify_split():
    """A 50/50 stratified split should leave identical class counts on both sides."""
    per_class = 10
    labels = ["c1"] * per_class + ["c2"] * per_class
    ds = ray.data.from_items([{"target": label} for label in labels])
    train_ds, test_ds = data.stratify_split(ds, stratify="target", test_size=0.5)
    counts_train = train_ds.to_pandas().target.value_counts().to_dict()
    counts_test = test_ds.to_pandas().target.value_counts().to_dict()
    assert counts_train == counts_test
@pytest.mark.parametrize(
    "text, sw, clean_text",
    [
        ("hi", [], "hi"),
        ("hi you", ["you"], "hi"),
        ("hi yous", ["you"], "hi yous"),
    ],
)
def test_clean_text(text, sw, clean_text):
    """Stopword removal strips whole tokens only (substrings survive)."""
    cleaned = data.clean_text(text=text, stopwords=sw)
    assert cleaned == clean_text
def test_preprocess(df, class_to_index):
    """preprocess should produce tokenized ids, masks, and encoded targets."""
    # The raw fixture has no combined "text" column yet.
    assert "text" not in df.columns
    expected_keys = {"ids", "masks", "targets"}
    outputs = data.preprocess(df, class_to_index=class_to_index)
    assert set(outputs) == expected_keys
def test_fit_transform(dataset_loc, preprocessor):
    """Fitting on the full dataset should discover all four classes."""
    ds = data.load_data(dataset_loc=dataset_loc)
    preprocessor.fit_transform(ds)
    num_classes = len(preprocessor.class_to_index)
    assert num_classes == 4

View File

@@ -0,0 +1,11 @@
from madewithml import predict
def test_decode():
    """decode maps each index through index_to_class, preserving order."""
    index_to_class = {0: "x", 1: "y"}
    decoded = predict.decode(indices=[0, 1, 1], index_to_class=index_to_class)
    assert decoded == ["x", "y", "y"]
def test_format_prob():
    """format_prob pairs class names with their probabilities."""
    index_to_class = {0: "x", 1: "y"}
    result = predict.format_prob(prob=[0.1, 0.9], index_to_class=index_to_class)
    assert result == {"x": 0.1, "y": 0.9}

27
tests/code/test_train.py Normal file
View File

@@ -0,0 +1,27 @@
import json
import pytest
import utils
from madewithml import train
@pytest.mark.training
def test_train_model(dataset_loc):
    """Smoke-train for two epochs and verify the training loss decreases.

    Fix: the original built ``metrics_dataframe.to_dict()["train_loss"]`` —
    a dict keyed by row index — but named it ``train_loss_list``; extract
    the column as an actual list instead.
    """
    experiment_name = utils.generate_experiment_name(prefix="test_train")
    train_loop_config = {"dropout_p": 0.5, "lr": 1e-4, "lr_factor": 0.8, "lr_patience": 3}
    result = train.train_model(
        experiment_name=experiment_name,
        dataset_loc=dataset_loc,
        train_loop_config=json.dumps(train_loop_config),
        num_workers=6,
        cpu_per_worker=1,
        gpu_per_worker=0,
        num_epochs=2,
        num_samples=512,
        batch_size=256,
        results_fp=None,
    )
    # Clean up the MLflow experiment before asserting so it never leaks.
    utils.delete_experiment(experiment_name=experiment_name)
    train_loss_list = result.metrics_dataframe["train_loss"].tolist()
    assert train_loss_list[0] > train_loss_list[1]  # loss decreased

37
tests/code/test_tune.py Normal file
View File

@@ -0,0 +1,37 @@
import json
import pytest
import utils
from madewithml import tune
@pytest.mark.training
def test_tune_models(dataset_loc):
    """Run a small tuning sweep and verify one result row per trial."""
    num_runs = 2
    experiment_name = utils.generate_experiment_name(prefix="test_tune")
    train_loop_config = {
        "dropout_p": 0.5,
        "lr": 1e-4,
        "lr_factor": 0.8,
        "lr_patience": 3,
    }
    initial_params = [{"train_loop_config": train_loop_config}]
    results = tune.tune_models(
        experiment_name=experiment_name,
        dataset_loc=dataset_loc,
        initial_params=json.dumps(initial_params),
        num_workers=6,
        cpu_per_worker=1,
        gpu_per_worker=0,
        num_runs=num_runs,
        num_epochs=1,
        num_samples=512,
        batch_size=256,
        results_fp=None,
    )
    # Clean up the MLflow experiment before asserting so it never leaks.
    utils.delete_experiment(experiment_name=experiment_name)
    assert len(results.get_dataframe()) == num_runs

61
tests/code/test_utils.py Normal file
View File

@@ -0,0 +1,61 @@
import tempfile
from pathlib import Path
import numpy as np
import pytest
import torch
from madewithml import utils
def test_set_seed():
    """Re-seeding must reproduce the same sequence of random draws."""
    utils.set_seeds()
    first_draws = [np.random.randn(2, 3) for _ in range(2)]
    utils.set_seeds()
    second_draws = [np.random.randn(2, 3) for _ in range(2)]
    for before, after in zip(first_draws, second_draws):
        assert np.array_equal(before, after)
def test_save_and_load_dict():
    """A dict saved with save_dict round-trips through load_dict."""
    original = {"hello": "world"}
    with tempfile.TemporaryDirectory() as dp:
        fp = Path(dp, "d.json")
        utils.save_dict(d=original, path=fp)
        loaded = utils.load_dict(path=fp)  # load before the temp dir vanishes
    assert loaded["hello"] == "world"
def test_pad_array():
    """pad_array right-pads ragged rows with zeros to a uniform length."""
    ragged = np.array([[1, 2], [1, 2, 3]], dtype="object")
    expected = np.array([[1, 2, 0], [1, 2, 3]])
    assert np.array_equal(utils.pad_array(ragged), expected)
def test_collate_fn():
    """collate_fn pads ragged arrays and converts each field to a typed tensor."""
    batch = {
        "ids": np.array([[1, 2], [1, 2, 3]], dtype="object"),
        "masks": np.array([[1, 1], [1, 1, 1]], dtype="object"),
        "targets": np.array([3, 1]),
    }
    expected_batch = {
        "ids": torch.tensor([[1, 2, 0], [1, 2, 3]], dtype=torch.int32),
        "masks": torch.tensor([[1, 1, 0], [1, 1, 1]], dtype=torch.int32),
        "targets": torch.tensor([3, 1], dtype=torch.int64),
    }
    processed_batch = utils.collate_fn(batch)
    for key, expected in expected_batch.items():
        assert torch.allclose(processed_batch[key], expected)
@pytest.mark.parametrize(
    "d, keys, expected",
    [
        ({"a": [1, 2], "b": [1, 2]}, ["a", "b"], [{"a": 1, "b": 1}, {"a": 2, "b": 2}]),
        ({"a": [1, 2], "b": [1, 2]}, ["a"], [{"a": 1}, {"a": 2}]),
    ],
)
def test_dict_to_list(d, keys, expected):
    """dict_to_list converts a dict of columns into a list of row dicts.

    Fix: renamed the third parameter from ``list`` (which shadowed the
    builtin) to ``expected``, in both the signature and the argnames string.
    """
    assert utils.dict_to_list(d, keys=keys) == expected

13
tests/code/utils.py Normal file
View File

@@ -0,0 +1,13 @@
import uuid
from madewithml.config import mlflow
def generate_experiment_name(prefix: str = "test") -> str:
    """Return a unique experiment name of the form ``<prefix>-<8 hex chars>``."""
    suffix = uuid.uuid4().hex[:8]
    return "-".join([prefix, suffix])
def delete_experiment(experiment_name: str) -> None:
    """Delete the named MLflow experiment (assumes it exists)."""
    client = mlflow.tracking.MlflowClient()
    experiment = client.get_experiment_by_name(experiment_name)
    client.delete_experiment(experiment_id=experiment.experiment_id)

17
tests/data/conftest.py Normal file
View File

@@ -0,0 +1,17 @@
import great_expectations as ge
import pandas as pd
import pytest
def pytest_addoption(parser):
    """Register the --dataset-loc CLI option used by the data tests.

    Ex: pytest --dataset-loc=$DATASET_LOC tests/data --verbose --disable-warnings
    """
    parser.addoption(
        "--dataset-loc",
        action="store",
        default=None,
        help="Dataset location.",
    )
@pytest.fixture(scope="module")
def df(request):
    """Load the CSV from --dataset-loc as a Great Expectations dataset."""
    dataset_loc = request.config.getoption("--dataset-loc")
    raw = pd.read_csv(dataset_loc)
    return ge.dataset.PandasDataset(raw)

View File

@@ -0,0 +1,15 @@
def test_dataset(df):
    """Test dataset quality and integrity."""
    # Schema adherence: exact column order.
    df.expect_table_columns_to_match_ordered_list(
        column_list=["id", "created_on", "title", "description", "tag"]
    )
    # Expected labels only.
    tags = ["computer-vision", "natural-language-processing", "mlops", "other"]
    df.expect_column_values_to_be_in_set(column="tag", value_set=tags)
    # Data leaks: no duplicate (title, description) pairs.
    df.expect_compound_columns_to_be_unique(column_list=["title", "description"])
    # Missing values.
    df.expect_column_values_to_not_be_null(column="tag")
    # Unique identifiers.
    df.expect_column_values_to_be_unique(column="id")
    # Type adherence.
    df.expect_column_values_to_be_of_type(column="title", type_="str")
    # Validate the accumulated suite; only failures come back in the report.
    expectation_suite = df.get_expectation_suite(discard_failed_expectations=False)
    report = df.validate(expectation_suite=expectation_suite, only_return_failures=True)
    results = report.to_json_dict()
    assert results["success"]

20
tests/model/conftest.py Normal file
View File

@@ -0,0 +1,20 @@
import pytest
from ray.train.torch.torch_predictor import TorchPredictor
from madewithml import predict
def pytest_addoption(parser):
    """Register the --run-id CLI option identifying which trained model to test."""
    parser.addoption(
        "--run-id",
        action="store",
        default=None,
        help="Run ID of model to use.",
    )
@pytest.fixture(scope="module")
def run_id(request):
    """MLflow run ID passed on the command line via --run-id."""
    value = request.config.getoption("--run-id")
    return value
@pytest.fixture(scope="module")
def predictor(run_id):
    """TorchPredictor restored from the run's best checkpoint."""
    best_checkpoint = predict.get_best_checkpoint(run_id=run_id)
    return TorchPredictor.from_checkpoint(best_checkpoint)

View File

@@ -0,0 +1,65 @@
import pytest
import utils
@pytest.mark.parametrize(
    "input_a, input_b, label",
    [
        (
            "Transformers applied to NLP have revolutionized machine learning.",
            "Transformers applied to NLP have disrupted machine learning.",
            "natural-language-processing",
        ),
    ],
)
def test_invariance(input_a, input_b, label, predictor):
    """INVariance via verb injection (changes should not affect outputs)."""
    predictions = [utils.get_label(text=text, predictor=predictor) for text in (input_a, input_b)]
    assert predictions == [label, label]
@pytest.mark.parametrize(
    "text, label",
    [
        (
            "ML applied to text classification.",
            "natural-language-processing",
        ),
        (
            "ML applied to image classification.",
            "computer-vision",
        ),
        (
            "CNNs for text classification.",
            "natural-language-processing",
        ),
    ],
)
def test_directional(text, label, predictor):
    """DIRectional expectations (changes with known outputs).

    Fix: renamed the ``input`` parameter, which shadowed the builtin, to
    ``text`` (argnames string updated to match).
    """
    prediction = utils.get_label(text=text, predictor=predictor)
    assert label == prediction
@pytest.mark.parametrize(
    "text, label",
    [
        (
            "Natural language processing is the next big wave in machine learning.",
            "natural-language-processing",
        ),
        (
            "MLOps is the next big wave in machine learning.",
            "mlops",
        ),
        (
            "This is about graph neural networks.",
            "other",
        ),
    ],
)
def test_mft(text, label, predictor):
    """Minimum Functionality Tests (simple input/output pairs).

    Fix: renamed the ``input`` parameter, which shadowed the builtin, to
    ``text`` (argnames string updated to match).
    """
    prediction = utils.get_label(text=text, predictor=predictor)
    assert label == prediction

12
tests/model/utils.py Normal file
View File

@@ -0,0 +1,12 @@
import numpy as np
import pandas as pd
from madewithml import predict
def get_label(text, predictor):
    """Predict the class label for a single piece of text.

    Builds a one-row frame in the schema the predictor expects (the
    description/tag values are placeholders) and decodes the argmax class.
    """
    sample = pd.DataFrame({"title": [text], "description": "", "tag": "other"})
    predictions = predictor.predict(data=sample)["predictions"]
    preprocessor = predictor.get_preprocessor()
    index_to_class = preprocessor.index_to_class
    return predict.decode(np.stack(predictions).argmax(1), index_to_class)[0]