[WIP] adding additional tests for notebooks #117

Open

wants to merge 23 commits into base: main
Commits (23 total; changes shown from 17 commits)
7e9d075  added more tests and changed method of using testbook (kalset1, Jun 16, 2023)
0d0b828  removed hardcoding for number of cells to be executed and added metho… (kalset1, Jun 20, 2023)
8825ca4  cleared output of notebook (kalset1, Jun 20, 2023)
9021b85  fixed notebook file (kalset1, Jun 20, 2023)
9d96a71  added tests to mnist_dense (kalset1, Jun 20, 2023)
f620519  added tests for network_formulation and adjusted some approx values (kalset1, Jun 20, 2023)
f0ed25a  deleted empty row from neural_network notebook and restored original (kalset1, Jun 20, 2023)
dc13820  testing actions (kalset1, Jun 22, 2023)
7a5cbce  cleaned up linting - more work to do on documentation, comments, and … (carldlaird, Jun 23, 2023)
287b7a5  added check for empty code cells (kalset1, Jun 23, 2023)
f618ab5  formatting and linting w black and tox (kalset1, Jun 23, 2023)
f7d70f7  upping tolerances (kalset1, Jun 23, 2023)
397f0b9  added some comments for functions (kalset1, Jun 23, 2023)
d7d6fce  increased tolerances on autothermal notebooks (kalset1, Jun 23, 2023)
2e9fe22  merging kaloyans changes (carldlaird, Jun 24, 2023)
ad5fb79  increasing tolerance for neural_network_formulations notebook (kalset1, Jun 26, 2023)
a30608e  Merge pull request #1 from cog-imperial/notebook-tests-laird (kalset1, Jul 24, 2023)
2092339  changing the solver in notebooks (carldlaird, Jul 24, 2023)
f853c10  Merge branch 'notebook-tests' into notebook-tests-laird (carldlaird, Jul 24, 2023)
de8c581  Merge pull request #2 from cog-imperial/notebook-tests-laird (kalset1, Jul 24, 2023)
0b1e2b8  added comments, changed function names, and cleaned up some code (kalset1, Jul 25, 2023)
684d59f  increased neural_network_formulation tolerance and linting (kalset1, Jul 26, 2023)
8a7ff21  added test for bo_with_trees notebook (kalset1, Jul 26, 2023)
2 changes: 2 additions & 0 deletions setup.cfg
@@ -70,6 +70,7 @@ testing =
    pytest-cov
    testbook
    nbmake
+   nbformat
    tox
    flake8
    tensorflow
@@ -94,6 +95,7 @@ testing_lean =
    pytest-cov
    testbook
    nbmake
+   nbformat
    tox
    flake8
    ipywidgets
269 changes: 255 additions & 14 deletions tests/notebooks/test_run_notebooks.py
@@ -1,54 +1,295 @@
import os

import nbformat
import pytest
from pyomo.common.fileutils import this_file_dir
from testbook import testbook

from omlt.dependencies import keras_available, onnx_available

# TODO: We need to try to write these tests to rely more on internal consistency and less on absolute numbers and tolerances

# TODO: These will be replaced with stronger tests using testbook soon
def _test_run_notebook(folder, notebook_fname, n_cells):
    # change to notebook directory to allow testing
    cwd = os.getcwd()

# return testbook for given notebook
def open_book(folder, notebook_fname, **kwargs):
    execute = kwargs.get("execute", True)
Collaborator:
Can you use named arguments instead of **kwargs in these methods? Actual arguments provide better documentation for someone using the functions.
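For illustration, the kind of explicit-keyword signature being suggested might look like the sketch below (not part of the PR; the default values are assumptions):

    def open_book(folder, notebook_fname, execute=True):
        # change to the notebook directory, then hand back a testbook handle
        os.chdir(os.path.join(this_file_dir(), "..", "..", "docs", "notebooks", folder))
        return testbook(notebook_fname, execute=execute, timeout=300)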

    os.chdir(os.path.join(this_file_dir(), "..", "..", "docs", "notebooks", folder))
    with testbook(notebook_fname, timeout=300, execute=True) as tb:
        assert tb.code_cells_executed == n_cells
    os.chdir(cwd)
    book = testbook(notebook_fname, execute=execute, timeout=300)
Collaborator:
Do we know if this timeout is sufficiently large (but not too large)?

    return book


# checks that the number of executed cells matches the expected
def check_cell_execution(tb, notebook_fname, **kwargs):
    injections = kwargs.get("injections", 0)
    assert (
        tb.code_cells_executed
        == cell_counter(notebook_fname, only_code_cells=True) + injections
    )


# checks for correct type and number of layers in a model
def check_layers(tb, activations, network):
Collaborator:
It might be better if the function names matched what the function does (rather than what it is used for). This function actually injects code into the notebook. Maybe "inject_activation_check".

    tb.inject(
        f"""
activations = {activations}
for layer_id, layer in enumerate({network}):
    assert activations[layer_id] in str(layer.activation)
"""
    )


# counting number of cells
def cell_counter(notebook_fname, **kwargs):
Collaborator:
Similar thought here as above. How about "get_cell_count"?
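A signature reflecting this rename (and the earlier suggestion about named arguments) might look like the following, which is illustrative only:

    def get_cell_count(notebook_fname, only_code_cells=False):
        ...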

    only_code_cells = kwargs.get("only_code_cells", False)
    nb = nbformat.read(notebook_fname, as_version=4)
    nb = nbformat.validator.normalize(nb)[1]
    if only_code_cells:
        total = 0
        for cell in nb.cells:
            if cell["cell_type"] == "code" and len(cell["source"]) != 0:
                total += 1
        return total
    else:
        return len(nb.cells)


# gets model stats for mnist notebooks
def mnist_stats(tb, fname):
    total_cells = cell_counter(fname)
    tb.inject("test(model, test_loader)")
Collaborator:
What is this line doing? Can we add some more comments that describe what these (and other) lines are doing?
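    # (suggested clarifying comment, inferred from the surrounding code): the injected
    # "test(model, test_loader)" call runs the helper defined in the mnist notebooks,
    # which prints loss and accuracy on the test set; the lines below read that cell's
    # printed output and parse the two numbers out of it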

    model_stats = tb.cell_output_text(total_cells)
    model_stats = model_stats.split(" ")
    loss = float(model_stats[4][:-1])
    accuracy = int(model_stats[-2][:-6])
    return (loss, accuracy)


# neural network formulation notebook helper
def neural_network_checker(tb, ref_string, val1, val2, tolerance):
Collaborator:
Same comment here. We need some comments to help understand what these are doing.
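    # (suggested clarifying comment, inferred from the surrounding code): ref_string names
    # a two-element solution object in the notebook; both entries are pulled out with
    # tb.ref and compared against the expected values within the given tolerance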

    x = tb.ref(f"{ref_string}[0]")
    y = tb.ref(f"{ref_string}[1]")
    assert x == pytest.approx(val1, abs=tolerance)
    assert y == pytest.approx(val2, abs=tolerance)


@pytest.mark.skipif(not keras_available, reason="keras needed for this notebook")
def test_autothermal_relu_notebook():
    _test_run_notebook("neuralnet", "auto-thermal-reformer-relu.ipynb", 13)
    notebook_fname = "auto-thermal-reformer-relu.ipynb"
    book = open_book("neuralnet", notebook_fname)

    with book as tb:
        check_cell_execution(tb, notebook_fname)

        # check loss of model
        model_loss = tb.ref("nn.evaluate(x, y)")
        assert model_loss == pytest.approx(0.000389626, abs=0.00031)
Collaborator:
The model loss will not be consistent enough to check this way. I think we should just check if it is at least as small as some acceptable tolerance - just so we know if the network begins training more poorly for some reason.
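A sketch of the ceiling-style check being suggested (the threshold here is illustrative, not taken from the PR):

        # only require that the training loss stays below an acceptable ceiling
        assert model_loss < 1e-3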


        # check layers of model
        layers = ["relu", "relu", "relu", "relu", "linear"]
        check_layers(tb, layers, "nn.layers")

        # check final values
        bypassFraction = tb.ref("pyo.value(m.reformer.inputs[0])")
        ngRatio = tb.ref("pyo.value(m.reformer.inputs[1])")
        h2Conc = tb.ref("pyo.value(m.reformer.outputs[h2_idx])")
        n2Conc = tb.ref("pyo.value(m.reformer.outputs[n2_idx])")

        assert bypassFraction == 0.1
        assert ngRatio == pytest.approx(1.12, abs=0.05)
        assert h2Conc == pytest.approx(0.33, abs=0.03)
        assert n2Conc == pytest.approx(0.34, abs=0.01)


@pytest.mark.skipif(not keras_available, reason="keras needed for this notebook")
def test_autothermal_reformer():
    _test_run_notebook("neuralnet", "auto-thermal-reformer.ipynb", 13)
    notebook_fname = "auto-thermal-reformer.ipynb"
    book = open_book("neuralnet", notebook_fname)

    with book as tb:
        check_cell_execution(tb, notebook_fname)

        # check loss of model
        model_loss = tb.ref("nn.evaluate(x, y)")
        assert model_loss == pytest.approx(0.00024207, abs=0.00021)

        # check layers of model
        layers = ["sigmoid", "sigmoid", "sigmoid", "sigmoid", "linear"]
Collaborator:
I don't think these check layers are needed. More important that the numbers from OMLT are still good.

Author:
Yes, I think that makes sense. Do you think checking the layers of the imported models (the ones that are built first with pytorch and then converted using "load_onnx_neural_network_with_bounds") still makes sense? Or is that not needed?

        check_layers(tb, layers, "nn.layers")

        # check final values
        bypassFraction = tb.ref("pyo.value(m.reformer.inputs[0])")
        ngRatio = tb.ref("pyo.value(m.reformer.inputs[1])")
        h2Conc = tb.ref("pyo.value(m.reformer.outputs[h2_idx])")
        n2Conc = tb.ref("pyo.value(m.reformer.outputs[n2_idx])")

        assert bypassFraction == pytest.approx(0.1, abs=0.009)
        assert ngRatio == pytest.approx(1.12, abs=0.09)
        assert h2Conc == pytest.approx(0.33, abs=0.09)
        assert n2Conc == pytest.approx(0.34, abs=0.09)


def test_build_network():
    _test_run_notebook("neuralnet", "build_network.ipynb", 37)
    notebook_fname = "build_network.ipynb"
    book = open_book("neuralnet", notebook_fname)

    with book as tb:
        check_cell_execution(tb, notebook_fname)

        # check for correct layers
        layers = ["linear", "linear", "relu"]
        check_layers(tb, layers, "list(net.layers)")

        m_layers = tb.ref("list(m.neural_net.layer)")
        assert len(m_layers) == 3

        # check eval function
        eval_ex = list(tb.ref("x"))
        assert eval_ex[0] == pytest.approx(2.15)


@pytest.mark.skipif(
    (not onnx_available) or (not keras_available),
    reason="onnx and keras needed for this notebook",
)
def test_import_network():
    _test_run_notebook("neuralnet", "import_network.ipynb", 16)
    notebook_fname = "import_network.ipynb"
    book = open_book("neuralnet", notebook_fname, execute=False)

    with book as tb:
        # inject cell that reads in loss and accuracy of keras model
        # TODO: add something that checks where to inject code cell instead of hardcoding
        tb.inject(
            "keras_loss, keras_accuracy = model.evaluate(X, Y)", before=25, run=False
        )
        tb.execute()
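        # (sketch) one way to avoid hardcoding before=25: locate the target cell's index
        # by searching the notebook source with nbformat for a distinctive marker string
        # (the marker below is a hypothetical placeholder, not taken from the notebook):
        #     nb = nbformat.read(notebook_fname, as_version=4)
        #     inject_before = next(
        #         i for i, c in enumerate(nb.cells) if "<marker text>" in c.source
        #     )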

        check_cell_execution(tb, notebook_fname, injections=1)

        # check input bounds
        input_bounds = tb.ref("input_bounds")
        assert input_bounds == [
            [0.0, 17.0],
            [0.0, 199.0],
            [0.0, 122.0],
            [0.0, 99.0],
            [0.0, 846.0],
            [0.0, 67.1],
            [0.078, 2.42],
            [21.0, 81.0],
        ]

        # checking accuracy and loss of keras model
        keras_loss, keras_accuracy = tb.ref("keras_loss"), tb.ref("keras_accuracy")
        assert keras_loss == pytest.approx(5.4, abs=4.8)
        assert keras_accuracy == pytest.approx(0.48, abs=0.21)

        # checking loss of pytorch model
        pytorch_loss = tb.ref("loss.item()")
        assert pytorch_loss == pytest.approx(0.25, abs=0.1)

        # checking the model that was imported
        imported_input_bounds = tb.ref("network_definition.scaled_input_bounds")
        assert imported_input_bounds == {
            "0": [0.0, 17.0],
            "1": [0.0, 199.0],
            "2": [0.0, 122.0],
            "3": [0.0, 99.0],
            "4": [0.0, 846.0],
            "5": [0.0, 67.1],
            "6": [0.078, 2.42],
            "7": [21.0, 81.0],
        }

        # checking the imported layers
        layers = ["linear", "relu", "relu", "linear"]
        check_layers(tb, layers, "network_definition.layers")


@pytest.mark.skipif(not onnx_available, reason="onnx needed for this notebook")
def test_mnist_example_convolutional():
    _test_run_notebook("neuralnet", "mnist_example_convolutional.ipynb", 13)
    notebook_fname = "mnist_example_convolutional.ipynb"
    book = open_book("neuralnet", notebook_fname)

    with book as tb:
        check_cell_execution(tb, notebook_fname)

        # checking training accuracy
        loss, accuracy = mnist_stats(tb, notebook_fname)
        # TODO: These rel and abs tolerances are too specific - fragile?
        assert loss == pytest.approx(0.3, abs=0.24)
        assert accuracy / 10000 == pytest.approx(0.91, abs=0.09)

        # checking the imported layers
        layers = ["linear", "relu", "relu", "relu", "linear"]
        check_layers(tb, layers, "network_definition.layers")

        # checking optimal solution
        optimal_sol = tb.ref(
            "-(pyo.value(m.nn.outputs[0,adversary]-m.nn.outputs[0,label]))"
        )
        assert optimal_sol == pytest.approx(11, abs=6.9)


@pytest.mark.skipif(not onnx_available, reason="onnx needed for this notebook")
def test_mnist_example_dense():
    _test_run_notebook("neuralnet", "mnist_example_dense.ipynb", 13)
    notebook_fname = "mnist_example_dense.ipynb"
    book = open_book("neuralnet", notebook_fname)

    with book as tb:
        check_cell_execution(tb, notebook_fname)

        # checking training accuracy
        loss, accuracy = mnist_stats(tb, notebook_fname)
        assert loss == pytest.approx(0.0867, abs=0.09)
        assert accuracy / 10000 == pytest.approx(0.93, abs=0.07)

        # checking the imported layers
        layers = ["linear", "relu", "relu", "linear"]
        check_layers(tb, layers, "network_definition.layers")

        # checking optimal solution
        optimal_sol = tb.ref(
            "-(pyo.value(m.nn.outputs[adversary]-m.nn.outputs[label]))"
        )
        assert optimal_sol == pytest.approx(5, abs=3.3)


@pytest.mark.skipif(not keras_available, reason="keras needed for this notebook")
def test_neural_network_formulations():
    _test_run_notebook("neuralnet", "neural_network_formulations.ipynb", 21)
    notebook_fname = "neural_network_formulations.ipynb"
    book = open_book("neuralnet", notebook_fname)

    with book as tb:
        check_cell_execution(tb, notebook_fname)

        # checking loss of keras models
        losses = [
            tb.ref(f"nn{x + 1}.evaluate(x=df['x_scaled'], y=df['y_scaled'])")
            for x in range(3)
        ]
        assert losses[0] == pytest.approx(0.000534, abs=0.001)
        assert losses[1] == pytest.approx(0.000691, abs=0.001)
        assert losses[2] == pytest.approx(0.006, abs=0.005)

        # checking scaled input bounds
        scaled_input = tb.ref("input_bounds[0]")
        assert scaled_input[0] == pytest.approx(-1.73179, abs=0.3)
        assert scaled_input[1] == pytest.approx(1.73179, abs=0.3)

        # checking optimal solutions
        neural_network_checker(tb, "solution_1_reduced", -0.8, 0.8, 2.4)
        neural_network_checker(tb, "solution_1_full", -0.27382, -0.86490, 2.4)
        neural_network_checker(tb, "solution_2_comp", -0.29967, -0.84415, 2.4)
        neural_network_checker(tb, "solution_2_bigm", -0.29967, -0.84414, 2.4)
        neural_network_checker(tb, "solution_3_mixed", -0.23955, -0.90598, 2.4)


@pytest.mark.skipif(not onnx_available, reason="onnx needed for this notebook")
def test_bo_with_trees():
    notebook_fname = "bo_with_trees.ipynb"
    book = open_book("", notebook_fname)

    with book as tb:
        check_cell_execution(tb, notebook_fname)

        # not sure what to put here...