from __future__ import print_function
import os, sys, pickle, pprint
import numpy as np
import pyqtgraph as pg
from .. import AUDIT_TESTS


class UserTester(object):
    """
    Base class for testing when a human is required to verify the results.

    When a test is passed by the user, its output is saved and used as a basis
    for future tests. If future test results do not match the stored results,
    then the user is asked to decide whether to fail the test, or pass the
    test and store new results.

    Subclasses must reimplement run_test() to return a dictionary of results
    to store. Optionally, compare_results and audit_result may also be
    reimplemented to customize the testing behavior.

    By default, test results are stored in a 'test_data' directory relative
    to the file that defines the UserTester subclass in use.
    """

    data_dir = "test_data"

    def __init__(self, key, *args, **kwds):
        """Initialize with a string *key* that provides a short, unique
        description of this test. All other arguments are passed to run_test().

        *key* is used to determine the file name for storing test results.
        """
        self.audit = AUDIT_TESTS
        self.key = key
        self.rtol = 1e-3
        self.args = args
        self.assert_test_info(*args, **kwds)

    def run_test(self, *args, **kwds):
        """
        Execute the test. All arguments are taken from __init__.
        Return a picklable dictionary of test results.
        """
        raise NotImplementedError()

    def compare_results(self, key, info, expect):
        """
        Compare the current test result *info* against the previously stored
        result *expect*. If *expect* is None, then no previous result was
        stored.

        If *info* and *expect* do not match, raise an exception.
        """
        # Check that the test structures are the same
        assert type(info) is type(expect)
        if hasattr(info, "__len__"):
            assert len(info) == len(expect)

        if isinstance(info, dict):
            for k in info:
                assert k in expect
            for k in expect:
                assert k in info
                self.compare_results(k, info[k], expect[k])
        elif isinstance(info, list):
            for i in range(len(info)):
                self.compare_results(key, info[i], expect[i])
        elif isinstance(info, np.ndarray):
            assert info.shape == expect.shape
            if len(info) == 0:
                return
            # assert info.dtype == expect.dtype
            if info.dtype.fields is None:
                intnan = -9223372036854775808  # happens when np.nan is cast to int
                inans = np.isnan(info) | (info == intnan)
                enans = np.isnan(expect) | (expect == intnan)
                assert np.all(inans == enans)
                mask = ~inans
                if not np.allclose(info[mask], expect[mask], rtol=self.rtol):
                    print(
                        "\nComparing data array, shapes match: ",
                        info.shape == expect.shape,
                    )
                    print("Model tested: %s, measure: %s" % (self.key, key))
                    # print( 'args: ', dir(self.args[0]))
                    print("Array expected: ", expect[mask])
                    print("Array received: ", info[mask])
                    try:
                        self.args[0].print_all_mechs()
                    except Exception:
                        print("args[0] is string: ", self.args[0])
                    assert np.allclose(info[mask], expect[mask], rtol=self.rtol)
            else:
                for k in info.dtype.fields.keys():
                    self.compare_results(k, info[k], expect[k])
        elif np.isscalar(info):
            if not np.allclose(info, expect, rtol=self.rtol):
                print("Comparing scalar data, model: %s, measure: %s" % (self.key, key))
                # print 'args: ', dir(self.args[0])
                print(
                    "Expected: ",
                    expect,
                    ", received: ",
                    info,
                    " relative tolerance: ",
                    self.rtol,
                )
                if isinstance(self.args[0], str):
                    pass
                    # print ': ', str
                else:
                    self.args[0].print_all_mechs()
                assert np.allclose(info, expect, rtol=self.rtol)
        else:
            try:
                assert info == expect
            except AssertionError:
                raise
            except Exception:
                raise NotImplementedError(
                    "Cannot compare objects of type %s" % type(info)
                )

    def audit_result(self, info, expect):
        """Display results and ask the user to decide whether the test passed.
        Return True for pass, False for fail.

        If *expect* is None, then no previous test results were stored.
        """
        app = pg.mkQApp()
        print("\n=== New test results for %s: ===\n" % self.key)
        pprint.pprint(info)

        # We use DiffTreeWidget to display differences between large data
        # structures, but this is not present in mainline pyqtgraph yet.
        if hasattr(pg, "DiffTreeWidget"):
            win = pg.DiffTreeWidget()
        else:
            from cnmodel.util.difftreewidget import DiffTreeWidget

            win = DiffTreeWidget()

        win.resize(800, 800)
        win.setData(expect, info)
        win.show()
        print("Store new test results? [y/n]")
        yn = input()
        win.hide()
        return yn.lower().startswith("y")

    def assert_test_info(self, *args, **kwds):
        """
        Run the test and raise an exception if the results do not match
        previously stored data.
        """
        result = self.run_test(*args, **kwds)
        expect = self.load_test_result()
        try:
            assert expect is not None
            self.compare_results(None, result, expect)
        except Exception:
            if not self.audit:
                if expect is None:
                    raise Exception(
                        "No prior test results for test '%s'. "
                        "Run test.py --audit to store new test data." % self.key
                    )
                else:
                    raise

            store = self.audit_result(result, expect)
            if store:
                self.save_test_result(result)
            else:
                raise Exception("Rejected test results for '%s'" % self.key)

    def result_file(self):
        """
        Return a file name to be used for storing / retrieving test results
        given *self.key*.
        """
        modfile = sys.modules[self.__class__.__module__].__file__
        path = os.path.dirname(modfile)
        return os.path.join(path, self.data_dir, self.key + ".pk")

    def load_test_result(self):
        """
        Load prior test results for *self.key*.
        If there are no prior results, return None.
        """
        fn = self.result_file()
        if os.path.isfile(fn):
            return pickle.load(open(fn, "rb"), encoding="latin1")
        return None

    def save_test_result(self, result):
        """
        Store test results for *self.key*.
        The *result* argument must be picklable.
        """
        fn = self.result_file()
        dirname = os.path.dirname(fn)
        if not os.path.isdir(dirname):
            os.mkdir(dirname)
        pickle.dump(result, open(fn, "wb"))
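

# Usage sketch (illustrative only; not part of the original module). A concrete
# tester reimplements run_test() to return a picklable dict of results;
# instantiating it runs the test, compares the dict against test_data/<key>.pk
# with relative tolerance self.rtol, and, when tests are run with --audit,
# lets the user inspect and store new reference data. The names
# ExampleRampTester, test_ramp, and the key "ramp_basic" are hypothetical.
#
#     class ExampleRampTester(UserTester):
#         def run_test(self, n_points, slope):
#             # Any picklable structure works; ndarrays are compared
#             # element-wise after masking NaN values.
#             return {"ramp": np.arange(n_points) * slope, "slope": slope}
#
#     def test_ramp():
#         # The key determines the result file: test_data/ramp_basic.pk
#         ExampleRampTester("ramp_basic", 20, 0.5)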