Source code for sasmodels.model_test

# -*- coding: utf-8 -*-
"""
Run model unit tests.

Usage::

    python -m sasmodels.model_test [opencl|cuda|dll|all] model1 model2 ...

If model1 is 'all', then all except the remaining models will be tested.
Subgroups are also possible, such as 'py', 'single' or '1d'.  See
:func:`.core.list_models` for details.

Each model is tested using the default parameters at q=0.1, (qx, qy)=(0.1, 0.1),
and Fq is called to make sure R_eff, volume and volume ratio are computed.
The return values at these points are not considered.  The test is only to
verify that the models run to completion, and do not produce inf or NaN.

Tests are defined with the *tests* attribute in the model.py file.  *tests*
is a list of individual tests to run, where each test consists of the
parameter values for the test, the q-values and the expected results.  For
the effective radius test and volume ratio tests, use the extended output
form, which checks each output of kernel.Fq. For 1-D tests, either specify
the q value or a list of q-values, and the corresponding I(q) value, or
list of I(q) values.

That is::

    tests = [
        [ {parameters}, q, I(q)],
        [ {parameters}, [q], [I(q)] ],
        [ {parameters}, [q1, q2, ...], [I(q1), I(q2), ...]],

        [ {parameters}, (qx, qy), I(qx, Iqy)],
        [ {parameters}, [(qx1, qy1), (qx2, qy2), ...],
                        [I(qx1, qy1), I(qx2, qy2), ...]],

        [ {parameters}, q, F(q), F^2(q), R_eff, V, V_r ],
        ...
    ]

Parameters are *key:value* pairs, where key is one of the parameters of the
model and value is the value to use for the test.  Any parameters not given
in the parameter list will take on the default parameter value.

Precision defaults to 5 digits (relative).
"""
from __future__ import print_function

import argparse
import sys
import unittest
import traceback

try:
    from StringIO import StringIO
except ImportError:
    # StringIO.StringIO renamed to io.StringIO in Python 3
    # Note: io.StringIO exists in python 2, but using unicode instead of str
    from io import StringIO

import numpy as np  # type: ignore

from .core import list_models, load_model_info, build_model
from .direct_model import call_kernel, call_Fq
from .exception import annotate_exception
from .modelinfo import expand_pars
from .kernelcl import use_opencl
from .kernelcuda import use_cuda
from . import product

# pylint: disable=unused-import
try:
    from typing import List, Iterator, Callable, Any, Dict, Tuple, Union
    from .modelinfo import ParameterTable, ParameterSet, TestCondition, ModelInfo
    from .kernel import KernelModel
    DType = Union[None, str, np.dtype]
except ImportError:
    pass
# pylint: enable=unused-import

[docs]def make_suite(loaders, models): # type: (List[str], List[str]) -> unittest.TestSuite """ Construct the pyunit test suite. *loaders* is the list of kernel drivers to use (dll, opencl or cuda). For python model the python driver is always used. *models* is the list of models to test, or *["all"]* to test all models. """ suite = unittest.TestSuite() try: # See if the first model parses as a model group group = list_models(models[0]) skip = models[1:] models = group except Exception: skip = [] for model_name in models: if model_name not in skip: model_info = load_model_info(model_name) _add_model_to_suite(loaders, suite, model_info) return suite
def _add_model_to_suite(loaders, suite, model_info): ModelTestCase = _hide_model_case_from_nose() #print('------') #print('found tests in', model_name) #print('------') # if ispy then use the dll loader to call pykernel # don't try to call cl kernel since it will not be # available in some environmentes. is_py = callable(model_info.Iq) # Some OpenCL drivers seem to be flaky, and are not producing the # expected result. Since we don't have known test values yet for # all of our models, we are instead going to compare the results # for the 'smoke test' (that is, evaluation at q=0.1 for the default # parameters just to see that the model runs to completion) between # the OpenCL and the DLL. To do this, we define a 'stash' which is # shared between OpenCL and DLL tests. This is just a list. If the # list is empty (which it will be when DLL runs, if the DLL runs # first), then the results are appended to the list. If the list # is not empty (which it will be when OpenCL runs second), the results # are compared to the results stored in the first element of the list. # This is a horrible stateful hack which only makes sense because the # test suite is thrown away after being run once. stash = [] if is_py: # kernel implemented in python test_name = "%s[python]"%model_info.name test_method_name = "test_%s_python" % model_info.id test = ModelTestCase(test_name, model_info, test_method_name, platform="dll", # so that dtype="double", stash=stash) suite.addTest(test) else: # kernel implemented in C # test using dll if desired if 'dll' in loaders or not use_opencl(): test_name = "%s[dll]"%model_info.name test_method_name = "test_%s_dll" % model_info.id test = ModelTestCase(test_name, model_info, test_method_name, platform="dll", dtype="double", stash=stash) suite.addTest(test) # test using opencl if desired and available if 'opencl' in loaders and use_opencl(): test_name = "%s[opencl]"%model_info.name test_method_name = "test_%s_opencl" % model_info.id # Using dtype=None so that the models that are only # correct for double precision are not tested using # single precision. The choice is determined by the # presence of *single=False* in the model file. test = ModelTestCase(test_name, model_info, test_method_name, platform="ocl", dtype=None, stash=stash) #print("defining", test_name) suite.addTest(test) # test using cuda if desired and available if 'cuda' in loaders and use_cuda(): test_name = "%s[cuda]" % model_info.id test_method_name = "test_%s_cuda" % model_info.id # Using dtype=None so that the models that are only # correct for double precision are not tested using # single precision. The choice is determined by the # presence of *single=False* in the model file. test = ModelTestCase(test_name, model_info, test_method_name, platform="cuda", dtype=None, stash=stash) #print("defining", test_name) suite.addTest(test) def _hide_model_case_from_nose(): # type: () -> type class ModelTestCase(unittest.TestCase): """ Test suit for a particular model with a particular kernel driver. The test suite runs a simple smoke test to make sure the model functions, then runs the list of tests at the bottom of the model description file. """ def __init__(self, test_name, model_info, test_method_name, platform, dtype, stash): # type: (str, ModelInfo, str, str, DType, List[Any]) -> None self.test_name = test_name self.info = model_info self.platform = platform self.dtype = dtype self.stash = stash # container for the results of the first run self._failures = [] # Set of failed target values setattr(self, test_method_name, self.run_all) unittest.TestCase.__init__(self, test_method_name) def run_all(self): # type: () -> None """ Run all the tests in the test suite, including smoke tests. """ smoke_tests = [ # test validity at reasonable values ({}, 0.1, None), ({}, (0.1, 0.1), None), # test validity at q = 0 #({}, 0.0, None), #({}, (0.0, 0.0), None), # test vector form ({}, [0.001, 0.01, 0.1], [None]*3), ({}, [(0.1, 0.1)]*2, [None]*2), # test that Fq will run, and return R_eff, V, V_r ({}, 0.1, None, None, None, None, None), ] tests = smoke_tests #tests = [] if self.info.tests is not None: tests += self.info.tests S_tests = [test for test in tests if '@S' in test[0]] P_tests = [test for test in tests if '@S' not in test[0]] del self._failures[:] try: model = build_model(self.info, dtype=self.dtype, platform=self.platform) results = [self.run_one(model, test) for test in P_tests] for test in S_tests: # pull the S model name out of the test defn pars = test[0].copy() s_name = pars.pop('@S') ps_test = [pars] + list(test[1:]) #print("PS TEST PARAMS!!!",ps_test) # build the P@S model s_info = load_model_info(s_name) ps_info = product.make_product_info(self.info, s_info) ps_model = build_model(ps_info, dtype=self.dtype, platform=self.platform) # run the tests #self.info = ps_model.info #print("SELF.INFO PARAMS!!!",[p.id for p in self.info.parameters.call_parameters]) #print("PS MODEL PARAMETERS:",[p.id for p in ps_model.info.parameters.call_parameters]) results.append(self.run_one(ps_model, ps_test)) if self.stash: for test, target, actual in zip(tests, self.stash[0], results): assert np.all(abs(target-actual) < 5e-5*abs(actual)), \ ("GPU/CPU comparison expected %s but got %s for %s" % (target, actual, test[0])) else: self.stash.append(results) # Check for missing tests. Only do so for the "dll" tests # to reduce noise from both opencl and cuda, and because # python kernels use platform="dll". if self.platform == "dll": missing = [] ## Uncomment the following to require test cases #missing = self._find_missing_tests() if missing: raise ValueError("Missing tests for "+", ".join(missing)) except: annotate_exception(self.test_name) raise if self._failures: msg = ("The following assertions failed for %s:\n %s" % (self.test_name, "\n ".join(self._failures))) raise AssertionError(msg) def _find_missing_tests(self): # type: () -> None """make sure there are 1D and 2D tests as appropriate""" model_has_1D = True model_has_2D = any(p.type == 'orientation' for p in self.info.parameters.kernel_parameters) # Lists of tests that have a result that is not None single = [test for test in self.info.tests if not isinstance(test[2], list) and test[2] is not None] tests_has_1D_single = any(isinstance(test[1], float) for test in single) tests_has_2D_single = any(isinstance(test[1], tuple) for test in single) multiple = [test for test in self.info.tests if isinstance(test[2], list) and not all(result is None for result in test[2])] tests_has_1D_multiple = any(isinstance(test[1][0], float) for test in multiple) tests_has_2D_multiple = any(isinstance(test[1][0], tuple) for test in multiple) missing = [] if model_has_1D and not (tests_has_1D_single or tests_has_1D_multiple): missing.append("1D") if model_has_2D and not (tests_has_2D_single or tests_has_2D_multiple): missing.append("2D") return missing def run_one(self, model, test): # type: (KernelModel, TestCondition) -> None """Run a single test case.""" user_pars, x, y = test[:3] #print("PS MODEL PARAMETERS:",[p.id for p in model.info.parameters.call_parameters]) pars = expand_pars(model.info.parameters, user_pars) invalid = invalid_pars(model.info.parameters, pars) if invalid: raise ValueError("Unknown parameters in test: " + ", ".join(invalid)) if not isinstance(y, list): y = [y] if not isinstance(x, list): x = [x] self.assertEqual(len(y), len(x)) if isinstance(x[0], tuple): qx, qy = zip(*x) q_vectors = [np.array(qx), np.array(qy)] else: q_vectors = [np.array(x)] kernel = model.make_kernel(q_vectors) if len(test) == 3 or len(test) == 4: actual = call_kernel(kernel, pars) self._check_vectors(x, y, actual, 'I') if len(test) == 4: results = getattr(kernel, 'results', lambda: {}) self._check_struct(x, test[3], results()) return actual elif len(test) == 7: y1 = y y2 = test[3] if isinstance(test[3], list) else [test[3]] F, Fsq, R_eff, volume, volume_ratio = call_Fq(kernel, pars) if F is not None: # F is none for models with Iq instead of Fq self._check_vectors(x, y1, F, 'F') self._check_vectors(x, y2, Fsq, 'F^2') self._check_scalar(test[4], R_eff, 'R_eff') self._check_scalar(test[5], volume, 'volume') self._check_scalar(test[6], volume_ratio, 'form:shell ratio') return Fsq else: self._failures.append('wrong number or results for %s => %s' % (str(user_pars), str(test[2:]))) def _check_scalar(self, target, actual, name): if not is_near(target, actual, 5): self._failures.append('%s: expected:%s; actual:%s' % (name, target, actual)) def _check_vectors(self, x, target, actual, name='I'): if not len(actual) > 0: self._failures.append('%s(...) expected return value'%name) return if target is None: return if len(target) != len(actual): self._failures.append('%s(...) returned wrong length in %s' % (name, str(actual))) return for xi, yi, actual_yi in zip(x, target, actual): if not is_near(yi, actual_yi, 5): # convert array to list so we have comma separated output actual = actual.tolist() self._failures.append('%s(%s): expected:%s; actual:%s' % (name, xi, target, actual)) # Whole list is printed on any error, so fail on first return def _check_struct(self, x, target, actual): for k, v in target.items(): if k not in actual: self._failures.append('key %r not in returned value' % k) continue target_k = v actual_k = actual[k] if np.isscalar(actual_k): # number self._check_scalar(target_k, actual_k, k) elif isinstance(actual_k, np.ndarray): # vector self._check_vectors(x, target_k, actual_k, k) elif isinstance(actual_k, tuple) and len(actual_k) == 2: # Intermediate is returned as (Q, I(Q)) pair. The test # is set up to use |Q| or (Qx, Qy) as input, but the # returned result has (|Q|,) or (Qx, Qy). For now we will # ignore the first result. #self._check_vectors(x, x, actual_k[0], k+" (Q)") self._check_vectors(x, target_k, actual_k[1], k) elif isinstance(actual_k, dict): self._check_struct(x, target_k, actual_k) else: self._failures.append('key %s: unexpected value %r' % (k, actual_k)) # Ignore effective_radius in returned result; it will be dropped actual.pop('effective_radius', None) if any(k not in target for k in actual): self._failures.append('intermediate results missing:') for k, v in actual.items(): if k not in target: if isinstance(v, tuple) and len(v) == 2: v = v[1].tolist() elif isinstance(v, np.ndarray): v = v.tolist() self._failures.append(' "%s": %r,' % (k, v)) return ModelTestCase
[docs]def invalid_pars(partable, pars): # type: (ParameterTable, Dict[str, float]) -> List[str] """ Return a list of parameter names that are not part of the model. """ names = set(p.id for p in partable.call_parameters) invalid = [] for par in sorted(pars.keys()): # Ignore the R_eff mode parameter when checking for valid parameters. # It is an allowed parameter for a model even though it does not exist # in the parameter table. The call_Fq() function pops it from the # parameter list and sends it directly to kernel.Fq(). if par == product.RADIUS_MODE_ID: continue parts = par.split('_pd') if len(parts) > 1 and parts[1] not in ("", "_n", "nsigma", "type"): invalid.append(par) continue if parts[0] not in names: invalid.append(par) return invalid
[docs]def is_near(target, actual, digits=5): # type: (float, float, int) -> bool """ Returns true if *actual* is within *digits* significant digits of *target*. *taget* zero and inf should match *actual* zero and inf. If you want to accept eps for zero, choose a value such as 1e-10, which must match up to +/- 1e-15 when *digits* is the default value of 5. If *target* is None, then just make sure that *actual* is not NaN. If *target* is NaN, make sure *actual* is NaN. """ if target is None: # target is None => actual cannot be NaN return not np.isnan(actual) elif target == 0.: # target is 0. => actual must be 0. # Note: if small values are allowed, then use maybe test zero against eps instead? return actual == 0. elif np.isfinite(target): shift = np.ceil(np.log10(abs(target))) return abs(target-actual) < 1.5*10**(shift-digits) elif target == actual: # target is inf => actual must be inf of same sign return True else: # target is NaN => actual must be NaN return np.isnan(target) == np.isnan(actual)
# CRUFT: old interface; should be deprecated and removed
[docs]def run_one(model_name): # type: (str) -> str """ [Deprecated] Run the tests associated with *model_name*. Use the following instead:: succss, output = check_model(load_model_info(model_name)) """ # msg = "use check_model(model_info) rather than run_one(model_name)" # warnings.warn(msg, category=DeprecationWarning, stacklevel=2) try: model_info = load_model_info(model_name) except Exception: output = traceback.format_exc() return output _, output = check_model(model_info) return output
[docs]def check_model(model_info): # type: (ModelInfo) -> Tuple[bool, str] """ Run the tests for a single model, capturing the output. Returns success status and the output string. """ # Note that running main() directly did not work from within the # wxPython pycrust console. Instead of the results appearing in the # window they were printed to the underlying console. from unittest.runner import TextTestResult, _WritelnDecorator # Build a object to capture and print the test results stream = _WritelnDecorator(StringIO()) # Add writeln() method to stream verbosity = 2 descriptions = True result = TextTestResult(stream, descriptions, verbosity) # Build a test suite containing just the model loaders = ['opencl' if use_opencl() else 'cuda' if use_cuda() else 'dll'] suite = unittest.TestSuite() _add_model_to_suite(loaders, suite, model_info) # Warn if there are no user defined tests. # Note: the test suite constructed above only has one test in it, which # runs through some smoke tests to make sure the model runs, then runs # through the input-output pairs given in the model definition file. To # check if any such pairs are defined, therefore, we just need to check if # they are in the first test of the test suite. We do this with an # iterator since we don't have direct access to the list of tests in the # test suite. # In Qt5 suite.run() will clear all tests in the suite after running # with no way of retaining them for the test below, so let's check # for user tests before running the suite. for test in suite: if not test.info.tests: stream.writeln("Note: %s has no user defined tests."%model_info.name) break else: stream.writeln("Note: no test suite created --- this should never happen") # Run the test suite suite.run(result) # Print the failures and errors for _, tb in result.errors: stream.writeln(tb) for _, tb in result.failures: stream.writeln(tb) output = stream.getvalue() stream.close() return result.wasSuccessful(), output
[docs]def model_tests(): # type: () -> Iterator[Callable[[], None]] """ Test runner visible to nosetests. Run "nosetests sasmodels" on the command line to invoke it. """ loaders = ['dll'] if use_opencl(): loaders.append('opencl') if use_cuda(): loaders.append('cuda') tests = make_suite(loaders, ['all']) def _build_test(test): # In order for nosetest to show the test name, wrap the test.run_all # instance in function that takes the test name as a parameter which # will be displayed when the test is run. Do this as a function so # that it properly captures the context for tests that captured and # run later. If done directly in the for loop, then the looping # variable test will be shared amongst all the tests, and we will be # repeatedly testing vesicle. # Note: in sasview sas.sasgui.perspectives.fitting.gpu_options # requires that the test.description field be set. wrap = lambda: test.run_all() wrap.description = test.test_name return wrap # The following would work with nosetests and pytest: # return lambda name: test.run_all(), test.test_name for test in tests: yield _build_test(test)
[docs]def main(): # type: () -> int """ Run tests given is models. Returns 0 if success or 1 if any tests fail. """ try: from xmlrunner import XMLTestRunner as TestRunner test_args = {'output': 'logs'} except ImportError: from unittest import TextTestRunner as TestRunner test_args = {} parser = argparse.ArgumentParser(description="Test SasModels Models") parser.add_argument("-v", "--verbose", action="store_const", default=1, const=2, help="Use verbose output") parser.add_argument("-e", "--engine", default="all", help="Engines on which to run the test. " "Valid values are opencl, cuda, dll, and all. " "Defaults to all if no value is given") parser.add_argument("models", nargs="*", help="The names of the models to be tested. " "If the first model is 'all', then all but the listed " "models will be tested. See core.list_models() for " "names of other groups, such as 'py' or 'single'.") opts = parser.parse_args() if opts.engine == "opencl": if not use_opencl(): print("opencl is not available") return 1 loaders = ['opencl'] elif opts.engine == "dll": loaders = ["dll"] elif opts.engine == "cuda": if not use_cuda(): print("cuda is not available") return 1 loaders = ['cuda'] elif opts.engine == "all": loaders = ['dll'] if use_opencl(): loaders.append('opencl') if use_cuda(): loaders.append('cuda') else: print("unknown engine " + opts.engine) return 1 runner = TestRunner(verbosity=opts.verbose, **test_args) result = runner.run(make_suite(loaders, opts.models)) return 1 if result.failures or result.errors else 0
if __name__ == "__main__": sys.exit(main())