python/html/hypothesis__test__util_8py_source.html

 """
 The Hypothesis library uses *property-based testing* to check
 invariants about the code under test under a variety of random inputs.

  The key idea here is to express properties of the code under test
 (e.g. that it passes a gradient check, that it implements a reference
 function, etc), and then generate random instances and verify they
 satisfy these properties.

 The main functions of interest are exposed on `HypothesisTestCase`.
 You can usually just add a short test method to a subclass of it to
 generate an arbitrary number of test cases for your operator.

 The key functions are:

 - `assertDeviceChecks(devices, op, inputs, outputs)`. This asserts that the
   operator computes the same outputs, regardless of which device it is executed
   on.
 - `assertGradientChecks(device, op, inputs, outputs_to_check,
   outputs_with_grads)`. This implements a standard numerical gradient checker
   for the operator in question.
 - `assertReferenceChecks(device, op, inputs, reference)`. This runs the
   reference function (effectively calling `reference(*inputs)`) and compares
   the result to the output of the operator.

 `hypothesis_test_util.py` exposes some useful pre-built samplers.

 - `hu.gcs` - a gradient checker device (`gc`) and device checker devices (`dc`)

 - `hu.gcs_cpu_only` - a CPU-only gradient checker device (`gc`) and
   device checker devices (`dc`). Used for when your operator is only
   implemented on the CPU.
 """

 from __future__ import absolute_import
 from __future__ import division
 from __future__ import print_function
 from __future__ import unicode_literals
 from caffe2.proto import caffe2_pb2
 from caffe2.python import (
     workspace, device_checker, gradient_checker, test_util, core)
 import contextlib
 import copy
 import hypothesis
 import hypothesis.extra.numpy
 import hypothesis.strategies as st
 import logging
 import numpy as np
 import os


 def is_sandcastle():
     """Report whether the environment marks this process as a Sandcastle run.

     Returns True when the ``SANDCASTLE`` environment variable equals ``'1'``
     or ``TW_JOB_USER`` equals ``'sandcastle'``; otherwise returns False.
     """
     flagged_by_env = os.getenv('SANDCASTLE') == '1'
     flagged_by_user = os.getenv('TW_JOB_USER') == 'sandcastle'
     return flagged_by_env or flagged_by_user

 # Hypothesis profiles used by the tests. All three suppress the `too_slow`
 # health check, pass `database=None`, and run with verbose output; they
 # differ in the number of examples and in whether generation is derandomized.

 # "sandcastle": derandomized, 100 examples per test.
 hypothesis.settings.register_profile(
     "sandcastle",
     hypothesis.settings(
         derandomize=True,
         suppress_health_check=[hypothesis.HealthCheck.too_slow],
         database=None,
         max_examples=100,
         verbosity=hypothesis.Verbosity.verbose))

 # "dev": 10 examples per test; this is the fallback profile name used below.
 hypothesis.settings.register_profile(
     "dev",
     hypothesis.settings(
         suppress_health_check=[hypothesis.HealthCheck.too_slow],
         database=None,
         max_examples=10,
         verbosity=hypothesis.Verbosity.verbose))
 # "debug": 1000 examples per test.
 hypothesis.settings.register_profile(
     "debug",
     hypothesis.settings(
         suppress_health_check=[hypothesis.HealthCheck.too_slow],
         database=None,
         max_examples=1000,
         verbosity=hypothesis.Verbosity.verbose))
 # Profile selection: 'sandcastle' whenever is_sandcastle() is true, otherwise
 # the value of the CAFFE2_HYPOTHESIS_PROFILE environment variable, falling
 # back to 'dev' when that variable is unset.
 hypothesis.settings.load_profile(
     'sandcastle' if is_sandcastle() else os.getenv('CAFFE2_HYPOTHESIS_PROFILE',
                                                    'dev')
 )


 def dims(min_value=1, max_value=5):
     """Return a strategy for one dimension size.

     The strategy is ``st.integers`` bounded by ``min_value`` and
     ``max_value``.
     """
     bounds = dict(min_value=min_value, max_value=max_value)
     return st.integers(**bounds)


 def elements_of_type(dtype=np.float32, filter_=None):
     """Return a hypothesis strategy generating scalar elements for ``dtype``.

     Supported element types and the values drawn for them:

     - float16 / float32 / float64: floats between -1.0 and 1.0
     - int32: integers between 0 and 2**31 - 1
     - int64: integers between 0 and 2**63 - 1
     - bool: ``st.booleans()``

     Args:
         dtype: the element type. Anything ``np.dtype`` understands is
             accepted (a NumPy scalar type, a dtype instance, the builtin
             ``bool``, or a dtype name).
         filter_: optional predicate. When given, the strategy is narrowed
             with ``.filter(filter_)``.

     Raises:
         ValueError: if ``dtype`` is None, cannot be interpreted as a dtype,
             or is not one of the supported types listed above.
     """
     # Normalise to a dtype instance so that np.int32, np.dtype('int32') and
     # 'int32' all take the same branch. Identity checks against the scalar
     # types reject dtype instances, and the `np.bool` alias is not available
     # in every NumPy release, so neither is used here.
     try:
         # np.dtype(None) silently means float64, so None is rejected first.
         resolved = None if dtype is None else np.dtype(dtype)
     except (TypeError, ValueError):
         resolved = None
     if resolved is None:
         raise ValueError("Unexpected dtype without elements provided")

     float_dtypes = [
         np.dtype(np.float16), np.dtype(np.float32), np.dtype(np.float64)]
     if resolved in float_dtypes:
         elems = st.floats(min_value=-1.0, max_value=1.0)
     elif resolved == np.dtype(np.int32):
         elems = st.integers(min_value=0, max_value=2 ** 31 - 1)
     elif resolved == np.dtype(np.int64):
         elems = st.integers(min_value=0, max_value=2 ** 63 - 1)
     elif resolved == np.dtype(np.bool_):
         elems = st.booleans()
     else:
         raise ValueError("Unexpected dtype without elements provided")
     return elems if filter_ is None else elems.filter(filter_)


 def arrays(dims, dtype=np.float32, elements=None):
     """Return a strategy for NumPy arrays of shape ``dims`` and type ``dtype``.

     When ``elements`` is None the element strategy comes from
     ``elements_of_type(dtype)``; otherwise the supplied strategy is used.
     """
     element_strategy = (
         elements_of_type(dtype) if elements is None else elements)
     return hypothesis.extra.numpy.arrays(
         dtype, dims, elements=element_strategy)


 def tensor(min_dim=1, max_dim=4, dtype=np.float32, elements=None, **kwargs):
     """Return a strategy for a single array with a randomly drawn shape.

     The shape is a list of between ``min_dim`` and ``max_dim`` sizes, each
     drawn from ``dims(**kwargs)``; the array itself comes from ``arrays``.
     """
     def build(shape):
         return arrays(shape, dtype, elements)

     shape_strategy = st.lists(
         dims(**kwargs), min_size=min_dim, max_size=max_dim)
     return shape_strategy.flatmap(build)


 def segment_ids(size, is_sorted):
     """Return a strategy for an int32 vector of ``size`` segment ids.

     - ``size == 0``: always an empty int32 array.
     - ``is_sorted``: boolean flags are drawn into an int32 array, then the
       running sum minus the first flag is taken, so the ids start at 0 and
       never decrease.
     - otherwise: each id is drawn independently from ``[0, 2 * size]``.
     """
     if size == 0:
         return st.just(np.empty(shape=[0], dtype=np.int32))

     if not is_sorted:
         unsorted_ids = st.integers(min_value=0, max_value=2 * size)
         return arrays([size], dtype=np.int32, elements=unsorted_ids)

     def to_sorted_ids(flags):
         # Subtracting the first flag makes the first id 0.
         return np.cumsum(flags, dtype=np.int32) - flags[0]

     step_flags = arrays([size], dtype=np.int32, elements=st.booleans())
     return step_flags.map(to_sorted_ids)


 def lengths(size, **kwargs):
     """Return a strategy for segment lengths derived from random borders.

     For ``size == 0`` the strategy always yields an empty int32 array.
     Otherwise the construction is:

     1. draw the number of borders between segments (0 to ``size - 1``);
     2. draw that many border positions in ``[0, size]``;
     3. append the end points 0 and ``size``;
     4. sort, then take consecutive differences to get the lengths
        (zero-length segments are possible).

     Extra keyword arguments are accepted but not used.
     """
     if size == 0:
         return st.just(np.empty(shape=[0], dtype=np.int32))

     def border_positions(num_borders):
         position = st.integers(min_value=0, max_value=size)
         return hypothesis.extra.numpy.arrays(
             np.int32, num_borders, elements=position)

     def with_end_points(borders):
         return np.append(borders, np.array([0, size], dtype=np.int32))

     border_count = st.integers(min_value=0, max_value=size - 1)
     all_borders = border_count.flatmap(border_positions).map(with_end_points)
     return all_borders.map(sorted).map(np.diff)


 def segmented_tensor(
     min_dim=1,
     max_dim=4,
     dtype=np.float32,
     is_sorted=True,
     elements=None,
     segment_generator=segment_ids,
     allow_empty=False,
     **kwargs
 ):
     """Return a strategy for ``(data, segments)`` pairs.

     ``data`` is an array whose shape is a list of ``min_dim`` to ``max_dim``
     sizes drawn from ``dims(**kwargs)``. When ``allow_empty`` is true, a
     leading 0 dimension may be prepended to that shape. ``segments`` is
     produced by ``segment_generator(data.shape[0], is_sorted=is_sorted)``.
     """
     if allow_empty:
         gen_empty = st.booleans()
     else:
         gen_empty = st.just(False)

     def maybe_prepend_zero(pair):
         make_empty, shape = pair
         prefix = [0] if make_empty else []
         return prefix + shape

     def data_with_segments(data_dims):
         data = arrays(data_dims, dtype, elements)
         segments = segment_generator(data_dims[0], is_sorted=is_sorted)
         return st.tuples(data, segments)

     shape_lists = st.lists(
         dims(**kwargs), min_size=min_dim, max_size=max_dim)
     data_dims_ = st.tuples(gen_empty, shape_lists).map(maybe_prepend_zero)
     return data_dims_.flatmap(data_with_segments)


 def lengths_tensor(*args, **kwargs):
     """Return ``segmented_tensor`` with ``lengths`` as the segment generator.

     All positional and keyword arguments are forwarded unchanged.
     """
     strategy = segmented_tensor(*args, segment_generator=lengths, **kwargs)
     return strategy


 def sparse_segmented_tensor(min_dim=1, max_dim=4, dtype=np.float32,
                             is_sorted=True, elements=None, allow_empty=False,
                             segment_generator=segment_ids, **kwargs):
     """Return a strategy for ``(data, indices, segments)`` triples.

     ``data`` has a shape of ``min_dim`` to ``max_dim`` sizes drawn from
     ``dims(**kwargs)``. ``indices`` is an int64 vector whose entries lie in
     ``[0, data.shape[0] - 1]``; its length is drawn from
     ``[1, data.shape[0]]``, or is 0 when ``allow_empty`` is true and the
     empty case is drawn. ``segments`` comes from
     ``segment_generator(len(indices), is_sorted=is_sorted)``.
     """
     if allow_empty:
         gen_empty = st.booleans()
     else:
         gen_empty = st.just(False)

     def shape_with_index_count(pair):
         make_empty, shape = pair
         if make_empty:
             index_count = st.just(0)
         else:
             index_count = st.integers(min_value=1, max_value=shape[0])
         return st.tuples(st.just(shape), index_count)

     def build(shape_and_count):
         shape, index_count = shape_and_count
         row_index = st.integers(min_value=0, max_value=shape[0] - 1)
         return st.tuples(
             arrays(shape, dtype, elements),
             arrays(index_count, dtype=np.int64, elements=row_index),
             segment_generator(index_count, is_sorted=is_sorted),
         )

     shape_lists = st.lists(
         dims(**kwargs), min_size=min_dim, max_size=max_dim)
     all_dims_ = st.tuples(gen_empty, shape_lists).flatmap(
         shape_with_index_count)
     return all_dims_.flatmap(build)


 def sparse_lengths_tensor(**kwargs):
     """Return ``sparse_segmented_tensor`` using ``lengths`` for segments.

     All keyword arguments are forwarded unchanged.
     """
     strategy = sparse_segmented_tensor(segment_generator=lengths, **kwargs)
     return strategy


 def tensors(n, min_dim=1, max_dim=4, dtype=np.float32, elements=None, **kwargs):
     """Return a strategy for a list of exactly ``n`` same-shaped arrays.

     One shape (``min_dim`` to ``max_dim`` sizes drawn from
     ``dims(**kwargs)``) is drawn first and then shared by all ``n`` arrays.
     """
     def same_shape_list(shape):
         single = arrays(shape, dtype, elements)
         return st.lists(single, min_size=n, max_size=n)

     shape_strategy = st.lists(
         dims(**kwargs), min_size=min_dim, max_size=max_dim)
     return shape_strategy.flatmap(same_shape_list)

 # Device options shared by the samplers below. The CPU option is always
 # present; CUDA options are added only when workspace.has_gpu_support is
 # truthy.
 cpu_do = caffe2_pb2.DeviceOption()
 gpu_do = caffe2_pb2.DeviceOption(device_type=caffe2_pb2.CUDA)
 device_options = [cpu_do]
 # Include device option for each GPU
 expanded_device_options = [cpu_do]
 if workspace.has_gpu_support:
     device_options.append(gpu_do)
     expanded_device_options.extend([
         caffe2_pb2.DeviceOption(device_type=caffe2_pb2.CUDA, cuda_gpu_id=i)
         for i in range(workspace.NumCudaDevices())])


 def device_checker_device_options():
     """Return a strategy that always yields the full ``device_options`` list."""
     all_devices = st.just(device_options)
     return all_devices


 def gradient_checker_device_option():
     """Return a strategy that picks one entry from ``device_options``."""
     one_device = st.sampled_from(device_options)
     return one_device


 # Keyword bundles meant to be splatted into `@given(...)`, e.g. `**hu.gcs`.
 # `gc` draws a single device option (for gradient checks) and `dc` yields a
 # list of device options (for device checks).
 gcs = dict(
     gc=gradient_checker_device_option(),
     dc=device_checker_device_options()
 )

 # Variants restricted to the CPU option only / the GPU option only.
 gcs_cpu_only = dict(gc=st.sampled_from([cpu_do]), dc=st.just([cpu_do]))
 gcs_gpu_only = dict(gc=st.sampled_from([gpu_do]), dc=st.just([gpu_do]))


 @contextlib.contextmanager
 def temp_workspace(name=b"temp_ws"):
     """Context manager that runs its body inside a temporary workspace.

     On entry the current workspace name is remembered and the workspace is
     switched to ``name`` (the second argument ``True`` presumably asks for
     the workspace to be created if it does not exist - confirm against
     ``workspace.SwitchWorkspace``). On exit the temporary workspace is reset
     and the previous workspace is made current again.

     Args:
         name: name of the temporary workspace to switch to.
     """
     old_ws_name = workspace.CurrentWorkspace()
     workspace.SwitchWorkspace(name, True)
     try:
         yield
     finally:
         # Clean up even when the body raises (e.g. a failing assertion), so
         # later code does not keep running inside the temporary workspace
         # with stale blobs.
         workspace.ResetWorkspace()
         workspace.SwitchWorkspace(old_ws_name)


 def runOpBenchmark(
     device_option,
     op,
     inputs,
     input_device_options=None,
     iterations=10,
 ):
     """Benchmark a single operator and return ``BenchmarkNet``'s result.

     A deep copy of ``op`` is pinned to ``device_option`` and wrapped in a
     one-operator net named after the operator (or "test" when it has no
     name). Inside a temporary workspace the inputs are fed, the net is
     created, and ``workspace.BenchmarkNet`` is called with ``iterations``.

     Args:
         device_option: device option copied onto the operator, and used for
             any input without an entry in ``input_device_options``.
         op: operator to benchmark; the caller's object is not modified.
         inputs: values fed to the blobs named in ``op.input``, in order.
         input_device_options: optional mapping from input blob name to the
             device option used when feeding that blob.
         iterations: forwarded to ``workspace.BenchmarkNet``.
     """
     per_input_devices = (
         {} if input_device_options is None else input_device_options)

     bench_op = copy.deepcopy(op)
     bench_op.device_option.CopyFrom(device_option)

     net = caffe2_pb2.NetDef()
     net.op.extend([bench_op])
     net.name = bench_op.name or "test"

     with temp_workspace():
         for blob_name, blob_value in zip(bench_op.input, inputs):
             feed_device = per_input_devices.get(blob_name, device_option)
             workspace.FeedBlob(
                 blob_name, blob_value, device_option=feed_device)
         workspace.CreateNet(net)
         result = workspace.BenchmarkNet(net.name, 1, iterations, True)
     return result


 class HypothesisTestCase(test_util.TestCase):
     """
     A unittest.TestCase subclass with some helper functions for
     utilizing the `hypothesis` (hypothesis.readthedocs.io) library.
     """
     def assertDeviceChecks(
         self,
         device_options,
         op,
         inputs,
         outputs_to_check,
         input_device_options=None,
         threshold=0.01
     ):
         """
         Asserts that the operator computes the same outputs, regardless of
         which device it is executed on.

         Useful for checking the consistency of GPU and CPU
         implementations of operators.

         Args:
             device_options: device options handed to the DeviceChecker.
             op: the operator under test.
             inputs: input values for the operator.
             outputs_to_check: forwarded to `DeviceChecker.CheckSimple`
                 (a list of output indices in the usage example below).
             input_device_options: forwarded to `DeviceChecker.CheckSimple`.
             threshold: tolerance handed to the DeviceChecker.

         Usage example:

             @given(inputs=hu.tensors(n=2), in_place=st.booleans(), **hu.gcs)
             def test_sum(self, inputs, in_place, gc, dc):
                 op = core.CreateOperator("Sum", ["X1", "X2"],
                                                 ["Y" if not in_place else "X1"])
                 X1, X2 = inputs
                 self.assertDeviceChecks(dc, op, [X1, X2], [0])
         """
         dc = device_checker.DeviceChecker(
             threshold,
             device_options=device_options
         )
         self.assertTrue(
             dc.CheckSimple(op, inputs, outputs_to_check, input_device_options)
         )

     def assertGradientChecks(
         self,
         device_option,
         op,
         inputs,
         outputs_to_check,
         outputs_with_grads,
         grad_ops=None,
         threshold=0.005,
         stepsize=0.05,
         input_device_options=None,
     ):
         """
         Implements a standard numerical gradient checker for the operator
         in question.

         Useful for checking the consistency of the forward and
         backward implementations of operators.

         Args:
             device_option: device the GradientChecker runs on; its string
                 form is also used as the checker's workspace name.
             op: the operator under test.
             inputs: input values for the operator.
             outputs_to_check: forwarded to `GradientChecker.CheckSimple`.
                 NOTE(review): despite the name, the failure message uses it
                 to index `op.input`, so it looks like the index of the
                 input being checked - confirm against GradientChecker.
             outputs_with_grads: forwarded to `GradientChecker.CheckSimple`.
             grad_ops: optional gradient operators forwarded to the checker.
             threshold: tolerance handed to the GradientChecker.
             stepsize: step size handed to the GradientChecker.
             input_device_options: forwarded to `GradientChecker.CheckSimple`.

         Usage example:

             @given(inputs=hu.tensors(n=2), in_place=st.booleans(), **hu.gcs)
             def test_sum(self, inputs, in_place, gc, dc):
                 op = core.CreateOperator("Sum", ["X1", "X2"],
                                                 ["Y" if not in_place else "X1"])
                 X1, X2 = inputs
                 self.assertGradientChecks(gc, op, [X1, X2], 0, [0])
         """
         gc = gradient_checker.GradientChecker(
             stepsize=stepsize,
             threshold=threshold,
             device_option=device_option,
             workspace_name=str(device_option),
         )
         res, grad, grad_estimated = gc.CheckSimple(
             op, inputs, outputs_to_check, outputs_with_grads,
             grad_ops=grad_ops,
             input_device_options=input_device_options
         )
         self.assertEqual(grad.shape, grad_estimated.shape)
         self.assertTrue(
             res,
             "Gradient check failed for input " + str(op.input[outputs_to_check])
         )

     def _assertGradReferenceChecks(
         self,
         op,
         inputs,
         ref_outputs,
         output_to_grad,
         grad_reference,
         threshold=1e-4,
     ):
         """
         Compares the operator's gradients against a reference gradient
         function.

         Must be called in a workspace where `op` has already been run,
         because the `output_to_grad` blob is fetched from it. The value of
         that output is fed back as its own gradient blob
         (`<output_to_grad>_grad`) before the backward operators are run.

         Args:
             op: the forward operator.
             inputs: the forward inputs, handed to `grad_reference`.
             ref_outputs: the reference forward outputs, handed to
                 `grad_reference`.
             output_to_grad: name of the output blob to differentiate from.
             grad_reference: called as
                 `grad_reference(output_grad, ref_outputs, inputs)`; it must
                 return one entry per input: None when the input has no
                 gradient, an array for a dense gradient, or a
                 `(values, indices)` pair for a sparse gradient.
             threshold: absolute and relative tolerance for gradient values.
         """
         grad_blob_name = output_to_grad + '_grad'
         grad_ops, grad_map = core.GradientRegistry.GetBackwardPass(
             [op], {output_to_grad: grad_blob_name})
         output_grad = workspace.FetchBlob(output_to_grad)
         grad_ref_outputs = grad_reference(output_grad, ref_outputs, inputs)
         # Fetched again rather than reusing `output_grad`, so anything the
         # reference function did to its argument cannot leak into the feed.
         workspace.FeedBlob(grad_blob_name, workspace.FetchBlob(output_to_grad))
         workspace.RunOperatorsOnce(grad_ops)

         self.assertEqual(len(grad_ref_outputs), len(inputs))
         for (n, ref) in zip(op.input, grad_ref_outputs):
             grad_names = grad_map.get(n)
             if not grad_names:
                 # no grad for this input
                 self.assertIsNone(ref)
             else:
                 if isinstance(grad_names, core.BlobReference):
                     # dense gradient
                     ref_vals = ref
                     ref_indices = None
                     val_name = grad_names
                 else:
                     # sparse gradient
                     ref_vals, ref_indices = ref
                     val_name = grad_names.values
                 vals = workspace.FetchBlob(str(val_name))
                 np.testing.assert_allclose(
                     vals,
                     ref_vals,
                     atol=threshold,
                     rtol=threshold,
                     err_msg='Gradient {0} is not matching the reference'.format(
                         val_name,
                     ),
                 )
                 if ref_indices is not None:
                     indices = workspace.FetchBlob(str(grad_names.indices))
                     np.testing.assert_allclose(indices, ref_indices,
                                                atol=1e-4, rtol=1e-4)

     def _assertInferTensorChecks(self, name, shapes, types, output):
         """
         Checks the inferred shape (and, for INT32 blobs only, the inferred
         type) of blob `name` against the blob in the workspace.

         Mismatches are logged as warnings and only re-raised when the
         environment variable CAFFE2_ASSERT_SHAPEINFERENCE is '1'.

         Args:
             name: blob name to check.
             shapes: mapping from blob name to inferred shape; when `name`
                 is absent nothing is checked.
             types: mapping from blob name to inferred type.
             output: kept for interface compatibility; the blob is
                 re-fetched from the workspace and this value is not used.
         """
         if name not in shapes:
             # No inferred shape or type available
             return
         output = workspace.FetchBlob(name)
         if isinstance(output, np.ndarray):
             if output.dtype == np.dtype('float64'):
                 correct_type = caffe2_pb2.TensorProto.DOUBLE
             elif output.dtype == np.dtype('float32'):
                 correct_type = caffe2_pb2.TensorProto.FLOAT
             elif output.dtype == np.dtype('int32'):
                 correct_type = caffe2_pb2.TensorProto.INT32
             elif output.dtype == np.dtype('int64'):
                 correct_type = caffe2_pb2.TensorProto.INT64
             else:
                 # Report the blob's actual dtype (formatting `np.dtype`
                 # here would print the class, not the offending type).
                 correct_type = "unknown {}".format(output.dtype)
         else:
             correct_type = str(type(output))
         try:
             np.testing.assert_array_equal(
                 np.array(shapes[name]).astype(np.int32),
                 np.array(output.shape).astype(np.int32),
                 err_msg='Shape {} mismatch: {} vs. {}'.format(
                     name,
                     shapes[name],
                     output.shape))
             # BUG: Workspace blob type not being set correctly T16121392
             # Until that is resolved the type is only compared for INT32.
             if correct_type != caffe2_pb2.TensorProto.INT32:
                 return
             np.testing.assert_equal(
                 types[name],
                 correct_type,
                 err_msg='Type {} mismatch: {} vs. {}'.format(
                     name, types[name], correct_type,
                 )
             )
         except AssertionError as e:
             # Temporarily catch these assertion errors when validating
             # inferred shape and type info
             logging.warning(str(e))
             if os.getenv('CAFFE2_ASSERT_SHAPEINFERENCE') == '1':
                 # Bare raise keeps the original traceback.
                 raise

     def assertReferenceChecks(
         self,
         device_option,
         op,
         inputs,
         reference,
         input_device_options=None,
         threshold=1e-4,
         output_to_grad=None,
         grad_reference=None,
         atol=None,
         outputs_to_check=None,
     ):
         """
         This runs the reference Python function implementation
         (effectively calling `reference(*inputs)`), and compares that
         to the output of the operator, with an absolute/relative tolerance
         given by the `threshold` parameter.

         Useful for checking the implementation matches the Python
         (typically NumPy) implementation of the same functionality.

         Args:
             device_option: device the operator is run on; also used for
                 any input without an entry in `input_device_options`.
             op: the operator under test (a deep copy is run).
             inputs: values fed to the blobs named in `op.input`, in order.
             reference: callable returning a tuple/list of expected outputs.
             input_device_options: optional mapping from input blob name to
                 the device option used when feeding that blob.
             threshold: relative tolerance, and absolute tolerance too when
                 `atol` is None.
             output_to_grad: name of the output blob to run a gradient
                 reference check on; used only together with
                 `grad_reference`.
             grad_reference: reference gradient function, see
                 `_assertGradReferenceChecks`.
             atol: optional absolute tolerance overriding `threshold`.
             outputs_to_check: optional indices into `op.output` to compare
                 against the reference outputs, in order. When empty or
                 None, all outputs are checked and the reference must return
                 exactly one value per output.

         Returns:
             The list of fetched output blobs that were checked.

         Raises:
             RuntimeError: if `reference` does not return a tuple or list.

         Usage example:

             @given(X=hu.tensor(), inplace=st.booleans(), **hu.gcs)
             def test_softsign(self, X, inplace, gc, dc):
                 op = core.CreateOperator(
                     "Softsign", ["X"], ["X" if inplace else "Y"])

                 def softsign(X):
                     return (X / (1 + np.abs(X)),)

                 self.assertReferenceChecks(gc, op, [X], softsign)
         """
         if input_device_options is None:
             input_device_options = {}
         if atol is None:
             atol = threshold

         op = copy.deepcopy(op)
         op.device_option.CopyFrom(device_option)

         with temp_workspace():
             for (n, b) in zip(op.input, inputs):
                 workspace.FeedBlob(
                     n,
                     b,
                     device_option=input_device_options.get(n, device_option)
                 )
                 print("Input", n, input_device_options.get(n, device_option))
             net = core.Net("opnet")
             net.Proto().op.extend([op])
             test_shape_inference = False
             try:
                 (shapes, types) = workspace.InferShapesAndTypes([net])
                 test_shape_inference = True
             except RuntimeError as e:
                 # Temporarily catch runtime errors when inferring shape
                 # and type info
                 logging.warning(str(e))
                 if os.getenv('CAFFE2_ASSERT_SHAPEINFERENCE') == '1':
                     # Bare raise keeps the original traceback.
                     raise
             workspace.RunNetOnce(net)
             reference_outputs = reference(*inputs)
             if not isinstance(reference_outputs, (tuple, list)):
                 raise RuntimeError(
                     "You are providing a wrong reference implementation. A "
                     "proper one should return a tuple/list of numpy arrays.")
             if not outputs_to_check:
                 self.assertEqual(len(reference_outputs), len(op.output))
                 outputs_to_check = range(len(op.output))
             outs = []
             for (output_index, ref) in zip(outputs_to_check, reference_outputs):
                 output_blob_name = op.output[output_index]
                 output = workspace.FetchBlob(output_blob_name)
                 if output.dtype.kind in ('S', 'O'):
                     # String/object blobs must match exactly.
                     np.testing.assert_array_equal(output, ref)
                 else:
                     np.testing.assert_allclose(
                         output, ref, atol=atol, rtol=threshold,
                         err_msg=(
                             'Output {0} is not matching the reference'.format(
                                 output_blob_name,
                             )),
                     )
                 if test_shape_inference:
                     self._assertInferTensorChecks(
                         output_blob_name, shapes, types, output)
                 outs.append(output)
             if grad_reference and output_to_grad:
                 with core.DeviceScope(device_option):
                     self._assertGradReferenceChecks(
                         op, inputs, reference_outputs,
                         output_to_grad, grad_reference)
             return outs

     def assertValidationChecks(
         self,
         device_option,
         op,
         inputs,
         validator,
         input_device_options=None,
         as_kwargs=True
     ):
         """
         Runs the operator once and hands its inputs and outputs to
         `validator`, which is expected to do its own assertions.

         Args:
             device_option: device the operator is run on; also used for
                 any input without an entry in `input_device_options`.
             op: the operator under test (a deep copy is run).
             inputs: values fed to the blobs named in `op.input`, in order.
                 Any sequence is accepted.
             validator: callable invoked with the results. With `as_kwargs`
                 it receives one keyword argument per input/output blob
                 name; otherwise it is called as
                 `validator(inputs=inputs, outputs=outputs)`.
             input_device_options: optional mapping from input blob name to
                 the device option used when feeding that blob.
             as_kwargs: selects the calling convention described above.
                 In-place operators (a blob name appearing more than once
                 among inputs and outputs) are rejected in this mode.
         """
         if input_device_options is None:
             input_device_options = {}
         if as_kwargs:
             assert len(set(list(op.input) + list(op.output))) == \
                 len(op.input) + len(op.output), \
                 "in-place ops are not supported in as_kwargs mode"
         op = copy.deepcopy(op)
         op.device_option.CopyFrom(device_option)

         with temp_workspace():
             for (n, b) in zip(op.input, inputs):
                 workspace.FeedBlob(
                     n,
                     b,
                     device_option=input_device_options.get(n, device_option)
                 )
             workspace.RunOperatorOnce(op)
             outputs = [workspace.FetchBlob(n) for n in op.output]
             if as_kwargs:
                 # list(inputs) so that a tuple of inputs can be concatenated
                 # with the list of outputs.
                 validator(**dict(zip(
                     list(op.input) + list(op.output),
                     list(inputs) + outputs)))
             else:
                 validator(inputs=inputs, outputs=outputs)
core.GradientRegistry.GetBackwardPass
def GetBackwardPass(cls, operators, ys)
Definition: core.py:949

workspace.ResetWorkspace
def ResetWorkspace(root_folder=None)
Definition: workspace.py:130

workspace.SwitchWorkspace
SwitchWorkspace
Definition: workspace.py:30

core.BlobReference
Definition: core.py:115

core.DeviceScope
DeviceScope
Definition: core.py:27

workspace.NumCudaDevices
NumCudaDevices
Definition: workspace.py:39

hypothesis_test_util.HypothesisTestCase
Definition: hypothesis_test_util.py:272

device_checker.DeviceChecker
Definition: device_checker.py:8

workspace.RunNetOnce
def RunNetOnce(net)
Definition: workspace.py:160

workspace.InferShapesAndTypes
def InferShapesAndTypes(nets, blob_dimensions=None)
Definition: workspace.py:184

test_util.TestCase
Definition: test_util.py:19

workspace.RunOperatorsOnce
def RunOperatorsOnce(operators)
Definition: workspace.py:152

core.Net
Definition: core.py:1119

workspace.CurrentWorkspace
CurrentWorkspace
Definition: workspace.py:24

workspace.BenchmarkNet
BenchmarkNet
Definition: workspace.py:33

gradient_checker.GradientChecker
Definition: gradient_checker.py:52

workspace.FeedBlob
def FeedBlob(name, arr, device_option=None)
Definition: workspace.py:229

hypothesis_test_util.HypothesisTestCase.assertGradientChecks
def assertGradientChecks(self, device_option, op, inputs, outputs_to_check, outputs_with_grads, grad_ops=None, threshold=0.005, stepsize=0.05, input_device_options=None)
Definition: hypothesis_test_util.py:321

workspace.CreateNet
def CreateNet(net, overwrite=False, input_blobs=None)
Definition: workspace.py:140

workspace.RunOperatorOnce
def RunOperatorOnce(operator)
Definition: workspace.py:148

workspace.FetchBlob
def FetchBlob(name)
Definition: workspace.py:276

hypothesis_test_util.HypothesisTestCase._assertInferTensorChecks
def _assertInferTensorChecks(self, name, shapes, types, output)
Definition: hypothesis_test_util.py:403

hypothesis_test_util.HypothesisTestCase.assertDeviceChecks
def assertDeviceChecks(self, device_options, op, inputs, outputs_to_check, input_device_options=None, threshold=0.01)
Definition: hypothesis_test_util.py:285

hypothesis_test_util.HypothesisTestCase._assertGradReferenceChecks
def _assertGradReferenceChecks(self, op, inputs, ref_outputs, output_to_grad, grad_reference, threshold=1e-4)
Definition: hypothesis_test_util.py:363

hypothesis_test_util.HypothesisTestCase.assertReferenceChecks
def assertReferenceChecks(self, device_option, op, inputs, reference, input_device_options=None, threshold=1e-4, output_to_grad=None, grad_reference=None, atol=None, outputs_to_check=None)
Definition: hypothesis_test_util.py:458