Remove tests.record and the tests that depend on it

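This "record" functionality (the `Record` and `RecordMode` classes in `tests/record.py`) was only used by some rather poor tests, `tests/test_record.py` and `tests/test_determinism.py`, which are removed along with it.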

Remove tests.record and the tests that depend on it
00b4aed2 · Brandon T. Willard · Brandon T. Willard · 4a539e47 · 4a539e47 · 4a539e47
--- a/tests/record.py
+++ b/tests/record.py
-from aesara.compile.mode import Mode
-from aesara.configdefaults import config
-from aesara.link.basic import WrapLinkerMany
-from aesara.link.vm import VMLinker
-from aesara.printing import hex_digest, min_informative_str
-
-
-__authors__ = ["PyMC Team", "Ian Goodfellow", "Aesara Developers"]
-
-
-class MismatchError(Exception):
-    """
-    Raised by Record.handle_line when the
-    current execution doesn't match the replay
-    of a record.
-    """
-
-
-class Record:
-    """
-    Records a sequence of strings (from a string buffer). These can then be
-    compared to another sequence of strings, and if the two sequences don't
-    match a mismatch exception is raised.
-
-    Example:
-       # Create a Record object and store 'hello world' inside it
-       output = cStringIO.StringIO()
-       recorder = Record(file_object=output, replay=False)
-       recorder.handle_line('hello world \n')
-
-       # Store the previous output
-       output_value = output.getvalue()
-       output = cStringIO.StringIO(output_value)
-
-       # Create another Record object, now in playback mode, and set
-       # it to the previous sequence of strings
-       playback_checker = Record(file_object=output,  replay=True)
-
-       # Check if it matches the previous one
-       playback_checker.handle_line('hello world \n')
-
-       # Now check if it the next item matches something else. This will
-       # throw an exception because there is no next item
-       playback_checker.handle_line('hello new world \n')
-    """
-
-    def __init__(self, file_object=None, file_path=None, replay=False):
-        """
-        Initializes Record object to use file on disc and whether it is in
-        replay mode or not.
-
-        Parameters
-        ----------
-        file_object : StringIO
-            The input string buffer.
-        file_path : string, optional
-            File to save Record to.
-        replay : bool, optional
-            Determines whether or not the object is in playback mode. If not
-            in playback mode, the content of record will be written to the
-            file. If in playback mode, the content of file is loaded into the
-            record.
-        """
-
-        assert file_object is not None or file_path is not None
-
-        if replay and file_object is None:
-            self.f = open(file_path)
-        elif (not replay) and file_object is None:
-            self.f = open(file_path, "w")
-        else:
-            self.f = file_object
-
-        self.__dict__.update(locals())
-
-    def handle_line(self, line):
-        """
-        If not in playback mode, it records a new string. If in playback mode,
-        it compares the current string to the next element in the sequence.
-        If these are identical the element is removed and otherwise a mismatch
-        exception is raised.
-
-        Parameters
-        ----------
-        line : string
-            The string to record.
-        """
-
-        assert line.endswith("\n")
-        assert line[:-2].find("\n") == -1
-        if self.replay:
-            old_line = self.f.readline()
-            if old_line != line:
-                msg = "Replay detected mismatch.\n"
-                msg += " I wanted to write:\n"
-                if len(line) > 100:
-                    msg += line[0:100] + "..."
-                else:
-                    msg += line
-                msg += "\nwhen previous job wrote:\n"
-                if len(old_line) > 100:
-                    msg += old_line[0:100] + "..."
-                else:
-                    msg += old_line
-                raise MismatchError(msg)
-        else:
-            self.f.write(line)
-
-
-class RecordMode(Mode):
-    """
-    Records all computations done with a function in a file at output_path.
-    Writes into the file the index of each apply node and sha256 digests of the
-    numpy ndarrays it receives as inputs and produces as output.
-
-    Example:
-       # We use RecordMode to test that the computation of a function is
-       identical. Create a Record object and use it to initialize a
-       RecordMode object.
-       output = cStringIO.StringIO()
-       record = Record(file_object=output, replay=False)
-       record_mode = RecordMode(record)
-
-       # Then compile and call the function you wish to test, which uses
-       # Apply nodes with record_mode as first parameter to record all the
-       # computations to file. For example, call an Aesara function with the
-       # RecordMode object.
-       x = aesara.tensor.dscalar()
-       f = aesara.function([x], 2*x, mode=record_mode)
-       print f(4)
-
-       # Create another RecordMode object and initialize it with the previous
-       # record.
-       output = cStringIO.StringIO(output.getvalue())
-       playback = Record(file_object=output, replay=True)
-       playback_mode = RecordMode(playback)
-
-       # Compile and call the function to test again with record_mode as
-       # first parameter. An exception will be thrown if the recorded
-       # computations are not identical between the two runs.
-       x = aesara.tensor.dscalar()
-       f = aesara.function([x], 2*x, mode=playback_mode)
-       print f(4)
-
-    """
-
-    def set_record(self, record):
-        """
-        Configure object to use an existing Record object.
-
-        Parameters
-        ----------
-        record : Record
-            The Record object to use.
-        """
-
-        self.record = record
-        self.known_fgraphs = set()
-
-    def __init__(self, record=None, db=None, **kwargs):
-        """
-        Takes either a Record object or the keyword arguments to make one.
-
-        Parameters
-        ----------
-        record : Record
-            The existing Record object to use.
-        kwargs : pointer?
-            Keyword arguments to construct new object.
-        """
-
-        if record is None:
-            record = Record(**kwargs)
-        else:
-            assert len(kwargs.keys()) == 0
-
-        self.set_record(record)
-
-        def handle_line(fgraph, line, i, node, fn):
-            """
-            Records new node computation.
-
-            Parameters
-            ----------
-            line : string
-                Line to record. For example, the function name or node name.
-            i : integer
-                Node number in the toposort order.
-            node : Apply,
-                The Apply node which created the entry.
-            fn : Function,
-                Function related to Apply node.
-            """
-            try:
-                self.record.handle_line(line)
-            except MismatchError as e:
-                print("Got this MismatchError:")
-                print(e)
-                print(f"while processing node i={i}:")
-                print(f"str(node):{node}")
-                print("Symbolic inputs: ")
-                for elem in node.inputs:
-                    print(min_informative_str(elem))
-                print("str(output) of outputs: ")
-                for elem in fn.outputs:
-                    assert isinstance(elem, list)
-                    (elem,) = elem
-                    print(str(elem))
-                print(f"function name: {fgraph.name}")
-                raise MismatchError("Non-determinism detected by WrapLinker")
-
-        def callback(fgraph, i, node, fn):
-            """
-            Function called by Apply nodes at the end of each computation?
-            """
-
-            if fgraph.name is None:
-                raise ValueError(
-                    "Un-named functions are not allowed with RecordMode, "
-                    "because they make it impossible to tell if the same function is "
-                    "running during the playback."
-                )
-
-            if fgraph not in self.known_fgraphs:
-                assert not any(elem.name == fgraph.name for elem in self.known_fgraphs)
-                self.known_fgraphs.add(fgraph)
-                num_app = len(fgraph.apply_nodes)
-                line = f"Function {fgraph.name} has {num_app} apply nodes.\n"
-                handle_line(fgraph, line, i, node, fn)
-
-            line = f"Function name: {fgraph.name}\n"
-            handle_line(fgraph, line, i, node, fn)
-            line = f"Node {i}:{node}\n"
-            handle_line(fgraph, line, i, node, fn)
-            assert all(isinstance(x, list) and len(x) == 1 for x in fn.inputs)
-
-            def digest(x):
-                x = x[0]
-                return hex_digest(x)
-
-            inputs_digest = " ".join([digest(x) for x in fn.inputs])
-            line = f"Inputs: {inputs_digest}\n"
-            handle_line(fgraph, line, i, node, fn)
-            fn()
-            outputs_digest = " ".join([digest(x) for x in fn.outputs])
-            line = f"Outputs: {outputs_digest}\n"
-            handle_line(fgraph, line, i, node, fn)
-
-        # linker = aesara.link.c.basic.OpWiseCLinker()
-        linker = VMLinker(use_cloop=bool(config.cxx))
-
-        wrap_linker = WrapLinkerMany([linker], [callback])
-        super().__init__(linker=wrap_linker, optimizer="fast_run", db=db)
--- a/tests/test_determinism.py
+++ b/tests/test_determinism.py
-from collections import OrderedDict
-from datetime import datetime
-from io import StringIO
-
-import numpy as np
-
-from aesara.compile import shared
-from aesara.compile.function import function
-from aesara.configdefaults import config
-from aesara.graph import basic
-from aesara.printing import var_descriptor
-from tests.record import Record, RecordMode
-
-
-__authors__ = "Ian Goodfellow " "PyMC Developers " "Aesara Developers "
-__license__ = "3-clause BSD"
-
-
-def disturb_mem():
-    # Allocate a time-dependent amount of objects to increase
-    # chances of subsequently objects' ids changing from run
-    # to run. This is useful for exposing issues that cause
-    # non-deterministic behavior due to dependence on memory
-    # addresses, like iterating over a dict or a set.
-    global l
-    now = datetime.now()
-    ms = now.microsecond
-    ms = int(ms)
-    n = ms % 1000
-    m = ms // 1000
-    l = [[0] * m for i in range(n)]
-
-
-def sharedX(x, name=None):
-    x = np.cast[config.floatX](x)
-    return shared(x, name)
-
-
-def test_determinism_1():
-    # FIXME: This is a poor test.
-
-    # Tests that repeatedly running a script that compiles and
-    # runs a function does exactly the same thing every time it
-    # is run, even when the memory addresses of the objects involved
-    # change.
-    # This specific script is capable of catching a bug where
-    # FunctionGraph.toposort was non-deterministic.
-
-    def run(replay, log=None):
-
-        if not replay:
-            log = StringIO()
-        else:
-            log = StringIO(log)
-        record = Record(replay=replay, file_object=log)
-
-        disturb_mem()
-
-        mode = RecordMode(record=record)
-
-        b = sharedX(np.zeros((2,)), name="b")
-        channels = OrderedDict()
-
-        disturb_mem()
-
-        v_max = b.max(axis=0)
-        v_min = b.min(axis=0)
-        v_range = v_max - v_min
-
-        updates = []
-        for i, val in enumerate(
-            [
-                v_max.max(),
-                v_max.min(),
-                v_range.max(),
-            ]
-        ):
-            disturb_mem()
-            s = sharedX(0.0, name="s_" + str(i))
-            updates.append((s, val))
-
-        for var in basic.ancestors(update for _, update in updates):
-            if var.name is not None and var.name != "b":
-                if var.name[0] != "s" or len(var.name) != 2:
-                    var.name = None
-
-        for key in channels:
-            updates.append((s, channels[key]))
-        f = function([], mode=mode, updates=updates, on_unused_input="ignore", name="f")
-        for output in f.maker.fgraph.outputs:
-            mode.record.handle_line(var_descriptor(output) + "\n")
-        disturb_mem()
-        f()
-
-        mode.record.f.flush()
-
-        if not replay:
-            return log.getvalue()
-
-    log = run(0)
-    # Do several trials, since failure doesn't always occur
-    # (Sometimes you sample the same outcome twice in a row)
-    for i in range(10):
-        run(1, log)
--- a/tests/test_record.py
+++ b/tests/test_record.py
-from io import StringIO
-
-from aesara import function
-from aesara.tensor.type import iscalar
-from tests.record import MismatchError, Record, RecordMode
-
-
-def test_record_good():
-    # Tests that when we record a sequence of events, then
-    # repeat it exactly, the Record class:
-    #     1) Records it correctly
-    #     2) Does not raise any errors
-
-    # Record a sequence of events
-    output = StringIO()
-
-    recorder = Record(file_object=output, replay=False)
-
-    num_lines = 10
-
-    for i in range(num_lines):
-        recorder.handle_line(str(i) + "\n")
-
-    # Make sure they were recorded correctly
-    output_value = output.getvalue()
-
-    assert output_value == "".join(str(i) + "\n" for i in range(num_lines))
-
-    # Make sure that the playback functionality doesn't raise any errors
-    # when we repeat them
-    output = StringIO(output_value)
-
-    playback_checker = Record(file_object=output, replay=True)
-
-    for i in range(num_lines):
-        playback_checker.handle_line(str(i) + "\n")
-
-
-def test_record_bad():
-    # Tests that when we record a sequence of events, then
-    # do something different on playback, the Record class catches it.
-
-    # Record a sequence of events
-    output = StringIO()
-
-    recorder = Record(file_object=output, replay=False)
-
-    num_lines = 10
-
-    for i in range(num_lines):
-        recorder.handle_line(str(i) + "\n")
-
-    # Make sure that the playback functionality doesn't raise any errors
-    # when we repeat some of them
-    output_value = output.getvalue()
-    output = StringIO(output_value)
-
-    playback_checker = Record(file_object=output, replay=True)
-
-    for i in range(num_lines // 2):
-        playback_checker.handle_line(str(i) + "\n")
-
-    # Make sure it raises an error when we deviate from the recorded sequence
-    try:
-        playback_checker.handle_line("0\n")
-    except MismatchError:
-        return
-    raise AssertionError(
-        "Failed to detect mismatch between recorded sequence " " and repetition of it."
-    )
-
-
-def test_record_mode_good():
-    # Like test_record_good, but some events are recorded by the
-    # aesara RecordMode. We don't attempt to check the
-    # exact string value of the record in this case.
-
-    # Record a sequence of events
-    output = StringIO()
-
-    recorder = Record(file_object=output, replay=False)
-
-    record_mode = RecordMode(recorder)
-
-    i = iscalar()
-    f = function([i], i, mode=record_mode, name="f")
-
-    num_lines = 10
-
-    for i in range(num_lines):
-        recorder.handle_line(str(i) + "\n")
-        f(i)
-
-    # Make sure that the playback functionality doesn't raise any errors
-    # when we repeat them
-    output_value = output.getvalue()
-    output = StringIO(output_value)
-
-    playback_checker = Record(file_object=output, replay=True)
-
-    playback_mode = RecordMode(playback_checker)
-
-    i = iscalar()
-    f = function([i], i, mode=playback_mode, name="f")
-
-    for i in range(num_lines):
-        playback_checker.handle_line(str(i) + "\n")
-        f(i)
-
-
-def test_record_mode_bad():
-    # Like test_record_bad, but some events are recorded by the
-    # aesara RecordMode, as is the event that triggers the mismatch
-    # error.
-
-    # Record a sequence of events
-    output = StringIO()
-
-    recorder = Record(file_object=output, replay=False)
-
-    record_mode = RecordMode(recorder)
-
-    i = iscalar()
-    f = function([i], i, mode=record_mode, name="f")
-
-    num_lines = 10
-
-    for i in range(num_lines):
-        recorder.handle_line(str(i) + "\n")
-        f(i)
-
-    # Make sure that the playback functionality doesn't raise any errors
-    # when we repeat them
-    output_value = output.getvalue()
-    output = StringIO(output_value)
-
-    playback_checker = Record(file_object=output, replay=True)
-
-    playback_mode = RecordMode(playback_checker)
-
-    i = iscalar()
-    f = function([i], i, mode=playback_mode, name="f")
-
-    for i in range(num_lines // 2):
-        playback_checker.handle_line(str(i) + "\n")
-        f(i)
-
-    # Make sure a wrong event causes a MismatchError
-    try:
-        f(0)
-    except MismatchError:
-        return
-    raise AssertionError("Failed to detect a mismatch.")