testgroup / pytensor · Commit 88cc4d7e

addition of time-profiling mode to unittest processing apparatus

Authored July 16, 2012 by Eric Larsen; committed by Frederic, July 24, 2012.
Parent: 272620f9

Showing 2 changed files with 275 additions and 68 deletions:
- bin/theano-nose (+83 −14)
- theano/tests/run_tests_in_batch.py (+192 −54)
bin/theano-nose (+83 −14)

#!/usr/bin/env python
__authors__ = "Olivier Delalleau, Pascal Lamblin, Eric Larsen"
__contact__ = "delallea@iro"

"""
...
@@ -13,10 +13,40 @@ It is also used to load the KnownFailure plugin, in order to hide
KnownFailureTests error messages. Use --without-knownfailure to
disable that plugin.

There are two additional local options: '--batch[=n]' and '--time-profile'.

If '--batch[=n]' is used without '--time-profile', this script will call
`run_tests_in_batch.py` in order to run the tests by batches, not all at the
same time. `run_tests_in_batch.py` will in turn call back this script in
another process. The batches comprise 100 tests each by default, and n tests
each if '--batch=n' is specified.

If the '--time-profile' option is used, this script calls
`run_tests_in_batch.py` with the option time_profile=True to conduct
time-profiling of the tests: each test is run and timed separately, and the
results are deposited in the files 'timeprof_sort' and 'timeprof_nosort',
whose location is specified in `run_tests_in_batch.py`. If the '--batch=n'
option is also specified, progress is reported to standard output after every
group of n tests; otherwise, after every group of 100 tests.

The files 'timeprof_sort' and 'timeprof_nosort' both contain one record per
test, with the following fields:
- test running time
- nosetests sequential test number
- test name
- name of the class to which the test belongs (if any); otherwise the full
  information is contained in the test name
- test outcome ('OK' or 'FAILED')

In 'timeprof_sort', test records are sorted by running time, whereas in
'timeprof_nosort' they are sorted by sequential number. The former is the
main information source for time-profiling. Since tests belonging to the same
or nearby classes and files have close sequential numbers, the latter may be
used to identify duration patterns among the tests. A full log is also saved
as 'timeprof_rawlog'.
"""
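The option handling the docstring describes can be sketched as follows. This is a minimal illustration of the dispatch, not the script's actual parser; the function name `split_local_options` and the exact handling of `--batch=n` are assumptions:

```python
def split_local_options(argv):
    # Separate the two local options from the arguments that will be
    # forwarded to nosetests. Returns (batch_size, time_profile, rest),
    # where batch_size None means "use run_tests_in_batch's default".
    batch_size = None
    time_profile = False
    rest = []
    for arg in argv:
        if arg.startswith('--batch'):
            # '--batch' alone keeps the default of 100 tests per batch;
            # '--batch=n' selects batches of n tests each.
            if '=' in arg:
                batch_size = int(arg.split('=', 1)[1])
        elif arg == '--time-profile':
            time_profile = True
        else:
            rest.append(arg)
    return batch_size, time_profile, rest
```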
import logging
...
@@ -33,7 +63,6 @@ def main():
    batch_args = [arg for arg in sys.argv if arg.startswith('--batch')]
    for arg in batch_args:
        sys.argv.remove(arg)
    if len(batch_args):
        if len(batch_args) > 1:
            _logger.warn(
...
@@ -48,8 +77,19 @@ def main():
            # Use run_tests_in_batch's default
            batch_size = None

    # Handle --time_prof arguments
    time_prof_args = [arg for arg in sys.argv if arg == '--time-profile']
    for arg in time_prof_args:
        sys.argv.remove(arg)

    # Time-profiling and batch modes
    from theano.tests import run_tests_in_batch
    if len(time_prof_args) and len(batch_args):
        return run_tests_in_batch.main(batch_size=batch_size,
                                       time_profile=True)
    elif len(time_prof_args):
        return run_tests_in_batch.main(batch_size=None,
                                       time_profile=True)
    elif len(batch_args):
        return run_tests_in_batch.main(batch_size=batch_size,
                                       time_profile=False)

    # Non-batch mode.
    addplugins = []
...
@@ -77,12 +117,41 @@ def help():
        KnownFailure plugin, in order to hide KnownFailureTests error
        messages. It also supports executing tests by batches.

        Local options:
        --batch[=n]:
            If specified without option '--time-profile', do not run all
            the tests in one run, but split the execution in batches of
            `n` tests each. Default n is 100.
        --time-profile:
            Each test will be run and timed separately and the results
            will be deposited in the files 'timeprof_sort' and
            'timeprof_nosort', whose location is specified in
            `run_tests_in_batch.py`. If the '--batch=n' option is also
            specified, progress will be reported to standard output after
            every group of n tests; otherwise, after every group of 100
            tests.
            The files 'timeprof_sort' and 'timeprof_nosort' both contain
            one record for each test, with the following fields:
            - test running time
            - nosetests sequential test number
            - test name
            - name of the class to which the test belongs (if any);
              otherwise the full information is contained in the test
              name
            - test outcome ('OK' or 'FAILED')
            In 'timeprof_sort', test records are sorted by running time,
            whereas in 'timeprof_nosort' they are reported by sequential
            number. The former is the main information source for
            time-profiling. Since tests belonging to the same or nearby
            classes and files have close sequential numbers, the latter
            may be used to identify duration patterns among the tests. A
            full log is also saved as 'timeprof_rawlog'.
        --help, -h: Displays this help.
        --without-knownfailure: Do not load the KnownFailure plugin.
...
theano/tests/run_tests_in_batch.py (+192 −54)

#!/usr/bin/env python
__authors__ = "Olivier Delalleau, Eric Larsen"
__contact__ = "delallea@iro"
"""
Run this script to run tests in small batches rather than all at the same
time, or to conduct time-profiling.

If no argument is provided, then the whole Theano test-suite is run.
Otherwise, only tests found in the directory given as argument are run.

If 'time_profile=False', this script performs three tasks:
1. Run `nosetests --collect-only --with-id` to collect test IDs
2. Run `nosetests --with-id i1 ... iN` with batches of 'batch_size'
   indices, until all tests have been run (currently batch_size=100 by
   default)
3. Run `nosetests --failed` to re-run only tests that failed
   => The output of this 3rd step is the one you should care about

If 'time_profile=True', this script conducts time-profiling of the tests:
1. Run `nosetests --collect-only --with-id` to collect test IDs
2. Run `nosetests --with-id i`, one test with ID 'i' at a time, collecting
   timing information and displaying progress on standard output after
   every group of 'batch_size' tests (100 by default), until all tests
   have been run.
   The results are deposited in the files 'timeprof_sort' and
   'timeprof_nosort'. Both contain one record for each test, with the
   following fields:
   - test running time
   - nosetests sequential test number
   - test name
   - name of the class to which the test belongs (if any); otherwise the
     full information is contained in the test name
   - test outcome ('OK' or 'FAILED')
   In 'timeprof_sort', test records are sorted by running time, whereas in
   'timeprof_nosort' they are reported by sequential number. The former is
   the main information source for time-profiling. Since tests belonging
   to the same or nearby classes and files have close sequential numbers,
   the latter may be used to identify duration patterns among the tests. A
   full log is also saved as 'timeprof_rawlog'.

One reason to use this script is if you are a Windows user, and see errors
like "Not enough storage is available to process this command" when trying
to simply run `nosetests` in your Theano installation directory. This error
is apparently
...
@@ -31,12 +54,16 @@ nosetests.
"""
import cPickle
import os
import subprocess
import sys
import datetime

import theano
def main(stdout=None, stderr=None, argv=None, theano_nose=None,
         batch_size=None, time_profile=False):
    """
    Run tests with optional output redirection.
...
@@ -58,7 +85,8 @@ def main(stdout=None, stderr=None, argv=None, theano_nose=None, batch_size=None)
    if argv is None:
        argv = sys.argv
    if theano_nose is None:
        theano_nose = os.path.join(theano.__path__[0], '..', 'bin',
                                   'theano-nose')
    if batch_size is None:
        batch_size = 100
    stdout_backup = sys.stdout
...
@@ -66,12 +94,13 @@ def main(stdout=None, stderr=None, argv=None, theano_nose=None, batch_size=None)
    try:
        sys.stdout = stdout
        sys.stderr = stderr
        run(stdout, stderr, argv, theano_nose, batch_size, time_profile)
    finally:
        sys.stdout = stdout_backup
        sys.stderr = stderr_backup
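The backup/finally pattern that `main()` uses around `sys.stdout`/`sys.stderr` can be illustrated in isolation. `with_redirected_stdout` is a hypothetical helper written for this sketch, not part of the script:

```python
import sys
from io import StringIO


def with_redirected_stdout(func, stream):
    # Point sys.stdout at `stream`, run func, and restore the original
    # stream even if func raises -- the same backup/finally pattern as
    # main() above.
    backup = sys.stdout
    try:
        sys.stdout = stream
        return func()
    finally:
        sys.stdout = backup


buf = StringIO()
with_redirected_stdout(lambda: print('captured'), buf)
```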
def run(stdout, stderr, argv, theano_nose, batch_size, time_profile):
    if len(argv) == 1:
        tests_dir = theano.__path__[0]
        other_args = []
...
@@ -84,6 +113,7 @@ def run(stdout, stderr, argv, theano_nose, batch_size):
    # It seems safer to fully regenerate the list of tests on each call.
    if os.path.isfile('.noseids'):
        os.remove('.noseids')

    # Collect test IDs.
    print """\
####################
...
@@ -97,11 +127,11 @@ def run(stdout, stderr, argv, theano_nose, batch_size):
    # Using sys.executable, so that the same Python version is used.
    python = sys.executable
    rval = subprocess.call(
        ([python, theano_nose, '--collect-only', '--with-id']
         + other_args),
        stdin=dummy_in.fileno(),
        stdout=stdout.fileno(),
        stderr=stderr.fileno())
    stdout.flush()
    stderr.flush()
    assert rval == 0
...
@@ -110,59 +140,167 @@ def run(stdout, stderr, argv, theano_nose, batch_size):
    ids = data['ids']
    n_tests = len(ids)
    assert n_tests == max(ids)

    # Standard batch testing is called for
    if not time_profile:
        failed = set()
        print """\
###################################
# RUNNING TESTS IN BATCHES OF %s #
###################################""" % batch_size
        # We suppress all output because we want the user to focus only on
        # the failed tests, which are re-run (with output) below.
        dummy_out = open(os.devnull, 'w')
        for test_id in xrange(1, n_tests + 1, batch_size):
            stdout.flush()
            stderr.flush()
            test_range = range(test_id,
                               min(test_id + batch_size, n_tests + 1))
            rval = subprocess.call(
                ([python, theano_nose, '-q', '--with-id']
                 + map(str, test_range)
                 + other_args),
                stdout=dummy_out.fileno(),
                stderr=dummy_out.fileno(),
                stdin=dummy_in.fileno())
            # Recover failed test indices from the 'failed' field of the
            # '.noseids' file. We need to do it after each batch because
            # otherwise this field may get erased. We use a set because it
            # seems like it is not systematically erased though, and we want
            # to avoid duplicates.
            failed = failed.union(cPickle.load(open(noseids_file, 'rb'))
                                  ['failed'])
            print '%s%% done (failed: %s)' % (
                (test_range[-1] * 100) // n_tests, len(failed))
        # Sort for cosmetic purpose only.
        failed = sorted(failed)
        if failed:
            # Re-run only failed tests
            print """\
################################
# RE-RUNNING FAILED TESTS ONLY #
################################"""
            stdout.flush()
            stderr.flush()
            subprocess.call(
                ([python, theano_nose, '-v', '--with-id']
                 + failed
                 + other_args),
                stdin=dummy_in.fileno(),
                stdout=stdout.fileno(),
                stderr=stderr.fileno())
            stdout.flush()
            stderr.flush()
            return 0
        else:
            print """\
####################
# ALL TESTS PASSED #
####################"""
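The batch loop above walks the test IDs 1..n_tests in strides of `batch_size`, with each batch clipped at the end of the ID range. A sketch of the same range arithmetic (the helper name `batch_ranges` is invented for illustration):

```python
def batch_ranges(n_tests, batch_size):
    # Mirror the loop: xrange(1, n_tests + 1, batch_size), where each
    # batch covers [test_id, min(test_id + batch_size, n_tests + 1)).
    batches = []
    for start in range(1, n_tests + 1, batch_size):
        batches.append(list(range(start,
                                  min(start + batch_size, n_tests + 1))))
    return batches
```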
    # Time-profiling is called for
    else:
        print """\
########################################
# RUNNING TESTS IN TIME-PROFILING MODE #
########################################"""

        # finds first word of list l containing string s
        def getIndexOfFirst(l, s):
            for pos, word in enumerate(l):
                if s in word:
                    return pos

        # finds last word of list l containing string s
        def getIndexOfLast(l, s):
            for pos, word in enumerate(reversed(l)):
                if s in word:
                    return (len(l) - pos - 1)
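For illustration, here are the two helpers above in self-contained form (renamed `get_index_of_first`/`get_index_of_last`; behavior intended to match, including the implicit `None` return when no word contains `s`):

```python
def get_index_of_first(words, s):
    # First position in `words` whose element contains substring `s`.
    for pos, word in enumerate(words):
        if s in word:
            return pos


def get_index_of_last(words, s):
    # Last position in `words` whose element contains substring `s`,
    # found by scanning the reversed list.
    for pos, word in enumerate(reversed(words)):
        if s in word:
            return len(words) - pos - 1
```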
        # initializing master profiling list and raw log
        prof_master_nosort = []
        prof_rawlog = []
        dummy_out = open(os.devnull, 'w')

        # iterating through tests
        for test_floor in xrange(1, n_tests + 1, batch_size):
            for test_id in xrange(test_floor,
                                  min(test_floor + batch_size,
                                      n_tests + 1)):
                proc = subprocess.Popen(
                    ([python, theano_nose, '-v', '--with-id']
                     + [str(test_id)]
                     + other_args),
                    stderr=subprocess.PIPE,
                    stdout=dummy_out.fileno(),
                    stdin=dummy_in.fileno())

                # recovering and processing data from pipe
                err = proc.stderr.read()
                # building the raw log
                prof_rawlog.append(err)

                # parsing the output
                l_err = err.split()
                try:
                    pos_id = getIndexOfFirst(l_err, '#')
                    prof_id = l_err[pos_id]
                    pos_dot = getIndexOfFirst(l_err, '...')
                    prof_test = ''
                    for s in l_err[pos_id + 1: pos_dot]:
                        prof_test += s + ' '
                    if 'OK' in err:
                        pos_ok = getIndexOfLast(l_err, 'OK')
                        prof_time = float(l_err[pos_ok - 1][0:-1])
                        prof_pass = 'OK'
                    else:
                        prof_time = 0.
                        prof_pass = 'FAILED TEST'
                except:
                    prof_time = 0
                    prof_id = '#' + str(test_id)
                    prof_test = ('FAILED PARSING, see raw log for details'
                                 ' on test')
                    prof_pass = ''
                prof_tuple = (prof_time, prof_id, prof_test, prof_pass)

                # appending tuple to master list
                prof_master_nosort.append(prof_tuple)
            print '%s%% time-profiled' % ((test_id * 100) // n_tests)
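The token-scanning in the `try` block above can be exercised on its own. `parse_timing` below is an illustrative restatement of that logic, not the script's code, and the sample line in the usage is invented to exercise the parser rather than guaranteed to match real nosetests output:

```python
def parse_timing(err, test_id):
    # Locate the '#id' token, the '...' separator, and the time token
    # just before the trailing 'OK', as the profiling loop does.
    l_err = err.split()
    try:
        pos_id = next(i for i, w in enumerate(l_err) if '#' in w)
        prof_id = l_err[pos_id]
        pos_dot = next(i for i, w in enumerate(l_err) if '...' in w)
        prof_test = ' '.join(l_err[pos_id + 1:pos_dot])
        if 'OK' in err:
            pos_ok = len(l_err) - 1 - next(
                i for i, w in enumerate(reversed(l_err)) if 'OK' in w)
            # '0.42s' -> 0.42: strip the trailing unit character.
            prof_time = float(l_err[pos_ok - 1][:-1])
            prof_pass = 'OK'
        else:
            prof_time, prof_pass = 0.0, 'FAILED TEST'
    except StopIteration:
        # Markers absent: record a parse failure, as the except clause
        # above does.
        prof_time, prof_id = 0, '#' + str(test_id)
        prof_test, prof_pass = 'FAILED PARSING', ''
    return (prof_time, prof_id, prof_test, prof_pass)
```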
        # sorting tests according to running-time
        prof_master_sort = sorted(prof_master_nosort,
                                  key=lambda test: test[0],
                                  reverse=True)

        # saving results to readable files
        path_nosort = os.path.join(theano.__path__[0], '..', 'bin',
                                   'timeprof_nosort')
        path_sort = os.path.join(theano.__path__[0], '..', 'bin',
                                 'timeprof_sort')
        path_rawlog = os.path.join(theano.__path__[0], '..', 'bin',
                                   'timeprof_rawlog')
        f_nosort = open(path_nosort, 'w')
        f_sort = open(path_sort, 'w')
        f_rawlog = open(path_rawlog, 'w')
        stamp = str(datetime.datetime.now()) + '\n\n'
        fields = ('Fields: computation time; nosetests sequential id;'
                  ' test name; parent class (if any); outcome\n\n')
        f_nosort.write('TIME-PROFILING OF THEANO\'S NOSETESTS'
                       ' (by sequential id)\n\n' + stamp + fields)
        f_sort.write('TIME-PROFILING OF THEANO\'S NOSETESTS'
                     ' (sorted by computation time)\n\n' + stamp + fields)
        for i in xrange(len(prof_master_nosort)):
            s_nosort = ((str(prof_master_nosort[i][0]) + 's').ljust(10) +
                        " " + prof_master_nosort[i][1].ljust(7) + " " +
                        prof_master_nosort[i][2] +
                        prof_master_nosort[i][3] + "\n")
            f_nosort.write(s_nosort)
            s_sort = ((str(prof_master_sort[i][0]) + 's').ljust(10) +
                      " " + prof_master_sort[i][1].ljust(7) + " " +
                      prof_master_sort[i][2] +
                      prof_master_sort[i][3] + "\n")
            f_sort.write(s_sort)
        f_nosort.close()
        f_sort.close()
        f_rawlog.write('TIME-PROFILING OF THEANO\'S NOSETESTS'
                       ' (raw log)\n\n' + stamp)
        for i in xrange(len(prof_rawlog)):
            f_rawlog.write(prof_rawlog[i])
        f_rawlog.close()


if __name__ == '__main__':
    sys.exit(main())
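Each record written to 'timeprof_sort'/'timeprof_nosort' is a fixed-width line built with `ljust`. A sketch of the same formatting (the helper name `format_record` is mine; the field widths match the loop above):

```python
def format_record(rec):
    # rec = (time, '#id', 'test name ', outcome), as built by the
    # profiling loop; the time field is padded to 10 columns and the
    # id field to 7.
    prof_time, prof_id, prof_test, prof_pass = rec
    return ((str(prof_time) + 's').ljust(10) + ' ' +
            prof_id.ljust(7) + ' ' + prof_test + prof_pass + '\n')
```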