lit: Add 'cd' support to the internal shell and port some tests

[oota-llvm.git] / utils / lit / lit / TestRunner.py
diff --git a/utils/lit/lit/TestRunner.py b/utils/lit/lit/TestRunner.py

index 548f6f532bcb169819e7f8f0d46a50ad0ea136cb..f1734eca37263f36ac060e1c42a59bd580836ee5 100644 (file)
--- a/utils/lit/lit/TestRunner.py
+++ b/utils/lit/lit/TestRunner.py
@@ -1,14 +1,13 @@
+from __future__ import absolute_import
  import os, signal, subprocess, sys
-import StringIO
-
-import ShUtil
-import Test
-import Util
-
+import re
  import platform
  import tempfile
  
-import re
+import lit.ShUtil as ShUtil
+import lit.Test as Test
+import lit.util
+from lit.util import to_bytes, to_string
  
  class InternalShellError(Exception):
      def __init__(self, command, message):
@@ -23,52 +22,56 @@ kUseCloseFDs = not kIsWindows
  # Use temporary files to replace /dev/null on Windows.
  kAvoidDevNull = kIsWindows
  
-def executeCommand(command, cwd=None, env=None):
-    # Close extra file handles on UNIX (on Windows this cannot be done while
-    # also redirecting input).
-    close_fds = not kIsWindows
+class ShellEnvironment(object):
  
-    p = subprocess.Popen(command, cwd=cwd,
-                         stdin=subprocess.PIPE,
-                         stdout=subprocess.PIPE,
-                         stderr=subprocess.PIPE,
-                         env=env, close_fds=close_fds)
-    out,err = p.communicate()
-    exitCode = p.wait()
+    """Mutable shell environment containing things like CWD and env vars.
  
-    # Detect Ctrl-C in subprocess.
-    if exitCode == -signal.SIGINT:
-        raise KeyboardInterrupt
+    Environment variables are not implemented, but cwd tracking is.
+    """
  
-    return out, err, exitCode
+    def __init__(self, cwd, env):
+        self.cwd = cwd
+        self.env = env
  
-def executeShCmd(cmd, cfg, cwd, results):
+def executeShCmd(cmd, shenv, results):
      if isinstance(cmd, ShUtil.Seq):
          if cmd.op == ';':
-            res = executeShCmd(cmd.lhs, cfg, cwd, results)
-            return executeShCmd(cmd.rhs, cfg, cwd, results)
+            res = executeShCmd(cmd.lhs, shenv, results)
+            return executeShCmd(cmd.rhs, shenv, results)
  
          if cmd.op == '&':
              raise InternalShellError(cmd,"unsupported shell operator: '&'")
  
          if cmd.op == '||':
-            res = executeShCmd(cmd.lhs, cfg, cwd, results)
+            res = executeShCmd(cmd.lhs, shenv, results)
              if res != 0:
-                res = executeShCmd(cmd.rhs, cfg, cwd, results)
+                res = executeShCmd(cmd.rhs, shenv, results)
              return res
  
          if cmd.op == '&&':
-            res = executeShCmd(cmd.lhs, cfg, cwd, results)
+            res = executeShCmd(cmd.lhs, shenv, results)
              if res is None:
                  return res
  
              if res == 0:
-                res = executeShCmd(cmd.rhs, cfg, cwd, results)
+                res = executeShCmd(cmd.rhs, shenv, results)
              return res
  
          raise ValueError('Unknown shell command: %r' % cmd.op)
-
      assert isinstance(cmd, ShUtil.Pipeline)
+
+    # Handle shell builtins first.
+    if cmd.commands[0].args[0] == 'cd':
+        # Update the cwd in the environment.
+        if len(cmd.commands[0].args) != 2:
+            raise ValueError('cd supports only one argument')
+        newdir = cmd.commands[0].args[1]
+        if os.path.isabs(newdir):
+            shenv.cwd = newdir
+        else:
+            shenv.cwd = os.path.join(shenv.cwd, newdir)
+        return 0
+
      procs = []
      input = subprocess.PIPE
      stderrTempFiles = []
@@ -122,7 +125,9 @@ def executeShCmd(cmd, cfg, cwd, results):
                      if kAvoidDevNull and r[0] == '/dev/null':
                          r[2] = tempfile.TemporaryFile(mode=r[1])
                      else:
-                        r[2] = open(r[0], r[1])
+                        # Make sure relative paths are relative to the cwd.
+                        redir_filename = os.path.join(shenv.cwd, r[0])
+                        r[2] = open(redir_filename, r[1])
                      # Workaround a Win32 and/or subprocess bug when appending.
                      #
                      # FIXME: Actually, this is probably an instance of PR6753.
@@ -152,8 +157,8 @@ def executeShCmd(cmd, cfg, cwd, results):
  
          # Resolve the executable path ourselves.
          args = list(j.args)
-        args[0] = Util.which(args[0], cfg.environment['PATH'])
-        if not args[0]:
+        executable = lit.util.which(args[0], shenv.env['PATH'])
+        if not executable:
              raise InternalShellError(j, '%r: command not found' % j.args[0])
  
          # Replace uses of /dev/null with temporary files.
@@ -165,12 +170,16 @@ def executeShCmd(cmd, cfg, cwd, results):
                      named_temp_files.append(f.name)
                      args[i] = f.name
  
-        procs.append(subprocess.Popen(args, cwd=cwd,
-                                      stdin = stdin,
-                                      stdout = stdout,
-                                      stderr = stderr,
-                                      env = cfg.environment,
-                                      close_fds = kUseCloseFDs))
+        try:
+            procs.append(subprocess.Popen(args, cwd=shenv.cwd,
+                                          executable = executable,
+                                          stdin = stdin,
+                                          stdout = stdout,
+                                          stderr = stderr,
+                                          env = shenv.env,
+                                          close_fds = kUseCloseFDs))
+        except OSError as e:
+            raise InternalShellError(j, 'Could not create process due to {}'.format(e))
  
          # Immediately close stdin for any process taking stdin from us.
          if stdin == subprocess.PIPE:
@@ -212,6 +221,11 @@ def executeShCmd(cmd, cfg, cwd, results):
          f.seek(0, 0)
          procData[i] = (procData[i][0], f.read())
  
+    def to_string(bytes):
+        if isinstance(bytes, str):
+            return bytes
+        return bytes.encode('utf-8')
+
      exitCode = None
      for i,(out,err) in enumerate(procData):
          res = procs[i].wait()
@@ -219,10 +233,22 @@ def executeShCmd(cmd, cfg, cwd, results):
          if res == -signal.SIGINT:
              raise KeyboardInterrupt
  
+        # Ensure the resulting output is always of string type.
+        try:
+            out = to_string(out.decode('utf-8'))
+        except:
+            out = str(out)
+        try:
+            err = to_string(err.decode('utf-8'))
+        except:
+            err = str(err)
+
          results.append((cmd.commands[i], out, err, res))
          if cmd.pipe_err:
              # Python treats the exit code as a signed char.
-            if res < 0:
+            if exitCode is None:
+                exitCode = res
+            elif res < 0:
                  exitCode = min(exitCode, res)
              else:
                  exitCode = max(exitCode, res)
@@ -248,7 +274,7 @@ def executeScriptInternal(test, litConfig, tmpBase, commands, cwd):
              cmds.append(ShUtil.ShParser(ln, litConfig.isWindows,
                                          test.config.pipefail).parse())
          except:
-            return (Test.FAIL, "shell parser error on: %r" % ln)
+            return lit.Test.Result(Test.FAIL, "shell parser error on: %r" % ln)
  
      cmd = cmds[0]
      for c in cmds[1:]:
@@ -256,8 +282,10 @@ def executeScriptInternal(test, litConfig, tmpBase, commands, cwd):
  
      results = []
      try:
-        exitCode = executeShCmd(cmd, test.config, cwd, results)
-    except InternalShellError,e:
+        shenv = ShellEnvironment(cwd, test.config.environment)
+        exitCode = executeShCmd(cmd, shenv, results)
+    except InternalShellError:
+        e = sys.exc_info()[1]
          exitCode = 127
          results.append((e.command, '', e.message, exitCode))
  
@@ -303,30 +331,71 @@ def executeScript(test, litConfig, tmpBase, commands, cwd):
              # run on clang with no real loss.
              command = litConfig.valgrindArgs + command
  
-    return executeCommand(command, cwd=cwd, env=test.config.environment)
+    return lit.util.executeCommand(command, cwd=cwd,
+                                   env=test.config.environment)
+
+def parseIntegratedTestScriptCommands(source_path):
+    """
+    parseIntegratedTestScriptCommands(source_path) -> commands
+
+    Parse the commands in an integrated test script file into a list of
+    (line_number, command_type, line).
+    """
  
-def isExpectedFail(test, xfails):
-    # Check if any of the xfails match an available feature or the target.
-    for item in xfails:
-        # If this is the wildcard, it always fails.
-        if item == '*':
-            return True
+    # This code is carefully written to be dual compatible with Python 2.5+ and
+    # Python 3 without requiring input files to always have valid codings. The
+    # trick we use is to open the file in binary mode and use the regular
+    # expression library to find the commands, with it scanning strings in
+    # Python2 and bytes in Python3.
+    #
+    # Once we find a match, we do require each script line to be decodable to
+    # UTF-8, so we convert the outputs to UTF-8 before returning. This way the
+    # remaining code can work with "strings" agnostic of the executing Python
+    # version.
  
-        # If this is an exact match for one of the features, it fails.
-        if item in test.config.available_features:
-            return True
+    keywords = ['RUN:', 'XFAIL:', 'REQUIRES:', 'UNSUPPORTED:', 'END.']
+    keywords_re = re.compile(
+        to_bytes("(%s)(.*)\n" % ("|".join(k for k in keywords),)))
  
-        # If this is a part of the target triple, it fails.
-        if item in test.suite.config.target_triple:
-            return True
+    f = open(source_path, 'rb')
+    try:
+        # Read the entire file contents.
+        data = f.read()
+
+        # Ensure the data ends with a newline.
+        if not data.endswith(to_bytes('\n')):
+            data = data + to_bytes('\n')
+
+        # Iterate over the matches.
+        line_number = 1
+        last_match_position = 0
+        for match in keywords_re.finditer(data):
+            # Compute the updated line number by counting the intervening
+            # newlines.
+            match_position = match.start()
+            line_number += data.count(to_bytes('\n'), last_match_position,
+                                      match_position)
+            last_match_position = match_position
+
+            # Convert the keyword and line to UTF-8 strings and yield the
+            # command. Note that we take care to return regular strings in
+            # Python 2, to avoid other code having to differentiate between the
+            # str and unicode types.
+            keyword,ln = match.groups()
+            yield (line_number, to_string(keyword[:-1].decode('utf-8')),
+                   to_string(ln.decode('utf-8')))
+    finally:
+        f.close()
  
-    return False
  
  def parseIntegratedTestScript(test, normalize_slashes=False,
-                              extra_substitutions=[]):
+                              extra_substitutions=[], require_script=True):
      """parseIntegratedTestScript - Scan an LLVM/Clang style integrated test
      script and extract the lines to 'RUN' as well as 'XFAIL' and 'REQUIRES'
-    information. The RUN lines also will have variable substitution performed.
+    and 'UNSUPPORTED' information. The RUN lines also will have variable
+    substitution performed. If 'require_script' is False an empty script may be
+    returned. This can be used for test formats where the actual script is
+    optional or ignored.
      """
  
      # Get the temporary location, this is always relative to the test suite
@@ -339,8 +408,6 @@ def parseIntegratedTestScript(test, normalize_slashes=False,
      execdir,execbase = os.path.split(execpath)
      tmpDir = os.path.join(execdir, 'Output')
      tmpBase = os.path.join(tmpDir, execbase)
-    if test.index is not None:
-        tmpBase += '_%d' % test.index
  
      # Normalize slashes, if requested.
      if normalize_slashes:
@@ -361,18 +428,22 @@ def parseIntegratedTestScript(test, normalize_slashes=False,
                            ('%T', tmpDir),
                            ('#_MARKER_#', '%')])
  
+    # "%/[STpst]" should be normalized.
+    substitutions.extend([
+            ('%/s', sourcepath.replace('\\', '/')),
+            ('%/S', sourcedir.replace('\\', '/')),
+            ('%/p', sourcedir.replace('\\', '/')),
+            ('%/t', tmpBase.replace('\\', '/') + '.tmp'),
+            ('%/T', tmpDir.replace('\\', '/')),
+            ])
+
      # Collect the test lines from the script.
      script = []
-    xfails = []
      requires = []
-    line_number = 0
-    for ln in open(sourcepath):
-        line_number += 1
-        if 'RUN:' in ln:
-            # Isolate the command to run.
-            index = ln.index('RUN:')
-            ln = ln[index+4:]
-
+    unsupported = []
+    for line_number, command_type, ln in \
+            parseIntegratedTestScriptCommands(sourcepath):
+        if command_type == 'RUN':
              # Trim trailing whitespace.
              ln = ln.rstrip()
  
@@ -390,16 +461,19 @@ def parseIntegratedTestScript(test, normalize_slashes=False,
                  script[-1] = script[-1][:-1] + ln
              else:
                  script.append(ln)
-        elif 'XFAIL:' in ln:
-            items = ln[ln.index('XFAIL:') + 6:].split(',')
-            xfails.extend([s.strip() for s in items])
-        elif 'REQUIRES:' in ln:
-            items = ln[ln.index('REQUIRES:') + 9:].split(',')
-            requires.extend([s.strip() for s in items])
-        elif 'END.' in ln:
-            # Check for END. lines.
-            if ln[ln.index('END.'):].strip() == 'END.':
+        elif command_type == 'XFAIL':
+            test.xfails.extend([s.strip() for s in ln.split(',')])
+        elif command_type == 'REQUIRES':
+            requires.extend([s.strip() for s in ln.split(',')])
+        elif command_type == 'UNSUPPORTED':
+            unsupported.extend([s.strip() for s in ln.split(',')])
+        elif command_type == 'END':
+            # END commands are only honored if the rest of the line is empty.
+            if not ln.strip():
                  break
+        else:
+            raise ValueError("unknown script command type: %r" % (
+                    command_type,))
  
      # Apply substitutions to the script.  Allow full regular
      # expression syntax.  Replace each matching occurrence of regular
@@ -413,83 +487,76 @@ def parseIntegratedTestScript(test, normalize_slashes=False,
  
          # Strip the trailing newline and any extra whitespace.
          return ln.strip()
-    script = map(processLine, script)
+    script = [processLine(ln)
+              for ln in script]
  
      # Verify the script contains a run line.
-    if not script:
-        return (Test.UNRESOLVED, "Test has no run line!")
+    if require_script and not script:
+        return lit.Test.Result(Test.UNRESOLVED, "Test has no run line!")
  
      # Check for unterminated run lines.
-    if script[-1][-1] == '\\':
-        return (Test.UNRESOLVED, "Test has unterminated run lines (with '\\')")
+    if script and script[-1][-1] == '\\':
+        return lit.Test.Result(Test.UNRESOLVED,
+                               "Test has unterminated run lines (with '\\')")
  
      # Check that we have the required features:
      missing_required_features = [f for f in requires
                                   if f not in test.config.available_features]
      if missing_required_features:
          msg = ', '.join(missing_required_features)
-        return (Test.UNSUPPORTED,
-                "Test requires the following features: %s" % msg)
-
-    isXFail = isExpectedFail(test, xfails)
-    return script,isXFail,tmpBase,execdir
-
-def formatTestOutput(status, out, err, exitCode, script):
-    output = StringIO.StringIO()
-    print >>output, "Script:"
-    print >>output, "--"
-    print >>output, '\n'.join(script)
-    print >>output, "--"
-    print >>output, "Exit Code: %r" % exitCode,
-    print >>output
-    if out:
-        print >>output, "Command Output (stdout):"
-        print >>output, "--"
-        output.write(out)
-        print >>output, "--"
-    if err:
-        print >>output, "Command Output (stderr):"
-        print >>output, "--"
-        output.write(err)
-        print >>output, "--"
-    return (status, output.getvalue())
-
-def executeShTest(test, litConfig, useExternalSh,
-                  extra_substitutions=[]):
-    if test.config.unsupported:
-        return (Test.UNSUPPORTED, 'Test is unsupported')
-
-    res = parseIntegratedTestScript(test, useExternalSh, extra_substitutions)
-    if len(res) == 2:
-        return res
-
-    script, isXFail, tmpBase, execdir = res
-
+        return lit.Test.Result(Test.UNSUPPORTED,
+                               "Test requires the following features: %s" % msg)
+    unsupported_features = [f for f in unsupported
+                            if f in test.config.available_features]
+    if unsupported_features:
+        msg = ', '.join(unsupported_features)
+        return lit.Test.Result(Test.UNSUPPORTED,
+                    "Test is unsupported with the following features: %s" % msg)
+
+    return script,tmpBase,execdir
+
+def _runShTest(test, litConfig, useExternalSh,
+                   script, tmpBase, execdir):
      # Create the output directory if it does not already exist.
-    Util.mkdir_p(os.path.dirname(tmpBase))
+    lit.util.mkdir_p(os.path.dirname(tmpBase))
  
      if useExternalSh:
          res = executeScript(test, litConfig, tmpBase, script, execdir)
      else:
          res = executeScriptInternal(test, litConfig, tmpBase, script, execdir)
-    if len(res) == 2:
+    if isinstance(res, lit.Test.Result):
          return res
  
      out,err,exitCode = res
-    if isXFail:
-        ok = exitCode != 0
-        if ok:
-            status = Test.XFAIL
-        else:
-            status = Test.XPASS
+    if exitCode == 0:
+        status = Test.PASS
      else:
-        ok = exitCode == 0
-        if ok:
-            status = Test.PASS
-        else:
-            status = Test.FAIL
+        status = Test.FAIL
+
+    # Form the output log.
+    output = """Script:\n--\n%s\n--\nExit Code: %d\n\n""" % (
+        '\n'.join(script), exitCode)
+
+    # Append the outputs, if present.
+    if out:
+        output += """Command Output (stdout):\n--\n%s\n--\n""" % (out,)
+    if err:
+        output += """Command Output (stderr):\n--\n%s\n--\n""" % (err,)
+
+    return lit.Test.Result(status, output)
+
+
+def executeShTest(test, litConfig, useExternalSh,
+                  extra_substitutions=[]):
+    if test.config.unsupported:
+        return (Test.UNSUPPORTED, 'Test is unsupported')
+
+    res = parseIntegratedTestScript(test, useExternalSh, extra_substitutions)
+    if isinstance(res, lit.Test.Result):
+        return res
+    if litConfig.noExecute:
+        return lit.Test.Result(Test.PASS)
  
-    if ok:
-        return (status,'')
+    script, tmpBase, execdir = res
+    return _runShTest(test, litConfig, useExternalSh, script, tmpBase, execdir)
  
-    return formatTestOutput(status, out, err, exitCode, script)