Revert r188376, "[lit] Support parsing scripts with inconsistent or invalid encodings...

[oota-llvm.git] / utils / lit / lit / TestRunner.py
diff --git a/utils/lit/lit/TestRunner.py b/utils/lit/lit/TestRunner.py

index 29adff2229839f4b1656cfa0cd1eb0e0917e372d..068e4991b2110a67a5168021deed1c92688f726e 100644 (file)
--- a/utils/lit/lit/TestRunner.py
+++ b/utils/lit/lit/TestRunner.py
@@ -1,38 +1,25 @@
+from __future__ import absolute_import
  import os, signal, subprocess, sys
-import StringIO
-
-import ShUtil
-import Test
-import Util
-
+import re
  import platform
  import tempfile
  
+import lit.ShUtil as ShUtil
+import lit.Test as Test
+import lit.util
+
  class InternalShellError(Exception):
      def __init__(self, command, message):
          self.command = command
          self.message = message
  
+kIsWindows = platform.system() == 'Windows'
+
  # Don't use close_fds on Windows.
-kUseCloseFDs = platform.system() != 'Windows'
+kUseCloseFDs = not kIsWindows
  
  # Use temporary files to replace /dev/null on Windows.
-kAvoidDevNull = platform.system() == 'Windows'
-
-def executeCommand(command, cwd=None, env=None):
-    p = subprocess.Popen(command, cwd=cwd,
-                         stdin=subprocess.PIPE,
-                         stdout=subprocess.PIPE,
-                         stderr=subprocess.PIPE,
-                         env=env)
-    out,err = p.communicate()
-    exitCode = p.wait()
-
-    # Detect Ctrl-C in subprocess.
-    if exitCode == -signal.SIGINT:
-        raise KeyboardInterrupt
-
-    return out, err, exitCode
+kAvoidDevNull = kIsWindows
  
  def executeShCmd(cmd, cfg, cwd, results):
      if isinstance(cmd, ShUtil.Seq):
@@ -41,13 +28,14 @@ def executeShCmd(cmd, cfg, cwd, results):
              return executeShCmd(cmd.rhs, cfg, cwd, results)
  
          if cmd.op == '&':
-            raise NotImplementedError,"unsupported test command: '&'"
+            raise InternalShellError(cmd,"unsupported shell operator: '&'")
  
          if cmd.op == '||':
              res = executeShCmd(cmd.lhs, cfg, cwd, results)
              if res != 0:
                  res = executeShCmd(cmd.rhs, cfg, cwd, results)
              return res
+
          if cmd.op == '&&':
              res = executeShCmd(cmd.lhs, cfg, cwd, results)
              if res is None:
@@ -57,17 +45,19 @@ def executeShCmd(cmd, cfg, cwd, results):
                  res = executeShCmd(cmd.rhs, cfg, cwd, results)
              return res
  
-        raise ValueError,'Unknown shell command: %r' % cmd.op
+        raise ValueError('Unknown shell command: %r' % cmd.op)
  
      assert isinstance(cmd, ShUtil.Pipeline)
      procs = []
      input = subprocess.PIPE
      stderrTempFiles = []
+    opened_files = []
+    named_temp_files = []
      # To avoid deadlock, we use a single stderr stream for piped
      # output. This is null until we have seen some output using
      # stderr.
      for i,j in enumerate(cmd.commands):
-        # Apply the redirections, we use (N,) as a sentinal to indicate stdin,
+        # Apply the redirections, we use (N,) as a sentinel to indicate stdin,
          # stdout, stderr for N equal to 0, 1, or 2 respectively. Redirects to or
          # from a file are represented with a list [file, mode, file-object]
          # where file-object is initially None.
@@ -88,7 +78,7 @@ def executeShCmd(cmd, cfg, cwd, results):
              elif r[0] == ('<',):
                  redirects[0] = [r[1], 'r', None]
              else:
-                raise NotImplementedError,"Unsupported redirect: %r" % (r,)
+                raise InternalShellError(j,"Unsupported redirect: %r" % (r,))
  
          # Map from the final redirections to something subprocess can handle.
          final_redirects = []
@@ -97,14 +87,14 @@ def executeShCmd(cmd, cfg, cwd, results):
                  result = input
              elif r == (1,):
                  if index == 0:
-                    raise NotImplementedError,"Unsupported redirect for stdin"
+                    raise InternalShellError(j,"Unsupported redirect for stdin")
                  elif index == 1:
                      result = subprocess.PIPE
                  else:
                      result = subprocess.STDOUT
              elif r == (2,):
                  if index != 2:
-                    raise NotImplementedError,"Unsupported redirect on stdout"
+                    raise InternalShellError(j,"Unsupported redirect on stdout")
                  result = subprocess.PIPE
              else:
                  if r[2] is None:
@@ -113,8 +103,11 @@ def executeShCmd(cmd, cfg, cwd, results):
                      else:
                          r[2] = open(r[0], r[1])
                      # Workaround a Win32 and/or subprocess bug when appending.
+                    #
+                    # FIXME: Actually, this is probably an instance of PR6753.
                      if r[1] == 'a':
                          r[2].seek(0, 2)
+                    opened_files.append(r[2])
                  result = r[2]
              final_redirects.append(result)
  
@@ -138,10 +131,19 @@ def executeShCmd(cmd, cfg, cwd, results):
  
          # Resolve the executable path ourselves.
          args = list(j.args)
-        args[0] = Util.which(args[0], cfg.environment['PATH'])
+        args[0] = lit.util.which(args[0], cfg.environment['PATH'])
          if not args[0]:
              raise InternalShellError(j, '%r: command not found' % j.args[0])
  
+        # Replace uses of /dev/null with temporary files.
+        if kAvoidDevNull:
+            for i,arg in enumerate(args):
+                if arg == "/dev/null":
+                    f = tempfile.NamedTemporaryFile(delete=False)
+                    f.close()
+                    named_temp_files.append(f.name)
+                    args[i] = f.name
+
          procs.append(subprocess.Popen(args, cwd=cwd,
                                        stdin = stdin,
                                        stdout = stdout,
@@ -162,6 +164,13 @@ def executeShCmd(cmd, cfg, cwd, results):
          else:
              input = subprocess.PIPE
  
+    # Explicitly close any redirected files. We need to do this now because we
+    # need to release any handles we may have on the temporary files (important
+    # on Win32, for example). Since we have already spawned the subprocess, our
+    # handles have already been transferred so we do not need them anymore.
+    for f in opened_files:
+        f.close()
+
      # FIXME: There is probably still deadlock potential here. Yawn.
      procData = [None] * len(procs)
      procData[-1] = procs[-1].communicate()
@@ -176,7 +185,7 @@ def executeShCmd(cmd, cfg, cwd, results):
          else:
              err = ''
          procData[i] = (out,err)
-        
+
      # Read stderr out of the temp files.
      for i,f in stderrTempFiles:
          f.seek(0, 0)
@@ -192,121 +201,50 @@ def executeShCmd(cmd, cfg, cwd, results):
          results.append((cmd.commands[i], out, err, res))
          if cmd.pipe_err:
              # Python treats the exit code as a signed char.
-            if res < 0:
+            if exitCode is None:
+                exitCode = res
+            elif res < 0:
                  exitCode = min(exitCode, res)
              else:
                  exitCode = max(exitCode, res)
          else:
              exitCode = res
  
+    # Remove any named temporary files we created.
+    for f in named_temp_files:
+        try:
+            os.remove(f)
+        except OSError:
+            pass
+
      if cmd.negate:
          exitCode = not exitCode
  
      return exitCode
  
  def executeScriptInternal(test, litConfig, tmpBase, commands, cwd):
-    ln = ' &&\n'.join(commands)
-    try:
-        cmd = ShUtil.ShParser(ln, litConfig.isWindows).parse()
-    except:
-        return (Test.FAIL, "shell parser error on: %r" % ln)
-
-    results = []
-    try:
-        exitCode = executeShCmd(cmd, test.config, cwd, results)
-    except InternalShellError,e:
-        out = ''
-        err = e.message
-        exitCode = 255
-
-    out = err = ''
-    for i,(cmd, cmd_out,cmd_err,res) in enumerate(results):
-        out += 'Command %d: %s\n' % (i, ' '.join('"%s"' % s for s in cmd.args))
-        out += 'Command %d Result: %r\n' % (i, res)
-        out += 'Command %d Output:\n%s\n\n' % (i, cmd_out)
-        out += 'Command %d Stderr:\n%s\n\n' % (i, cmd_err)
-
-    return out, err, exitCode
-
-def executeTclScriptInternal(test, litConfig, tmpBase, commands, cwd):
-    import TclUtil
      cmds = []
      for ln in commands:
-        # Given the unfortunate way LLVM's test are written, the line gets
-        # backslash substitution done twice.
-        ln = TclUtil.TclLexer(ln).lex_unquoted(process_all = True)
-
          try:
-            tokens = list(TclUtil.TclLexer(ln).lex())
+            cmds.append(ShUtil.ShParser(ln, litConfig.isWindows,
+                                        test.config.pipefail).parse())
          except:
-            return (Test.FAIL, "Tcl lexer error on: %r" % ln)
-
-        # Validate there are no control tokens.
-        for t in tokens:
-            if not isinstance(t, str):
-                return (Test.FAIL,
-                        "Invalid test line: %r containing %r" % (ln, t))
-
-        try:
-            cmds.append(TclUtil.TclExecCommand(tokens).parse_pipeline())
-        except:
-            return (Test.FAIL, "Tcl 'exec' parse error on: %r" % ln)
-
-    if litConfig.useValgrind:
-        for pipeline in cmds:
-            if pipeline.commands:
-                # Only valgrind the first command in each pipeline, to avoid
-                # valgrinding things like grep, not, and FileCheck.
-                cmd = pipeline.commands[0]
-                cmd.args = litConfig.valgrindArgs + cmd.args
+            return (Test.FAIL, "shell parser error on: %r" % ln)
  
      cmd = cmds[0]
      for c in cmds[1:]:
          cmd = ShUtil.Seq(cmd, '&&', c)
  
-    # FIXME: This is lame, we shouldn't need bash. See PR5240.
-    bashPath = litConfig.getBashPath()
-    if litConfig.useTclAsSh and bashPath:
-        script = tmpBase + '.script'
-
-        # Write script file
-        f = open(script,'w')
-        print >>f, 'set -o pipefail'
-        cmd.toShell(f, pipefail = True)
-        f.close()
-
-        if 0:
-            print >>sys.stdout, cmd
-            print >>sys.stdout, open(script).read()
-            print >>sys.stdout
-            return '', '', 0
-
-        command = [litConfig.getBashPath(), script]
-        out,err,exitCode = executeCommand(command, cwd=cwd,
-                                          env=test.config.environment)
-
-        # Tcl commands fail on standard error output.
-        if err:
-            exitCode = 1
-            out = 'Command has output on stderr!\n\n' + out
-
-        return out,err,exitCode
-    else:
-        results = []
-        try:
-            exitCode = executeShCmd(cmd, test.config, cwd, results)
-        except InternalShellError,e:
-            results.append((e.command, '', e.message + '\n', 255))
-            exitCode = 255
+    results = []
+    try:
+        exitCode = executeShCmd(cmd, test.config, cwd, results)
+    except InternalShellError:
+        e = sys.exc_info()[1]
+        exitCode = 127
+        results.append((e.command, '', e.message, exitCode))
  
      out = err = ''
-
-    # Tcl commands fail on standard error output.
-    if [True for _,_,err,res in results if err]:
-        exitCode = 1
-        out += 'Command has output on stderr!\n\n'
-
-    for i,(cmd, cmd_out, cmd_err, res) in enumerate(results):
+    for i,(cmd, cmd_out,cmd_err,res) in enumerate(results):
          out += 'Command %d: %s\n' % (i, ' '.join('"%s"' % s for s in cmd.args))
          out += 'Command %d Result: %r\n' % (i, res)
          out += 'Command %d Output:\n%s\n\n' % (i, cmd_out)
@@ -315,50 +253,81 @@ def executeTclScriptInternal(test, litConfig, tmpBase, commands, cwd):
      return out, err, exitCode
  
  def executeScript(test, litConfig, tmpBase, commands, cwd):
+    bashPath = litConfig.getBashPath();
+    isWin32CMDEXE = (litConfig.isWindows and not bashPath)
      script = tmpBase + '.script'
-    if litConfig.isWindows:
+    if isWin32CMDEXE:
          script += '.bat'
  
      # Write script file
-    f = open(script,'w')
-    if litConfig.isWindows:
+    mode = 'w'
+    if litConfig.isWindows and not isWin32CMDEXE:
+      mode += 'b'  # Avoid CRLFs when writing bash scripts.
+    f = open(script, mode)
+    if isWin32CMDEXE:
          f.write('\nif %ERRORLEVEL% NEQ 0 EXIT\n'.join(commands))
      else:
-        f.write(' &&\n'.join(commands))
+        if test.config.pipefail:
+            f.write('set -o pipefail;')
+        f.write('{ ' + '; } &&\n{ '.join(commands) + '; }')
      f.write('\n')
      f.close()
  
-    if litConfig.isWindows:
+    if isWin32CMDEXE:
          command = ['cmd','/c', script]
      else:
-        command = ['/bin/sh', script]
+        if bashPath:
+            command = [bashPath, script]
+        else:
+            command = ['/bin/sh', script]
          if litConfig.useValgrind:
              # FIXME: Running valgrind on sh is overkill. We probably could just
              # run on clang with no real loss.
              command = litConfig.valgrindArgs + command
  
-    return executeCommand(command, cwd=cwd, env=test.config.environment)
+    return lit.util.executeCommand(command, cwd=cwd,
+                                   env=test.config.environment)
  
-def isExpectedFail(xfails, xtargets, target_triple):
-    # Check if any xfail matches this target.
+def isExpectedFail(test, xfails):
+    # Check if any of the xfails match an available feature or the target.
      for item in xfails:
-        if item == '*' or item in target_triple:
-            break
-    else:
-        return False
+        # If this is the wildcard, it always fails.
+        if item == '*':
+            return True
  
-    # If so, see if it is expected to pass on this target.
-    #
-    # FIXME: Rename XTARGET to something that makes sense, like XPASS.
-    for item in xtargets:
-        if item == '*' or item in target_triple:
-            return False
+        # If this is an exact match for one of the features, it fails.
+        if item in test.config.available_features:
+            return True
  
-    return True
+        # If this is a part of the target triple, it fails.
+        if item in test.suite.config.target_triple:
+            return True
  
-def parseIntegratedTestScript(test):
+    return False
+
+def parseIntegratedTestScriptCommands(sourcepath):
+    """
+    parseIntegratedTestScriptCommands(source_path) -> commands
+
+    Parse the commands in an integrated test script file into a list of
+    (line_number, command_type, line).
+    """
+    line_number = 0
+    for ln in open(sourcepath):
+        line_number += 1
+        if 'RUN:' in ln:
+            yield (line_number, 'RUN', ln[ln.index('RUN:')+4:])
+        elif 'XFAIL:' in ln:
+            yield (line_number, 'XFAIL', ln[ln.index('XFAIL:') + 6:])
+        elif 'REQUIRES:' in ln:
+            yield (line_number, 'REQUIRES', ln[ln.index('REQUIRES:') + 9:])
+        elif 'END.' in ln:
+            yield (line_number, 'END', ln[ln.index('END.') + 4:])
+
+def parseIntegratedTestScript(test, normalize_slashes=False,
+                              extra_substitutions=[]):
      """parseIntegratedTestScript - Scan an LLVM/Clang style integrated test
-    script and extract the lines to 'RUN' as well as 'XFAIL' and 'XTARGET'
+    script and extract the lines to 'RUN' as well as 'XFAIL' and 'REQUIRES'
      information. The RUN lines also will have variable substitution performed.
      """
  
@@ -367,127 +336,145 @@ def parseIntegratedTestScript(test):
      #
      # FIXME: This should not be here?
      sourcepath = test.getSourcePath()
+    sourcedir = os.path.dirname(sourcepath)
      execpath = test.getExecPath()
      execdir,execbase = os.path.split(execpath)
-    tmpBase = os.path.join(execdir, 'Output', execbase)
-    if test.index is not None:
-        tmpBase += '_%d' % test.index
+    tmpDir = os.path.join(execdir, 'Output')
+    tmpBase = os.path.join(tmpDir, execbase)
+
+    # Normalize slashes, if requested.
+    if normalize_slashes:
+        sourcepath = sourcepath.replace('\\', '/')
+        sourcedir = sourcedir.replace('\\', '/')
+        tmpDir = tmpDir.replace('\\', '/')
+        tmpBase = tmpBase.replace('\\', '/')
  
      # We use #_MARKER_# to hide %% while we do the other substitutions.
-    substitutions = [('%%', '#_MARKER_#')]
+    substitutions = list(extra_substitutions)
+    substitutions.extend([('%%', '#_MARKER_#')])
      substitutions.extend(test.config.substitutions)
      substitutions.extend([('%s', sourcepath),
-                          ('%S', os.path.dirname(sourcepath)),
-                          ('%p', os.path.dirname(sourcepath)),
+                          ('%S', sourcedir),
+                          ('%p', sourcedir),
+                          ('%{pathsep}', os.pathsep),
                            ('%t', tmpBase + '.tmp'),
-                          # FIXME: Remove this once we kill DejaGNU.
-                          ('%abs_tmp', tmpBase + '.tmp'),
+                          ('%T', tmpDir),
                            ('#_MARKER_#', '%')])
  
+    # "%/[STpst]" should be normalized.
+    substitutions.extend([
+            ('%/s', sourcepath.replace('\\', '/')),
+            ('%/S', sourcedir.replace('\\', '/')),
+            ('%/p', sourcedir.replace('\\', '/')),
+            ('%/t', tmpBase.replace('\\', '/') + '.tmp'),
+            ('%/T', tmpDir.replace('\\', '/')),
+            ])
+
      # Collect the test lines from the script.
      script = []
      xfails = []
-    xtargets = []
-    for ln in open(sourcepath):
-        if 'RUN:' in ln:
-            # Isolate the command to run.
-            index = ln.index('RUN:')
-            ln = ln[index+4:]
-
+    requires = []
+    for line_number, command_type, ln in \
+            parseIntegratedTestScriptCommands(sourcepath):
+        if command_type == 'RUN':
              # Trim trailing whitespace.
              ln = ln.rstrip()
  
+            # Substitute line number expressions
+            ln = re.sub('%\(line\)', str(line_number), ln)
+            def replace_line_number(match):
+                if match.group(1) == '+':
+                    return str(line_number + int(match.group(2)))
+                if match.group(1) == '-':
+                    return str(line_number - int(match.group(2)))
+            ln = re.sub('%\(line *([\+-]) *(\d+)\)', replace_line_number, ln)
+
              # Collapse lines with trailing '\\'.
              if script and script[-1][-1] == '\\':
                  script[-1] = script[-1][:-1] + ln
              else:
                  script.append(ln)
-        elif 'XFAIL:' in ln:
-            items = ln[ln.index('XFAIL:') + 6:].split(',')
-            xfails.extend([s.strip() for s in items])
-        elif 'XTARGET:' in ln:
-            items = ln[ln.index('XTARGET:') + 8:].split(',')
-            xtargets.extend([s.strip() for s in items])
-        elif 'END.' in ln:
-            # Check for END. lines.
-            if ln[ln.index('END.'):].strip() == 'END.':
+        elif command_type == 'XFAIL':
+            xfails.extend([s.strip() for s in ln.split(',')])
+        elif command_type == 'REQUIRES':
+            requires.extend([s.strip() for s in ln.split(',')])
+        elif command_type == 'END':
+            # END commands are only honored if the rest of the line is empty.
+            if not ln.strip():
                  break
+        else:
+            raise ValueError("unknown script command type: %r" % (
+                    command_type,))
  
-    # Apply substitutions to the script.
+    # Apply substitutions to the script.  Allow full regular
+    # expression syntax.  Replace each matching occurrence of regular
+    # expression pattern a with substitution b in line ln.
      def processLine(ln):
          # Apply substitutions
          for a,b in substitutions:
-            ln = ln.replace(a,b)
+            if kIsWindows:
+                b = b.replace("\\","\\\\")
+            ln = re.sub(a, b, ln)
  
          # Strip the trailing newline and any extra whitespace.
          return ln.strip()
-    script = map(processLine, script)
+    script = [processLine(ln)
+              for ln in script]
  
      # Verify the script contains a run line.
      if not script:
          return (Test.UNRESOLVED, "Test has no run line!")
  
+    # Check for unterminated run lines.
      if script[-1][-1] == '\\':
          return (Test.UNRESOLVED, "Test has unterminated run lines (with '\\')")
  
-    isXFail = isExpectedFail(xfails, xtargets, test.suite.config.target_triple)
+    # Check that we have the required features:
+    missing_required_features = [f for f in requires
+                                 if f not in test.config.available_features]
+    if missing_required_features:
+        msg = ', '.join(missing_required_features)
+        return (Test.UNSUPPORTED,
+                "Test requires the following features: %s" % msg)
+
+    isXFail = isExpectedFail(test, xfails)
      return script,isXFail,tmpBase,execdir
  
  def formatTestOutput(status, out, err, exitCode, script):
-    output = StringIO.StringIO()
-    print >>output, "Script:"
-    print >>output, "--"
-    print >>output, '\n'.join(script)
-    print >>output, "--"
-    print >>output, "Exit Code: %r" % exitCode
-    print >>output, "Command Output (stdout):"
-    print >>output, "--"
-    output.write(out)
-    print >>output, "--"
-    print >>output, "Command Output (stderr):"
-    print >>output, "--"
-    output.write(err)
-    print >>output, "--"
-    return (status, output.getvalue())
-
-def executeTclTest(test, litConfig):
-    if test.config.unsupported:
-        return (Test.UNSUPPORTED, 'Test is unsupported')
-
-    res = parseIntegratedTestScript(test)
-    if len(res) == 2:
-        return res
-
-    script, isXFail, tmpBase, execdir = res
-
-    if litConfig.noExecute:
-        return (Test.PASS, '')
-
-    # Create the output directory if it does not already exist.
-    Util.mkdir_p(os.path.dirname(tmpBase))
-
-    res = executeTclScriptInternal(test, litConfig, tmpBase, script, execdir)
-    if len(res) == 2:
-        return res
-
-    out,err,exitCode = res
-    if isXFail:
-        ok = exitCode != 0
-        status = (Test.XPASS, Test.XFAIL)[ok]
-    else:
-        ok = exitCode == 0
-        status = (Test.FAIL, Test.PASS)[ok]
-
-    if ok:
-        return (status,'')
-
-    return formatTestOutput(status, out, err, exitCode, script)
-
-def executeShTest(test, litConfig, useExternalSh):
+    output = """\
+Script:
+--
+%s
+--
+Exit Code: %d
+
+""" % ('\n'.join(script), exitCode)
+
+    # Append the stdout, if present.
+    if out:
+        output += """\
+Command Output (stdout):
+--
+%s
+--
+""" % (out,)
+
+    # Append the stderr, if present.
+    if err:
+        output += """\
+Command Output (stderr):
+--
+%s
+--
+""" % (err,)
+    return (status, output)
+
+def executeShTest(test, litConfig, useExternalSh,
+                  extra_substitutions=[]):
      if test.config.unsupported:
          return (Test.UNSUPPORTED, 'Test is unsupported')
  
-    res = parseIntegratedTestScript(test)
+    res = parseIntegratedTestScript(test, useExternalSh, extra_substitutions)
      if len(res) == 2:
          return res
  
@@ -497,7 +484,7 @@ def executeShTest(test, litConfig, useExternalSh):
          return (Test.PASS, '')
  
      # Create the output directory if it does not already exist.
-    Util.mkdir_p(os.path.dirname(tmpBase))
+    lit.util.mkdir_p(os.path.dirname(tmpBase))
  
      if useExternalSh:
          res = executeScript(test, litConfig, tmpBase, script, execdir)
@@ -509,10 +496,16 @@ def executeShTest(test, litConfig, useExternalSh):
      out,err,exitCode = res
      if isXFail:
          ok = exitCode != 0
-        status = (Test.XPASS, Test.XFAIL)[ok]
+        if ok:
+            status = Test.XFAIL
+        else:
+            status = Test.XPASS
      else:
          ok = exitCode == 0
-        status = (Test.FAIL, Test.PASS)[ok]
+        if ok:
+            status = Test.PASS
+        else:
+            status = Test.FAIL
  
      if ok:
          return (status,'')