[PATCH] [Support] Fix argv string escape bug on Windows

Aaron Ballman aaron at aaronballman.com
Mon Apr 22 11:42:07 PDT 2013


LGTM!

~Aaron

On Mon, Apr 22, 2013 at 2:36 PM, Reid Kleckner <rnk at google.com> wrote:
> Hi Bigcheese,
>
> This is http://llvm.org/PR15802.  Backslashes preceding double quotes in
> arguments must be escaped.  The interesting bit is that all other
> backslashes should *not* be escaped, because the un-escaping logic is
> only triggered by the presence of a double quote character.
>
> http://llvm-reviews.chandlerc.com/D705
>
> Files:
>   lib/Support/Windows/Program.inc
>   unittests/Support/CMakeLists.txt
>   unittests/Support/ProgramTest.cpp
>
> Index: lib/Support/Windows/Program.inc
> ===================================================================
> --- lib/Support/Windows/Program.inc
> +++ lib/Support/Windows/Program.inc
> @@ -126,15 +126,46 @@
>    return Str[0] == '\0' || strpbrk(Str, "\t \"&\'()*<>\\`^|") != 0;
>  }
>
> +/// CountPrecedingBackslashes - Returns the number of backslashes preceding Cur
> +/// in the C string Start.
> +static unsigned int CountPrecedingBackslashes(const char *Start,
> +                                              const char *Cur) {
> +  unsigned int Count = 0;
> +  --Cur;
> +  while (Cur >= Start && *Cur == '\\') {
> +    ++Count;
> +    --Cur;
> +  }
> +  return Count;
> +}
> +
> +/// EscapePrecedingEscapes - Append a backslash to Dst for every backslash
> +/// preceding Cur in the Start string.  Assumes Dst has enough space.
> +static char *EscapePrecedingEscapes(char *Dst, const char *Start,
> +                                    const char *Cur) {
> +  unsigned PrecedingEscapes = CountPrecedingBackslashes(Start, Cur);
> +  while (PrecedingEscapes > 0) {
> +    *Dst++ = '\\';
> +    --PrecedingEscapes;
> +  }
> +  return Dst;
> +}
>
>  /// ArgLenWithQuotes - Check whether argument needs to be quoted when calling
>  /// CreateProcess and returns length of quoted arg with escaped quotes
>  static unsigned int ArgLenWithQuotes(const char *Str) {
> +  const char *Start = Str;
>    unsigned int len = ArgNeedsQuotes(Str) ? 2 : 0;
>
>    while (*Str != '\0') {
> -    if (*Str == '\"')
> -      ++len;
> +    if (*Str == '\"') {
> +      // We need to add a backslash, but ensure that it isn't escaped.
> +      unsigned PrecedingEscapes = CountPrecedingBackslashes(Start, Str);
> +      len += PrecedingEscapes + 1;
> +    }
> +    // Note that we *don't* need to escape runs of backslashes that don't
> +    // precede a double quote!  See MSDN:
> +    // http://msdn.microsoft.com/en-us/library/17w5ykft%28v=vs.85%29.aspx
>
>      ++len;
>      ++Str;
> @@ -180,20 +211,27 @@
>
>    for (unsigned i = 0; args[i]; i++) {
>      const char *arg = args[i];
> +    const char *start = arg;
>
>      bool needsQuoting = ArgNeedsQuotes(arg);
>      if (needsQuoting)
>        *p++ = '"';
>
>      while (*arg != '\0') {
> -      if (*arg == '\"')
> +      if (*arg == '\"') {
> +        // Escape all preceding escapes (if any), and then escape the quote.
> +        p = EscapePrecedingEscapes(p, start, arg);
>          *p++ = '\\';
> +      }
>
>        *p++ = *arg++;
>      }
>
> -    if (needsQuoting)
> +    if (needsQuoting) {
> +      // Make sure our quote doesn't get escaped by a trailing backslash.
> +      p = EscapePrecedingEscapes(p, start, arg);
>        *p++ = '"';
> +    }
>      *p++ = ' ';
>    }
>
> Index: unittests/Support/CMakeLists.txt
> ===================================================================
> --- unittests/Support/CMakeLists.txt
> +++ unittests/Support/CMakeLists.txt
> @@ -23,6 +23,7 @@
>    MemoryTest.cpp
>    Path.cpp
>    ProcessTest.cpp
> +  ProgramTest.cpp
>    RegexTest.cpp
>    SwapByteOrderTest.cpp
>    TimeValue.cpp
> Index: unittests/Support/ProgramTest.cpp
> ===================================================================
> --- /dev/null
> +++ unittests/Support/ProgramTest.cpp
> @@ -0,0 +1,63 @@
> +//===- unittest/Support/ProgramTest.cpp -----------------------------------===//
> +//
> +//                     The LLVM Compiler Infrastructure
> +//
> +// This file is distributed under the University of Illinois Open Source
> +// License. See LICENSE.TXT for details.
> +//
> +//===----------------------------------------------------------------------===//
> +
> +#include "llvm/Support/CommandLine.h"
> +#include "llvm/Support/Path.h"
> +#include "llvm/Support/Program.h"
> +#include "gtest/gtest.h"
> +
> +#include <stdlib.h>
> +
> +namespace {
> +
> +using namespace llvm;
> +using namespace sys;
> +
> +static cl::opt<std::string>
> +ProgramTestStringArg1("program-test-string-arg1");
> +static cl::opt<std::string>
> +ProgramTestStringArg2("program-test-string-arg2");
> +
> +TEST(ProgramTest, CreateProcessTrailingSlash) {
> +  if (getenv("LLVM_PROGRAM_TEST_CHILD")) {
> +    if (ProgramTestStringArg1 == "has\\\\ trailing\\" &&
> +        ProgramTestStringArg2 == "has\\\\ trailing\\") {
> +      exit(0);  // Success!  The arguments were passed and parsed.
> +    }
> +    exit(1);
> +  }
> +
> +  // FIXME: Hardcoding argv0 here since I don't know a good cross-platform way
> +  // to get it.  Maybe ParseCommandLineOptions() should save it?
> +  Path my_exe = Path::GetMainExecutable("SupportTests", &ProgramTestStringArg1);
> +  const char *argv[] = {
> +    my_exe.c_str(),
> +    "--gtest_filter=ProgramTest.CreateProcessTrailingSlashChild",
> +    "-program-test-string-arg1", "has\\\\ trailing\\",
> +    "-program-test-string-arg2", "has\\\\ trailing\\",
> +    0
> +  };
> +  const char *envp[] = { "LLVM_PROGRAM_TEST_CHILD=1", 0 };
> +  std::string error;
> +  bool ExecutionFailed;
> +  // Redirect stdout and stdin to NUL, but let stderr through.
> +#ifdef LLVM_ON_WIN32
> +  Path nul("NUL");
> +#else
> +  Path nul("/dev/null");
> +#endif
> +  const Path *redirects[] = { &nul, &nul, 0 };
> +  int rc = Program::ExecuteAndWait(my_exe, argv, envp, redirects,
> +                                   /*secondsToWait=*/10, /*memoryLimit=*/0,
> +                                   &error, &ExecutionFailed);
> +  EXPECT_FALSE(ExecutionFailed) << error;
> +  EXPECT_EQ(0, rc);
> +}
> +
> +} // end anonymous namespace
>
> _______________________________________________
> llvm-commits mailing list
> llvm-commits at cs.uiuc.edu
> http://lists.cs.uiuc.edu/mailman/listinfo/llvm-commits
>



More information about the llvm-commits mailing list