blob: bbad8491f798de9fe986f2141bef5609026a4fe9 [file] [log] [blame]
// Copyright 2014 The Bazel Authors. All rights reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
package com.google.devtools.build.lib.shell;
import java.util.List;
/**
* Utility functions for Bourne shell commands, including escaping and
* tokenizing.
*/
public abstract class ShellUtils {
private ShellUtils() {}
/**
* Characters that have no special meaning to the shell.
*/
private static final String SAFE_PUNCTUATION = "@%-_+:,./";
/**
* Quotes a word so that it can be used, without further quoting,
* as an argument (or part of an argument) in a shell command.
*/
public static String shellEscape(String word) {
int len = word.length();
if (len == 0) {
// Empty string is a special case: needs to be quoted to ensure that it gets
// treated as a separate argument.
return "''";
}
for (int ii = 0; ii < len; ii++) {
char c = word.charAt(ii);
// We do this positively so as to be sure we don't inadvertently forget
// any unsafe characters.
if (!Character.isLetterOrDigit(c) && SAFE_PUNCTUATION.indexOf(c) == -1) {
// replace() actually means "replace all".
return "'" + word.replace("'", "'\\''") + "'";
}
}
return word;
}
/**
* Given an argv array such as might be passed to execve(2), returns a string
* that can be copied and pasted into a Bourne shell for a similar effect.
*/
public static String prettyPrintArgv(List<String> argv) {
StringBuilder buf = new StringBuilder();
for (String arg: argv) {
if (buf.length() > 0) {
buf.append(' ');
}
buf.append(shellEscape(arg));
}
return buf.toString();
}
/**
* Thrown by tokenize method if there is an error
*/
public static class TokenizationException extends Exception {
TokenizationException(String message) {
super(message);
}
}
/**
* Populates the passed list of command-line options extracted from {@code
* optionString}, which is a string containing multiple options, delimited in
* a Bourne shell-like manner.
*
* @param options the list to be populated with tokens.
* @param optionString the string to be tokenized.
* @throws TokenizationException if there was an error (such as an
* unterminated quotation).
*/
public static void tokenize(List<String> options, String optionString)
throws TokenizationException {
// See test suite for examples.
//
// Note: backslash escapes the following character, except within a
// single-quoted region where it is literal.
StringBuilder token = new StringBuilder();
boolean forceToken = false;
char quotation = '\0'; // NUL, '\'' or '"'
for (int ii = 0, len = optionString.length(); ii < len; ii++) {
char c = optionString.charAt(ii);
if (quotation != '\0') { // in quotation
if (c == quotation) { // end of quotation
quotation = '\0';
} else if (c == '\\' && quotation == '"') { // backslash in "-quotation
if (++ii == len) {
throw new TokenizationException("backslash at end of string");
}
c = optionString.charAt(ii);
if (c != '\\' && c != '"') {
token.append('\\');
}
token.append(c);
} else { // regular char, in quotation
token.append(c);
}
} else { // not in quotation
if (c == '\'' || c == '"') { // begin single/double quotation
quotation = c;
forceToken = true;
} else if (c == ' ' || c == '\t') { // space, not quoted
if (forceToken || token.length() > 0) {
options.add(token.toString());
token = new StringBuilder();
forceToken = false;
}
} else if (c == '\\') { // backslash, not quoted
if (++ii == len) {
throw new TokenizationException("backslash at end of string");
}
token.append(optionString.charAt(ii));
} else { // regular char, not quoted
token.append(c);
}
}
}
if (quotation != '\0') {
throw new TokenizationException("unterminated quotation");
}
if (forceToken || token.length() > 0) {
options.add(token.toString());
}
}
/**
* Escape command line arguments for {@code CreateProcessW} on Windows.
*
* <p>This method implements the same algorithm as the native xx_binary launcher does (see
* https://github.com/bazelbuild/bazel/pull/7411).
*
* <p>A similar algorithm with lots of background information is described here:
* https://blogs.msdn.microsoft.com/twistylittlepassagesallalike/2011/04/23/
*/
public static String windowsEscapeArg(String s) {
if (s.isEmpty()) {
return "\"\"";
} else {
boolean needsEscape = false;
for (int i = 0; i < s.length(); ++i) {
char c = s.charAt(i);
if (c == ' ' || c == '"') {
needsEscape = true;
break;
}
}
if (!needsEscape) {
return s;
}
}
StringBuilder result = new StringBuilder();
result.append('"');
int start = 0;
for (int i = 0; i < s.length(); ++i) {
char c = s.charAt(i);
if (c == '"' || c == '\\') {
// Copy the segment since the last special character.
if (start >= 0) {
result.append(s, start, i);
start = -1;
}
// Handle the current special character.
if (c == '"') {
// This is a quote character. Escape it with a single backslash.
result.append("\\\"");
} else {
// This is a backslash (or the first one in a run of backslashes).
// Whether we escape it depends on whether the run ends with a quote.
int runLen = 1;
int j = i + 1;
while (j < s.length() && s.charAt(j) == '\\') {
runLen++;
j++;
}
if (j == s.length()) {
// The run of backslashes goes to the end.
// We have to escape every backslash with another backslash.
for (int k = 0; k < runLen * 2; ++k) {
result.append('\\');
}
break;
} else if (j < s.length() && s.charAt(j) == '"') {
// The run of backslashes is terminated by a quote.
// We have to escape every backslash with another backslash, and
// escape the quote with one backslash.
for (int k = 0; k < runLen * 2; ++k) {
result.append('\\');
}
result.append("\\\"");
i += runLen; // 'i' is also increased in the loop iteration step
} else {
// No quote found. Each backslash counts for itself, they must not be
// escaped.
for (int k = 0; k < runLen; ++k) {
result.append('\\');
}
i += runLen - 1; // 'i' is also increased in the loop iteration step
}
}
} else {
// This is not a special character. Start the segment if necessary.
if (start < 0) {
start = i;
}
}
}
// Save final segment after the last special character.
if (start != -1) {
result.append(s, start, s.length());
}
result.append('"');
return result.toString();
}
}