| // Copyright 2018 The Bazel Authors. All rights reserved. |
| // |
| // Licensed under the Apache License, Version 2.0 (the "License"); |
| // you may not use this file except in compliance with the License. |
| // You may obtain a copy of the License at |
| // |
| // http://www.apache.org/licenses/LICENSE-2.0 |
| // |
| // Unless required by applicable law or agreed to in writing, software |
| // distributed under the License is distributed on an "AS IS" BASIS, |
| // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| // See the License for the specific language governing permissions and |
| // limitations under the License. |
| |
| #include "src/main/cpp/util/path_platform.h" |
| |
| #include <assert.h> |
| #include <wchar.h> // wcslen |
| #include <windows.h> |
| |
| #include <algorithm> |
| #include <memory> // unique_ptr |
| #include <sstream> |
| #include <vector> |
| |
| #include "src/main/cpp/util/errors.h" |
| #include "src/main/cpp/util/exit_code.h" |
| #include "src/main/cpp/util/file_platform.h" |
| #include "src/main/cpp/util/logging.h" |
| #include "src/main/cpp/util/strings.h" |
| #include "src/main/native/windows/file.h" |
| |
| namespace blaze_util { |
| |
| using bazel::windows::HasUncPrefix; |
| |
| static char GetCurrentDrive(); |
| |
| template <typename char_type> |
| struct CharTraits { |
| static bool IsAlpha(char_type ch); |
| }; |
| |
| template <> |
| struct CharTraits<char> { |
| static bool IsAlpha(char ch) { return isalpha(ch); } |
| }; |
| |
| template <> |
| struct CharTraits<wchar_t> { |
| static bool IsAlpha(wchar_t ch) { return iswalpha(ch); } |
| }; |
| |
| template <typename char_type> |
| static bool IsPathSeparator(char_type ch) { |
| return ch == '/' || ch == '\\'; |
| } |
| |
| template <typename char_type> |
| static bool HasDriveSpecifierPrefix(const char_type* ch) { |
| return CharTraits<char_type>::IsAlpha(ch[0]) && ch[1] == ':'; |
| } |
| |
| std::string ConvertPath(const std::string& path) { |
| // The path may not be Windows-style and may not be normalized, so convert it. |
| std::string converted_path; |
| std::string error; |
| if (!blaze_util::AsWindowsPath(path, &converted_path, &error)) { |
| BAZEL_DIE(blaze_exit_code::LOCAL_ENVIRONMENTAL_ERROR) |
| << "ConvertPath(" << path << "): AsWindowsPath failed: " << error; |
| } |
| std::transform(converted_path.begin(), converted_path.end(), |
| converted_path.begin(), ::tolower); |
| return converted_path; |
| } |
| |
| std::string MakeAbsolute(const std::string& path) { |
| // The path may not be Windows-style and may not be normalized, so convert it. |
| std::wstring wpath; |
| std::string error; |
| if (!AsAbsoluteWindowsPath(path, &wpath, &error)) { |
| BAZEL_DIE(blaze_exit_code::LOCAL_ENVIRONMENTAL_ERROR) |
| << "MakeAbsolute(" << path |
| << "): AsAbsoluteWindowsPath failed: " << error; |
| } |
| std::transform(wpath.begin(), wpath.end(), wpath.begin(), ::towlower); |
| return std::string( |
| WstringToCstring(RemoveUncPrefixMaybe(wpath.c_str())).get()); |
| } |
| |
| std::string MakeAbsoluteAndResolveWindowsEnvvars(const std::string& path) { |
| // Get the size of the expanded string, so we know how big of a buffer to |
| // provide. The returned size includes the null terminator. |
| std::unique_ptr<CHAR[]> resolved(new CHAR[MAX_PATH]); |
| DWORD size = |
| ::ExpandEnvironmentStrings(path.c_str(), resolved.get(), MAX_PATH); |
| if (size == 0) { |
| BAZEL_DIE(blaze_exit_code::LOCAL_ENVIRONMENTAL_ERROR) |
| << "MakeAbsoluteAndResolveWindowsEnvvars(" << path |
| << "): ExpandEnvironmentStrings failed: " << GetLastErrorString(); |
| } else if (size > MAX_PATH) { |
| // Try again with a buffer bigger than MAX_PATH. |
| resolved.reset(new CHAR[size]); |
| DWORD second_size = |
| ::ExpandEnvironmentStrings(path.c_str(), resolved.get(), size); |
| if (second_size == 0) { |
| BAZEL_DIE(blaze_exit_code::LOCAL_ENVIRONMENTAL_ERROR) |
| << "MakeAbsoluteAndResolveWindowsEnvvars(" << path |
| << "): ExpandEnvironmentStrings failed with second buffer: " |
| << GetLastErrorString(); |
| } |
| assert(second_size <= size); |
| } |
| return MakeAbsolute(std::string(resolved.get())); |
| } |
| |
| bool CompareAbsolutePaths(const std::string& a, const std::string& b) { |
| return ConvertPath(a) == ConvertPath(b); |
| } |
| |
| std::string PathAsJvmFlag(const std::string& path) { |
| std::string cpath; |
| std::string error; |
| if (!AsWindowsPath(path, &cpath, &error)) { |
| BAZEL_DIE(blaze_exit_code::LOCAL_ENVIRONMENTAL_ERROR) |
| << "PathAsJvmFlag(" << path << "): AsWindowsPath failed: " << error; |
| } |
| // Convert forward slashes and backslashes to double (escaped) backslashes, so |
| // they are safe to pass on the command line to the JVM and the JVM won't |
| // misinterpret them. |
| // See https://github.com/bazelbuild/bazel/issues/2576 and |
| // https://github.com/bazelbuild/bazel/issues/6098 |
| size_t separators = 0; |
| for (const auto& c : cpath) { |
| if (c == '/' || c == '\\') { |
| separators++; |
| } |
| } |
| // In the result we replace each '/' and '\' with "\\", i.e. the total size |
| // *increases* by `separators`. |
| // Create a string of that size, filled with zeroes. |
| std::string result(/* count */ cpath.size() + separators, '\0'); |
| std::string::size_type i = 0; |
| for (const auto& c : cpath) { |
| if (c == '/' || c == '\\') { |
| result[i++] = '\\'; |
| result[i++] = '\\'; |
| } else { |
| result[i++] = c; |
| } |
| } |
| return result; |
| } |
| |
| void AddUncPrefixMaybe(std::wstring* path) { |
| if (path->size() >= MAX_PATH && !HasUncPrefix(path->c_str())) { |
| *path = std::wstring(L"\\\\?\\") + *path; |
| } |
| } |
| |
| const wchar_t* RemoveUncPrefixMaybe(const wchar_t* ptr) { |
| return ptr + (HasUncPrefix(ptr) ? 4 : 0); |
| } |
| |
| // Checks if the path is absolute and/or is a root path. |
| // |
| // If `must_be_root` is true, then in addition to being absolute, the path must |
| // also be just the root part, no other components, e.g. "c:\" is both absolute |
| // and root, but "c:\foo" is just absolute. |
| template <typename char_type> |
| static bool IsRootOrAbsolute(const std::basic_string<char_type>& path, |
| bool must_be_root) { |
| // An absolute path is one that starts with "/", "\", "c:/", "c:\", |
| // "\\?\c:\", or rarely "\??\c:\" or "\\.\c:\". |
| // |
| // It is unclear whether the UNC prefix is just "\\?\" or is "\??\" also |
| // valid (in some cases it seems to be, though MSDN doesn't mention it). |
| return |
| // path is (or starts with) "/" or "\" |
| ((must_be_root ? path.size() == 1 : !path.empty()) && |
| IsPathSeparator(path[0])) || |
| // path is (or starts with) "c:/" or "c:\" or similar |
| ((must_be_root ? path.size() == 3 : path.size() >= 3) && |
| HasDriveSpecifierPrefix(path.c_str()) && IsPathSeparator(path[2])) || |
| // path is (or starts with) "\\?\c:\" or "\??\c:\" or similar |
| ((must_be_root ? path.size() == 7 : path.size() >= 7) && |
| HasUncPrefix(path.c_str()) && |
| HasDriveSpecifierPrefix(path.c_str() + 4) && IsPathSeparator(path[6])); |
| } |
| |
| template <typename char_type> |
| static std::pair<std::basic_string<char_type>, std::basic_string<char_type> > |
| SplitPathImpl(const std::basic_string<char_type>& path) { |
| if (path.empty()) { |
| return std::make_pair(std::basic_string<char_type>(), |
| std::basic_string<char_type>()); |
| } |
| |
| size_t pos = path.size() - 1; |
| for (auto it = path.crbegin(); it != path.crend(); ++it, --pos) { |
| if (IsPathSeparator(*it)) { |
| if ((pos == 2 || pos == 6) && |
| IsRootOrAbsolute(path.substr(0, pos + 1), /* must_be_root */ true)) { |
| // Windows path, top-level directory, e.g. "c:\foo", |
| // result is ("c:\", "foo"). |
| // Or UNC path, top-level directory, e.g. "\\?\c:\foo" |
| // result is ("\\?\c:\", "foo"). |
| return std::make_pair( |
| // Include the "/" or "\" in the drive specifier. |
| path.substr(0, pos + 1), path.substr(pos + 1)); |
| } else { |
| // Windows path (neither top-level nor drive root), Unix path, or |
| // relative path. |
| return std::make_pair( |
| // If the only "/" is the leading one, then that shall be the first |
| // pair element, otherwise the substring up to the rightmost "/". |
| pos == 0 ? path.substr(0, 1) : path.substr(0, pos), |
| // If the rightmost "/" is the tail, then the second pair element |
| // should be empty. |
| pos == path.size() - 1 ? std::basic_string<char_type>() |
| : path.substr(pos + 1)); |
| } |
| } |
| } |
| // Handle the case with no '/' or '\' in `path`. |
| return std::make_pair(std::basic_string<char_type>(), path); |
| } |
| |
| std::pair<std::string, std::string> SplitPath(const std::string& path) { |
| return SplitPathImpl(path); |
| } |
| |
| std::pair<std::wstring, std::wstring> SplitPathW(const std::wstring& path) { |
| return SplitPathImpl(path); |
| } |
| |
| void assignNUL(std::string* s) { s->assign("NUL"); } |
| |
| void assignNUL(std::wstring* s) { s->assign(L"NUL"); } |
| |
| // Returns a normalized form of the input `path`. |
| // |
| // Normalization: |
| // Normalization means removing "." references, resolving ".." references, |
| // and deduplicating "/" characters while converting them to "\\". For |
| // example if `path` is "foo/../bar/.//qux", the result is "bar\\qux". |
| // |
| // Uplevel references ("..") that cannot go any higher in the directory tree |
| // are preserved if the path is relative, and ignored if the path is |
| // absolute, e.g. "../../foo" is normalized to "..\\..\\foo" but "c:/.." is |
| // normalized to "c:\\". |
| // |
| // This method does not check the semantics of the `path` beyond checking if |
| // it starts with a directory separator. Illegal paths such as one with a |
| // drive specifier in the middle (e.g. "foo/c:/bar") are accepted -- it's the |
| // caller's responsibility to pass a path that, when normalized, will be |
| // semantically correct. |
| // |
| // Current directory references (".") are preserved if and only if they are |
| // the only path segment, so "./" becomes "." but "./foo" becomes "foo". |
| // |
| // Arguments: |
| // `path` must be a relative or absolute Windows path, it may use "/" instead |
| // of "\\". The path should not start with "/" or "\\". |
| // |
| // Result: |
| // Returns false if and only if the path starts with a directory separator. |
| // |
| // The result won't have a UNC prefix, even if `path` did. The result won't |
| // have a trailing "\\" except when and only when the path is normalized to |
| // just a drive specifier (e.g. when `path` is "c:/" or "c:/foo/.."). The |
| // result will preserve the casing of the input, so "D:/Bar" becomes |
| // "D:\\Bar". |
| template <typename char_type> |
| static bool NormalizeWindowsPath(const std::basic_string<char_type>& path, |
| std::basic_string<char_type>* result) { |
| if (path.empty()) { |
| *result = path; |
| return true; |
| } |
| if (IsPathSeparator(path[0])) { |
| return false; |
| } |
| |
| static const std::basic_string<char_type> kDot = |
| std::basic_string<char_type>(1, '.'); |
| static const std::basic_string<char_type> kDotDot = |
| std::basic_string<char_type>(2, '.'); |
| |
| std::vector<std::basic_string<char_type> > segments; |
| std::basic_string<char_type>::size_type seg_start = path.size(); |
| std::basic_string<char_type>::size_type total_len = 0; |
| for (std::basic_string<char_type>::size_type i = |
| HasUncPrefix(path.c_str()) ? 4 : 0; |
| i <= path.size(); ++i) { |
| if (i == path.size() || IsPathSeparator(path[i])) { |
| // The current character ends a segment. |
| if (seg_start < path.size() && i > seg_start) { |
| std::basic_string<char_type> seg = |
| i == path.size() ? path.substr(seg_start) |
| : path.substr(seg_start, i - seg_start); |
| if (seg == kDotDot) { |
| if (segments.empty() || segments.back() == kDotDot) { |
| // Preserve ".." if the path is relative and there are only ".." |
| // segment(s) at the front. |
| segments.push_back(seg); |
| total_len += 2; |
| } else if (segments.size() == 1 && segments.back() == kDot) { |
| // Replace the existing "." if that was the only path segment. |
| segments[0] = seg; |
| total_len = 2; |
| } else if (segments.size() > 1 || |
| !HasDriveSpecifierPrefix(segments.back().c_str())) { |
| // Remove the last segment unless the path is already at the root |
| // directory. |
| total_len -= segments.back().size(); |
| segments.pop_back(); |
| } |
| } else if (seg == kDot) { |
| if (segments.empty()) { |
| // Preserve "." if and only if it's the first path segment. |
| // Subsequent segments may replace this segment. |
| segments.push_back(seg); |
| total_len = 1; |
| } |
| } else { |
| // This is a normal path segment, i.e. neither "." nor ".." |
| if (segments.size() == 1 && segments[0] == kDot) { |
| // Replace the only path segment if it was "." |
| segments[0] = seg; |
| total_len = seg.size(); |
| } else { |
| // Store the current segment. |
| segments.push_back(seg); |
| total_len += seg.size(); |
| } |
| } |
| } |
| // Indicate that there's no segment started. |
| seg_start = path.size(); |
| } else { |
| // The current character starts a new segment, or is inside one. |
| if (seg_start == path.size()) { |
| // The current character starts the segment. |
| seg_start = i; |
| } |
| } |
| } |
| if (segments.empty()) { |
| result->clear(); |
| return true; |
| } |
| if (segments.size() == 1 && |
| HasDriveSpecifierPrefix(segments.back().c_str())) { |
| *result = segments.back() + std::basic_string<char_type>(1, '\\'); |
| return true; |
| } |
| // Reserve enough space for all segments plus separators between them (one |
| // less than segments.size()). |
| *result = std::basic_string<char_type>(total_len + segments.size() - 1, 0); |
| std::basic_string<char_type>::iterator pos = result->begin(); |
| std::basic_string<char_type>::size_type idx = 0; |
| for (const auto& seg : segments) { |
| std::copy(seg.cbegin(), seg.cend(), pos); |
| pos += seg.size(); |
| if (pos < result->cend() - 1) { |
| // Add a separator if we haven't reached the end of the string yet. |
| *pos++ = '\\'; |
| } |
| } |
| return true; |
| } |
| |
| template <typename char_type> |
| bool AsWindowsPath(const std::basic_string<char_type>& path, |
| std::basic_string<char_type>* result, std::string* error) { |
| if (path.empty()) { |
| result->clear(); |
| return true; |
| } |
| if (IsDevNull(path.c_str())) { |
| assignNUL(result); |
| return true; |
| } |
| if (HasUncPrefix(path.c_str())) { |
| // Path has "\\?\" prefix --> assume it's already Windows-style. |
| *result = path.c_str(); |
| return true; |
| } |
| if (IsPathSeparator(path[0]) && path.size() > 1 && IsPathSeparator(path[1])) { |
| // Unsupported path: "\\" or "\\server\path", or some degenerate form of |
| // these, such as "//foo". |
| if (error) { |
| *error = "network paths are unsupported"; |
| } |
| return false; |
| } |
| if (HasDriveSpecifierPrefix(path.c_str()) && |
| (path.size() < 3 || !IsPathSeparator(path[2]))) { |
| // Unsupported path: "c:" or "c:foo" |
| if (error) { |
| *error = "working-directory relative paths are unsupported"; |
| } |
| return false; |
| } |
| |
| std::basic_string<char_type> mutable_path = path; |
| if (path[0] == '/') { |
| if (error) { |
| *error = "Unix-style paths are unsupported"; |
| } |
| return false; |
| } |
| |
| if (path[0] == '\\') { |
| // This is an absolute Windows path on the current drive, e.g. "\foo\bar". |
| std::basic_string<char_type> drive(1, GetCurrentDrive()); |
| drive.push_back(':'); |
| mutable_path = drive + path; |
| } // otherwise this is a relative path, or absolute Windows path. |
| |
| if (!NormalizeWindowsPath(mutable_path, result)) { |
| if (error) { |
| *error = "path normalization failed"; |
| } |
| return false; |
| } |
| return true; |
| } |
| |
| bool AsWindowsPath(const std::string& path, std::wstring* result, |
| std::string* error) { |
| std::string normalized_win_path; |
| if (!AsWindowsPath(path, &normalized_win_path, error)) { |
| return false; |
| } |
| |
| result->assign(CstringToWstring(normalized_win_path.c_str()).get()); |
| return true; |
| } |
| |
| template <typename char_type> |
| bool AsAbsoluteWindowsPath(const std::basic_string<char_type>& path, |
| std::wstring* result, std::string* error) { |
| if (path.empty()) { |
| result->clear(); |
| return true; |
| } |
| if (IsDevNull(path.c_str())) { |
| result->assign(L"NUL"); |
| return true; |
| } |
| if (!AsWindowsPath(path, result, error)) { |
| return false; |
| } |
| if (!IsRootOrAbsolute(*result, /* must_be_root */ false)) { |
| if (result->empty() || (result->size() == 1 && (*result)[0] == '.')) { |
| *result = GetCwdW(); |
| } else { |
| *result = GetCwdW() + L"\\" + *result; |
| } |
| } |
| if (!HasUncPrefix(result->c_str())) { |
| *result = std::wstring(L"\\\\?\\") + *result; |
| } |
| return true; |
| } |
| |
| bool AsShortWindowsPath(const std::string& path, std::string* result, |
| std::string* error) { |
| if (IsDevNull(path.c_str())) { |
| result->assign("NUL"); |
| return true; |
| } |
| |
| result->clear(); |
| std::wstring wpath; |
| std::wstring wsuffix; |
| if (!AsAbsoluteWindowsPath(path, &wpath, error)) { |
| return false; |
| } |
| DWORD size = ::GetShortPathNameW(wpath.c_str(), nullptr, 0); |
| if (size == 0) { |
| // GetShortPathNameW can fail if `wpath` does not exist. This is expected |
| // when we are about to create a file at that path, so instead of failing, |
| // walk up in the path until we find a prefix that exists and can be |
| // shortened, or is a root directory. Save the non-existent tail in |
| // `wsuffix`, we'll add it back later. |
| std::vector<std::wstring> segments; |
| while (size == 0 && !IsRootDirectoryW(wpath)) { |
| std::pair<std::wstring, std::wstring> split = SplitPathW(wpath); |
| wpath = split.first; |
| segments.push_back(split.second); |
| size = ::GetShortPathNameW(wpath.c_str(), nullptr, 0); |
| } |
| |
| // Join all segments. |
| std::wostringstream builder; |
| bool first = true; |
| for (auto it = segments.crbegin(); it != segments.crend(); ++it) { |
| if (!first || !IsRootDirectoryW(wpath)) { |
| builder << L'\\' << *it; |
| } else { |
| builder << *it; |
| } |
| first = false; |
| } |
| wsuffix = builder.str(); |
| } |
| |
| std::wstring wresult; |
| if (IsRootDirectoryW(wpath)) { |
| // Strip the UNC prefix from `wpath`, and the leading "\" from `wsuffix`. |
| wresult = std::wstring(RemoveUncPrefixMaybe(wpath.c_str())) + wsuffix; |
| } else { |
| std::unique_ptr<WCHAR[]> wshort( |
| new WCHAR[size]); // size includes null-terminator |
| if (size - 1 != ::GetShortPathNameW(wpath.c_str(), wshort.get(), size)) { |
| if (error) { |
| std::string last_error = GetLastErrorString(); |
| std::stringstream msg; |
| msg << "AsShortWindowsPath(" << path << "): GetShortPathNameW(" |
| << WstringToString(wpath) << ") failed: " << last_error; |
| *error = msg.str(); |
| } |
| return false; |
| } |
| // GetShortPathNameW may preserve the UNC prefix in the result, so strip it. |
| wresult = std::wstring(RemoveUncPrefixMaybe(wshort.get())) + wsuffix; |
| } |
| |
| result->assign(WstringToCstring(wresult.c_str()).get()); |
| ToLower(result); |
| return true; |
| } |
| |
| bool IsDevNull(const char* path) { |
| return path != NULL && *path != 0 && |
| (strncmp("/dev/null\0", path, 10) == 0 || |
| ((path[0] == 'N' || path[0] == 'n') && |
| (path[1] == 'U' || path[1] == 'u') && |
| (path[2] == 'L' || path[2] == 'l') && path[3] == 0)); |
| } |
| |
| bool IsDevNull(const wchar_t* path) { |
| return path != NULL && *path != 0 && |
| (wcsncmp(L"/dev/null\0", path, 10) == 0 || |
| ((path[0] == L'N' || path[0] == L'n') && |
| (path[1] == L'U' || path[1] == L'u') && |
| (path[2] == L'L' || path[2] == L'l') && path[3] == 0)); |
| } |
| |
| bool IsRootDirectory(const std::string& path) { |
| return IsRootOrAbsolute(path, true); |
| } |
| |
| bool IsAbsolute(const std::string& path) { |
| return IsRootOrAbsolute(path, false); |
| } |
| |
| bool IsAbsolute(const std::wstring& path) { |
| return IsRootOrAbsolute(path, false); |
| } |
| |
| bool IsRootDirectoryW(const std::wstring& path) { |
| return IsRootOrAbsolute(path, true); |
| } |
| |
| static char GetCurrentDrive() { |
| std::wstring cwd = GetCwdW(); |
| wchar_t wdrive = RemoveUncPrefixMaybe(cwd.c_str())[0]; |
| wchar_t offset = wdrive >= L'A' && wdrive <= L'Z' ? L'A' : L'a'; |
| return 'a' + wdrive - offset; |
| } |
| |
| namespace testing { |
| |
| bool TestOnly_NormalizeWindowsPath(const std::string& path, |
| std::string* result) { |
| return NormalizeWindowsPath(path, result); |
| } |
| |
| } // namespace testing |
| |
| } // namespace blaze_util |