| #!/usr/bin/env bash |
| # |
| # Copyright 2019 The Bazel Authors. All rights reserved. |
| # |
| # Licensed under the Apache License, Version 2.0 (the "License"); |
| # you may not use this file except in compliance with the License. |
| # You may obtain a copy of the License at |
| # |
| # http://www.apache.org/licenses/LICENSE-2.0 |
| # |
| # Unless required by applicable law or agreed to in writing, software |
| # distributed under the License is distributed on an "AS IS" BASIS, |
| # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| # See the License for the specific language governing permissions and |
| # limitations under the License. |
| # |
| # Verify handling of Unicode filenames. |
| |
| # --- begin runfiles.bash initialization --- |
| set -euo pipefail |
| if [[ ! -d "${RUNFILES_DIR:-/dev/null}" && ! -f "${RUNFILES_MANIFEST_FILE:-/dev/null}" ]]; then |
| if [[ -f "$0.runfiles_manifest" ]]; then |
| export RUNFILES_MANIFEST_FILE="$0.runfiles_manifest" |
| elif [[ -f "$0.runfiles/MANIFEST" ]]; then |
| export RUNFILES_MANIFEST_FILE="$0.runfiles/MANIFEST" |
| elif [[ -f "$0.runfiles/bazel_tools/tools/bash/runfiles/runfiles.bash" ]]; then |
| export RUNFILES_DIR="$0.runfiles" |
| fi |
| fi |
| if [[ -f "${RUNFILES_DIR:-/dev/null}/bazel_tools/tools/bash/runfiles/runfiles.bash" ]]; then |
| source "${RUNFILES_DIR}/bazel_tools/tools/bash/runfiles/runfiles.bash" |
| elif [[ -f "${RUNFILES_MANIFEST_FILE:-/dev/null}" ]]; then |
| source "$(grep -m1 "^bazel_tools/tools/bash/runfiles/runfiles.bash " \ |
| "$RUNFILES_MANIFEST_FILE" | cut -d ' ' -f 2-)" |
| else |
| echo >&2 "ERROR: cannot find @bazel_tools//tools/bash/runfiles:runfiles.bash" |
| exit 1 |
| fi |
| # --- end runfiles.bash initialization --- |
| |
| source "$(rlocation "io_bazel/src/test/shell/integration_test_setup.sh")" \ |
| || { echo "integration_test_setup.sh not found!" >&2; exit 1; } |
| |
| #### SETUP ############################################################# |
| |
| function unicode_filenames_test_setup() { |
| touch WORKSPACE |
| mkdir -p pkg/srcs |
| |
| cat >pkg/BUILD <<'EOF' |
| load(":rules.bzl", "ls_srcs") |
| ls_srcs( |
| name = "ls_srcs", |
| srcs = glob(["srcs/**/*"]), |
| ) |
| filegroup(name = "filegroup", srcs = glob(["srcs/**/*"])) |
| EOF |
| |
| cat >pkg/rules.bzl <<'EOF' |
| def _ls_srcs(ctx): |
| out = ctx.actions.declare_file(ctx.attr.name) |
| ctx.actions.run_shell( |
| inputs = ctx.files.srcs, |
| outputs = [out], |
| command = 'find -L . > "$1"', |
| arguments = [out.path], |
| ) |
| return DefaultInfo( |
| files = depset(direct = [out]), |
| ) |
| |
| ls_srcs = rule( |
| _ls_srcs, |
| attrs = {"srcs": attr.label_list(allow_files = True)}, |
| ) |
| EOF |
| } |
| |
| function has_iso_8859_1_locale() { |
| charmap="$(LC_ALL=en_US.ISO-8859-1 locale charmap 2>/dev/null)" |
| [[ "${charmap}" == "ISO-8859-1" ]] |
| } |
| |
| function test_utf8_source_artifact() { |
| unicode_filenames_test_setup |
| |
| touch 'pkg/srcs/regular file.txt' |
| |
| mkdir pkg/srcs/subdir |
| touch 'pkg/srcs/subdir/file.txt' |
| |
| # >>> u"pkg/srcs/ünïcödë fïlë.txt".encode("utf8") |
| # 'pkg/srcs/\xc3\xbcn\xc3\xafc\xc3\xb6d\xc3\xab f\xc3\xafl\xc3\xab.txt' |
| touch "$(printf '%b' 'pkg/srcs/\xc3\xbcn\xc3\xafc\xc3\xb6d\xc3\xab f\xc3\xafl\xc3\xab.txt')" |
| |
| bazel build //pkg:ls_srcs >$TEST_log 2>&1 || fail "Should build" |
| |
| assert_contains "pkg/srcs/regular file.txt" bazel-bin/pkg/ls_srcs |
| assert_contains "pkg/srcs/subdir/file.txt" bazel-bin/pkg/ls_srcs |
| assert_contains "pkg/srcs/ünïcödë fïlë.txt" bazel-bin/pkg/ls_srcs |
| } |
| |
| function test_traditional_encoding_source_artifact() { |
| # Windows and macOS require filesystem paths to be valid Unicode. Linux and |
| # the traditional BSDs typically don't, so their paths can contain arbitrary |
| # non-NUL bytes. |
| if (is_windows || is_darwin); then |
| echo "Skipping test." && return |
| fi |
| |
| # Bazel relies on the JVM for filename encoding, and can only support |
| # traditional encodings if it can roundtrip through ISO-8859-1. |
| if ! has_iso_8859_1_locale; then |
| echo "Skipping test (no ISO-8859-1 locale)." |
| echo "Available locales (need en_US.ISO-8859-1):" |
| locale -a |
| return |
| fi |
| |
| unicode_filenames_test_setup |
| |
| # >>> u"pkg/srcs/TRADITIONAL ünïcödë fïlë.txt".encode("iso-8859-1") |
| # 'pkg/srcs/TRADITIONAL \xfcn\xefc\xf6d\xeb f\xefl\xeb.txt' |
| touch "$(printf '%b' 'pkg/srcs/TRADITIONAL \xfcn\xefc\xf6d\xeb f\xefl\xeb.txt')" |
| |
| bazel build //pkg:ls_srcs >$TEST_log 2>&1 || fail "Should build" |
| assert_contains "pkg/srcs/TRADITIONAL " bazel-bin/pkg/ls_srcs |
| } |
| |
| function test_utf8_source_artifact_in_bep() { |
| unicode_filenames_test_setup |
| |
| touch 'pkg/srcs/regular file.txt' |
| |
| mkdir pkg/srcs/subdir |
| touch 'pkg/srcs/subdir/file.txt' |
| |
| # >>> u"pkg/srcs/ünïcödë fïlë.txt".encode("utf8") |
| # 'pkg/srcs/\xc3\xbcn\xc3\xafc\xc3\xb6d\xc3\xab f\xc3\xafl\xc3\xab.txt' |
| touch "$(printf '%b' 'pkg/srcs/\xc3\xbcn\xc3\xafc\xc3\xb6d\xc3\xab f\xc3\xafl\xc3\xab.txt')" |
| |
| bazel build --build_event_json_file="$TEST_log" \ |
| //pkg:filegroup 2>&1 || fail "Should build" |
| |
| expect_log '"name":"pkg/srcs/regular file.txt"' |
| expect_log '"name":"pkg/srcs/subdir/file.txt"' |
| expect_log '"name":"pkg/srcs/ünïcödë fïlë.txt"' |
| } |
| |
| function test_utf8_filename_in_java_test() { |
| add_rules_java "MODULE.bazel" |
| touch WORKSPACE |
| mkdir pkg |
| |
| cat >pkg/BUILD <<'EOF' |
| load("@rules_java//java:java_test.bzl", "java_test") |
| |
| java_test( |
| name = "Test", |
| srcs = ["Test.java"], |
| main_class = "Test", |
| use_testrunner = False, |
| ) |
| EOF |
| |
| cat >pkg/Test.java <<'EOF' |
| import java.nio.file.Files; |
| import java.io.IOException; |
| |
| class Test { |
| public static void main(String[] args) throws IOException { |
| Files.createTempFile("æøå", null); |
| } |
| } |
| EOF |
| |
| bazel test //pkg:Test --test_output=errors 2>$TEST_log || fail "Test should pass" |
| } |
| |
| function test_cc_dependency_with_utf8_filename() { |
| # TODO: Find a way to get cl.exe to output Unicode when not running in a |
| # console or migrate to /sourceDependencies. |
| if is_windows; then |
| echo "Skipping test on Windows." && return |
| fi |
| |
| local unicode="äöüÄÖÜß🌱" |
| |
| setup_module_dot_bazel |
| |
| mkdir pkg |
| cat >pkg/BUILD <<EOF |
| cc_library( |
| name = "lib", |
| hdrs = ["${unicode}.h"], |
| ) |
| cc_binary( |
| name = "bin", |
| srcs = ["bin.cc"], |
| deps = [":lib"], |
| ) |
| EOF |
| cat >"pkg/${unicode}.h" <<EOF |
| #define MY_STRING "original" |
| EOF |
| # MSVC requires UTF-8 source files to start with a BOM. |
| printf '\xEF\xBB\xBF' > pkg/bin.cc |
| cat >>pkg/bin.cc <<EOF |
| #include "${unicode}.h" |
| |
| #include <iostream> |
| |
| int main() { |
| std::cout << MY_STRING << std::endl; |
| return 0; |
| } |
| EOF |
| bazel run //pkg:bin >$TEST_log 2>&1 || fail "Should build" |
| expect_log "original" |
| |
| # Change the header file and rebuild |
| cat >"pkg/${unicode}.h" <<EOF |
| #define MY_STRING "changed" |
| EOF |
| bazel run //pkg:bin >$TEST_log 2>&1 || fail "Should build" |
| expect_log "changed" |
| } |
| |
| function test_unicode_in_path() { |
| mkdir -p pkg |
| cat >pkg/BUILD <<'EOF' |
| load(":defs.bzl", "my_rule") |
| |
| my_rule(name = "my_rule") |
| EOF |
| cat >pkg/defs.bzl <<'EOF' |
| def _my_rule_impl(ctx): |
| out = ctx.actions.declare_file(ctx.attr.name) |
| ctx.actions.run_shell( |
| outputs = [out], |
| command = "touch $1", |
| arguments = [out.path], |
| use_default_shell_env = True, |
| ) |
| return DefaultInfo( |
| files = depset(direct = [out]), |
| ) |
| |
| my_rule = rule(_my_rule_impl) |
| EOF |
| |
| # MSYS2 uses : as a path separator even on Windows. |
| export PATH="$PATH:äöüÄÖÜß🌱" |
| # Restart the server since PATH is taken from the server environment on Windows. |
| bazel shutdown > /dev/null 2>&1 || fail "Should shutdown" |
| |
| bazel build //pkg:my_rule >$TEST_log 2>&1 || fail "Should build" |
| } |
| |
| run_suite "Tests for handling of Unicode filenames" |