blob: 8f0e37c206527b43f48ea9dd1f90ff754d75d1c2 [file] [log] [blame]
# Copyright 2021 Google LLC
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# https://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
"""Utilities and helper rules for Java fuzz tests."""
load("//fuzzing/private:binary.bzl", "fuzzing_binary_transition")
load("//fuzzing/private:util.bzl", "runfile_path")
# A Starlark reimplementation of a part of Bazel's JavaCommon#determinePrimaryClass.
def determine_primary_class(srcs, name):
main_source_path = _get_java_main_source_path(srcs, name)
return _get_java_full_classname(main_source_path)
# A Starlark reimplementation of a part of Bazel's JavaCommon#determinePrimaryClass.
def _get_java_main_source_path(srcs, name):
main_source_basename = name + ".java"
for source_file in srcs:
if source_file[source_file.rfind("/") + 1:] == main_source_basename:
main_source_basename = source_file
break
return native.package_name() + "/" + main_source_basename[:-len(".java")]
# A Starlark reimplementation of Bazel's JavaUtil#getJavaFullClassname.
def _get_java_full_classname(main_source_path):
java_path = _get_java_path(main_source_path)
if java_path != None:
return java_path.replace("/", ".")
return None
# A Starlark reimplementation of Bazel's JavaUtil#getJavaPath.
def _get_java_path(main_source_path):
path_segments = main_source_path.split("/")
index = _java_segment_index(path_segments)
if index >= 0:
return "/".join(path_segments[index + 1:])
return None
_KNOWN_SOURCE_ROOTS = ["java", "javatests", "src", "testsrc"]
# A Starlark reimplementation of Bazel's JavaUtil#javaSegmentIndex.
def _java_segment_index(path_segments):
root_index = -1
for pos, segment in enumerate(path_segments):
if segment in _KNOWN_SOURCE_ROOTS:
root_index = pos
break
if root_index == -1:
return root_index
is_src = "src" == path_segments[root_index]
check_maven_index = root_index if is_src else -1
max = len(path_segments) - 1
if root_index == 0 or is_src:
for i in range(root_index + 1, max):
segment = path_segments[i]
if "src" == segment or (is_src and ("javatests" == segment or "java" == segment)):
next = path_segments[i + 1]
if ("com" == next or "org" == next or "net" == next):
root_index = i
elif "src" == segment:
check_maven_index = i
break
if check_maven_index >= 0 and check_maven_index + 2 < len(path_segments):
next = path_segments[check_maven_index + 1]
if "main" == next or "test" == next:
next = path_segments[check_maven_index + 2]
if "java" == next or "resources" == next:
root_index = check_maven_index + 2
return root_index
def _jazzer_fuzz_binary_script(ctx, native_libs, driver):
script = ctx.actions.declare_file(ctx.label.name)
# The script is split into two parts: The first is emitted as-is, the second
# is a template that is passed to format(). Without the split, curly braces
# in the first part would need to be escaped.
script_literal_part = """#!/bin/bash
# LLVMFuzzerTestOneInput - OSS-Fuzz needs this string literal to appear
# somewhere in the script so it is recognized as a fuzz target.
# Bazel-provided code snippet that should be copy-pasted as is at use sites.
# Taken from @bazel_tools//tools/bash/runfiles.
# --- begin runfiles.bash initialization v2 ---
# Copy-pasted from the Bazel Bash runfiles library v2.
set -uo pipefail; f=bazel_tools/tools/bash/runfiles/runfiles.bash
source "${RUNFILES_DIR:-/dev/null}/$f" 2>/dev/null || \
source "$(grep -sm1 "^$f " "${RUNFILES_MANIFEST_FILE:-/dev/null}" | cut -f2- -d' ')" 2>/dev/null || \
source "$0.runfiles/$f" 2>/dev/null || \
source "$(grep -sm1 "^$f " "$0.runfiles_manifest" | cut -f2- -d' ')" 2>/dev/null || \
source "$(grep -sm1 "^$f " "$0.exe.runfiles_manifest" | cut -f2- -d' ')" 2>/dev/null || \
{ echo>&2 "ERROR: cannot find $f"; exit 1; }; f=; set -e
# --- end runfiles.bash initialization v2 ---
# Export the env variables required for subprocesses to find their runfiles.
runfiles_export_envvars
# Determine the path to load libjvm.so from, either relative to the location of
# the java binary or to $JAVA_HOME, if set. On OSS-Fuzz, the path is provided in
# JVM_LD_LIBRARY_PATH.
JAVA_BIN=$(readlink -f "$(which java)")
JAVA_HOME=${JAVA_HOME:-${JAVA_BIN%/bin/java}}
# The location of libjvm.so relative to the JDK differs between JDK <= 8 and 9+.
JVM_LD_LIBRARY_PATH=${JVM_LD_LIBRARY_PATH:-"$JAVA_HOME/lib/server:$JAVA_HOME/lib/amd64/server"}
export LD_LIBRARY_PATH=${LD_LIBRARY_PATH:+$LD_LIBRARY_PATH:}$JVM_LD_LIBRARY_PATH
"""
script_format_part = """
source "$(rlocation {sanitizer_options})"
exec "$(rlocation {driver})" \
--agent_path="$(rlocation {agent})" \
--cp="$(rlocation {deploy_jar})" \
--jvm_args="-Djava.library.path={native_dirs}" \
"$@"
"""
native_dirs = [
"$(dirname \"$(rlocation %s)\")" % runfile_path(ctx, lib)
for lib in native_libs
]
script_content = script_literal_part + script_format_part.format(
agent = runfile_path(ctx, ctx.file.agent),
deploy_jar = runfile_path(ctx, ctx.file.target_deploy_jar),
driver = runfile_path(ctx, driver),
native_dirs = ":".join(native_dirs),
sanitizer_options = runfile_path(ctx, ctx.file.sanitizer_options),
)
ctx.actions.write(script, script_content, is_executable = True)
return script
def _is_required_runfile(runfile, runtime_classpath = []):
# The jars in the runtime classpath are all merged into the deploy jar and
# thus don't need to be included in the runfiles for the fuzzer.
if runfile in runtime_classpath:
return False
# A java_binary target has a dependency on the local JDK. Since the Jazzer
# driver launches its own JVM, these runfiles are not needed.
if runfile.owner != None and runfile.owner.workspace_name == "local_jdk":
return False
return True
def _filter_target_runfiles(ctx, target):
compilation_info = target[JavaInfo].compilation_info
runtime_classpath = compilation_info.runtime_classpath.to_list()
all_runfiles = target[DefaultInfo].default_runfiles
return ctx.runfiles([
runfile
for runfile in all_runfiles.files.to_list()
if _is_required_runfile(runfile, runtime_classpath)
])
def _is_potential_native_dependency(file):
if file.extension not in ["dll", "dylib", "so"]:
return False
if not _is_required_runfile(file):
return False
return True
def _native_library_files(ctx):
target_info = ctx.attr.target[0][DefaultInfo]
target_java_info = ctx.attr.target[0][JavaInfo]
# Perform feature detection for
# https://github.com/bazelbuild/bazel/commit/381a519dfc082d4c62096c4ce77ead1c2e0410d8.
if hasattr(target_java_info, "transitive_native_libraries"):
# The current version of Bazel contains the commit, which means that
# the JavaInfo of the target includes information about all transitive
# native library dependencies.
native_libraries_list = target_java_info.transitive_native_libraries.to_list()
return [lib.dynamic_library for lib in native_libraries_list]
else:
# If precise information about transitive native libraries is not
# available, fall back to an overapproximation that includes all
# runfiles with file extensions indicating a shared library.
runfiles_list = target_info.default_runfiles.files.to_list()
return [
runfile
for runfile in runfiles_list
if _is_potential_native_dependency(runfile)
]
def _jazzer_fuzz_binary_impl(ctx):
native_libs = _native_library_files(ctx)
# Use a driver with a linked in sanitizer if the fuzz test has native
# dependencies.
if native_libs:
driver = ctx.executable.driver_with_native
driver_info = ctx.attr.driver_with_native[DefaultInfo]
else:
driver = ctx.executable.driver_java_only
driver_info = ctx.attr.driver_java_only[DefaultInfo]
# The DefaultInfo's default_runfiles of an executable file target do not
# contain the executable itself, which thus needs to be added explicitly.
driver_runfiles = driver_info.default_runfiles
driver_executable = driver_info.files_to_run.executable
driver_runfiles = driver_runfiles.merge(ctx.runfiles([driver_executable]))
runfiles = ctx.runfiles()
runfiles = runfiles.merge(driver_runfiles)
# Used by the wrapper script created in _jazzer_fuzz_binary_script.
runfiles = runfiles.merge(ctx.attr._bash_runfiles_library[DefaultInfo].default_runfiles)
# While the Jazzer agent is already included in the runfiles of
# @jazzer//driver:jazzer_driver, it has to be added here explicitly for the
# case where both are provided by OSS-Fuzz.
runfiles = runfiles.merge(ctx.runfiles([ctx.file.agent]))
# The Java fuzz target packaged as a jar including all Java dependencies.
# This does not include e.g. data runfiles and shared libraries.
runfiles = runfiles.merge(ctx.runfiles([ctx.file.target_deploy_jar]))
# The full runfiles of the Java fuzz target, but with the files of the local
# JDK and all jar files excluded.
runfiles = runfiles.merge(_filter_target_runfiles(ctx, ctx.attr.target[0]))
runfiles = runfiles.merge(ctx.runfiles([ctx.file.sanitizer_options]))
script = _jazzer_fuzz_binary_script(ctx, native_libs, driver)
return [DefaultInfo(executable = script, runfiles = runfiles)]
jazzer_fuzz_binary = rule(
implementation = _jazzer_fuzz_binary_impl,
doc = """
Rule that creates a binary that invokes Jazzer on the specified target.
""",
attrs = {
"agent": attr.label(
doc = "The Jazzer agent used to instrument the target.",
allow_single_file = [".jar"],
),
"_bash_runfiles_library": attr.label(
default = "@bazel_tools//tools/bash/runfiles",
),
"driver_java_only": attr.label(
doc = "The Jazzer driver binary used to fuzz a Java-only target.",
allow_single_file = True,
executable = True,
# Build in target configuration rather than host because the driver
# uses transitions to set the correct C++ standard for its
# dependencies.
cfg = "target",
),
"driver_with_native": attr.label(
doc = "The Jazzer driver binary used to fuzz a Java target with " +
"native dependencies.",
allow_single_file = True,
executable = True,
# Build in target configuration rather than host because the driver
# uses transitions to set the correct C++ standard for its
# dependencies.
cfg = "target",
),
"sanitizer_options": attr.label(
doc = "A shell script that can export environment variables with " +
"sanitizer options.",
allow_single_file = [".sh"],
),
"target": attr.label(
doc = "The fuzz target.",
mandatory = True,
providers = [JavaInfo],
cfg = fuzzing_binary_transition,
),
"target_deploy_jar": attr.label(
doc = "The deploy jar of the fuzz target.",
allow_single_file = [".jar"],
mandatory = True,
),
"_allowlist_function_transition": attr.label(
default = "@bazel_tools//tools/allowlists/function_transition_allowlist",
),
},
executable = True,
)