blob: 569a3e223a49c3a1795cefe1b69f9d77cd34a89c [file] [log] [blame]
// Copyright 2015 The Bazel Authors. All rights reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
//
// classfile.cc -- classfile parsing and stripping.
//
// TODO(adonovan) don't pass pointers by reference; this is not
// compatible with Google C++ style.
// See README.txt for details.
//
// For definition of JVM class file format, see:
// Java SE 8 Edition:
// http://docs.oracle.com/javase/specs/jvms/se8/html/jvms-4.html#jvms-4
#define __STDC_FORMAT_MACROS 1
#define __STDC_LIMIT_MACROS 1
#include <inttypes.h> // for PRIx32
#include <stddef.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <set>
#include <sstream>
#include <string>
#include <unordered_set>
#include <vector>
#include "third_party/ijar/common.h"
namespace {
// Converts a value to string.
// Workaround for mingw where std::to_string is not implemented.
// See https://gcc.gnu.org/bugzilla/show_bug.cgi?id=52015.
template <typename T>
std::string ToString(const T& value) {
std::ostringstream oss;
oss << value;
return oss.str();
}
} // namespace
namespace devtools_ijar {
// See Table 4.4 in JVM 17 Spec.
enum CONSTANT {
CONSTANT_Class = 7,
CONSTANT_FieldRef = 9,
CONSTANT_Methodref = 10,
CONSTANT_Interfacemethodref = 11,
CONSTANT_String = 8,
CONSTANT_Integer = 3,
CONSTANT_Float = 4,
CONSTANT_Long = 5,
CONSTANT_Double = 6,
CONSTANT_NameAndType = 12,
CONSTANT_Utf8 = 1,
CONSTANT_MethodHandle = 15,
CONSTANT_MethodType = 16,
CONSTANT_Dynamic = 17,
CONSTANT_InvokeDynamic = 18
};
// See Tables 4.1, 4.4, 4.5 in JVM Spec.
enum ACCESS {
ACC_PUBLIC = 0x0001,
ACC_PRIVATE = 0x0002,
ACC_PROTECTED = 0x0004,
ACC_STATIC = 0x0008,
ACC_FINAL = 0x0010,
ACC_SYNCHRONIZED = 0x0020,
ACC_BRIDGE = 0x0040,
ACC_VOLATILE = 0x0040,
ACC_TRANSIENT = 0x0080,
ACC_INTERFACE = 0x0200,
ACC_ABSTRACT = 0x0400,
ACC_SYNTHETIC = 0x1000
};
// See Table 4.7.20-A in Java 8 JVM Spec.
enum TARGET_TYPE {
// Targets for type parameter declarations (ElementType.TYPE_PARAMETER):
CLASS_TYPE_PARAMETER = 0x00,
METHOD_TYPE_PARAMETER = 0x01,
// Targets for type uses that may be externally visible in classes and members
// (ElementType.TYPE_USE):
CLASS_EXTENDS = 0x10,
CLASS_TYPE_PARAMETER_BOUND = 0x11,
METHOD_TYPE_PARAMETER_BOUND = 0x12,
FIELD = 0x13,
METHOD_RETURN = 0x14,
METHOD_RECEIVER = 0x15,
METHOD_FORMAL_PARAMETER = 0x16,
THROWS = 0x17,
// TARGET_TYPE >= 0x40 is reserved for type uses that occur only within code
// blocks. Ijar doesn't need to know about these.
};
struct Constant;
// TODO(adonovan) these globals are unfortunate
static std::vector<Constant *> const_pool_in; // input constant pool
static std::vector<Constant *> const_pool_out; // output constant_pool
static std::set<std::string> used_class_names;
static Constant *class_name;
static std::unordered_set<std::string> unknown_attributes;
// Returns the Constant object, given an index into the input constant pool.
// Note: constant(0) == NULL; this invariant is exploited by the
// InnerClassesAttribute, inter alia.
inline Constant *constant(int idx) {
if (idx < 0 || (unsigned)idx >= const_pool_in.size()) {
fprintf(stderr, "Illegal constant pool index: %d\n", idx);
abort();
}
return const_pool_in[idx];
}
/**********************************************************************
* *
* Constants *
* *
**********************************************************************/
// See sec.4.4 of JVM spec.
struct Constant {
Constant(u1 tag) :
slot_(0),
tag_(tag) {}
virtual ~Constant() {}
// For UTF-8 string constants, returns the encoded string.
// Otherwise, returns an undefined string value suitable for debugging.
virtual std::string Display() = 0;
virtual void Write(u1 *&p) = 0;
// Called by slot() when a constant has been identified as required
// in the output classfile's constant pool. This is a hook allowing
// constants to register their dependency on other constants, by
// calling slot() on them in turn.
virtual void Keep() {}
bool Kept() {
return slot_ != 0;
}
// Returns the index of this constant in the output class's constant
// pool, assigning a slot if not already done.
u2 slot() {
if (slot_ == 0) {
Keep();
slot_ = const_pool_out.size(); // BugBot's "narrowing" warning
// is bogus. The number of
// output constants can't exceed
// the number of input constants.
if (slot_ == 0) {
fprintf(stderr, "Constant::slot() called before output phase.\n");
abort();
}
const_pool_out.push_back(this);
if (tag_ == CONSTANT_Long || tag_ == CONSTANT_Double) {
const_pool_out.push_back(NULL);
}
}
return slot_;
}
u2 slot_; // zero => "this constant is unreachable garbage"
u1 tag_;
};
// Extracts class names from a signature and puts them into the global
// variable used_class_names.
//
// desc: the descriptor class names should be extracted from.
// p: the position where the extraction should tart.
void ExtractClassNames(const std::string& desc, size_t* p);
// See sec.4.4.1 of JVM spec.
struct Constant_Class : Constant
{
Constant_Class(u2 name_index) :
Constant(CONSTANT_Class),
name_index_(name_index) {}
void Write(u1 *&p) {
put_u1(p, tag_);
put_u2be(p, constant(name_index_)->slot());
}
std::string Display() {
return constant(name_index_)->Display();
}
void Keep() { constant(name_index_)->slot(); }
u2 name_index_;
};
// See sec.4.4.2 of JVM spec.
struct Constant_FMIref : Constant
{
Constant_FMIref(u1 tag,
u2 class_index,
u2 name_type_index) :
Constant(tag),
class_index_(class_index),
name_type_index_(name_type_index) {}
void Write(u1 *&p) {
put_u1(p, tag_);
put_u2be(p, constant(class_index_)->slot());
put_u2be(p, constant(name_type_index_)->slot());
}
std::string Display() {
return constant(class_index_)->Display() + "::" +
constant(name_type_index_)->Display();
}
void Keep() {
constant(class_index_)->slot();
constant(name_type_index_)->slot();
}
u2 class_index_;
u2 name_type_index_;
};
// See sec.4.4.3 of JVM spec.
struct Constant_String : Constant
{
Constant_String(u2 string_index) :
Constant(CONSTANT_String),
string_index_(string_index) {}
void Write(u1 *&p) {
put_u1(p, tag_);
put_u2be(p, constant(string_index_)->slot());
}
std::string Display() {
return "\"" + constant(string_index_)->Display() + "\"";
}
void Keep() { constant(string_index_)->slot(); }
u2 string_index_;
};
// See sec.4.4.4 of JVM spec.
struct Constant_IntegerOrFloat : Constant
{
Constant_IntegerOrFloat(u1 tag, u4 bytes) :
Constant(tag),
bytes_(bytes) {}
void Write(u1 *&p) {
put_u1(p, tag_);
put_u4be(p, bytes_);
}
std::string Display() { return "int/float"; }
u4 bytes_;
};
// See sec.4.4.5 of JVM spec.
struct Constant_LongOrDouble : Constant_IntegerOrFloat
{
Constant_LongOrDouble(u1 tag, u4 high_bytes, u4 low_bytes) :
Constant_IntegerOrFloat(tag, high_bytes),
low_bytes_(low_bytes) {}
void Write(u1 *&p) {
put_u1(p, tag_);
put_u4be(p, bytes_);
put_u4be(p, low_bytes_);
}
std::string Display() { return "long/double"; }
u4 low_bytes_;
};
// See sec.4.4.6 of JVM spec.
struct Constant_NameAndType : Constant
{
Constant_NameAndType(u2 name_index, u2 descr_index) :
Constant(CONSTANT_NameAndType),
name_index_(name_index),
descr_index_(descr_index) {}
void Write(u1 *&p) {
put_u1(p, tag_);
put_u2be(p, constant(name_index_)->slot());
put_u2be(p, constant(descr_index_)->slot());
}
std::string Display() {
return constant(name_index_)->Display() + "::" +
constant(descr_index_)->Display();
}
void Keep() {
constant(name_index_)->slot();
constant(descr_index_)->slot();
}
u2 name_index_;
u2 descr_index_;
};
// See sec.4.4.7 of JVM spec.
struct Constant_Utf8 : Constant
{
Constant_Utf8(u4 length, const u1 *utf8) :
Constant(CONSTANT_Utf8),
length_(length),
utf8_(utf8) {}
void Write(u1 *&p) {
put_u1(p, tag_);
put_u2be(p, length_);
put_n(p, utf8_, length_);
}
std::string Display() {
return std::string((const char*) utf8_, length_);
}
u4 length_;
const u1 *utf8_;
};
// See sec.4.4.8 of JVM spec.
struct Constant_MethodHandle : Constant
{
Constant_MethodHandle(u1 reference_kind, u2 reference_index) :
Constant(CONSTANT_MethodHandle),
reference_kind_(reference_kind),
reference_index_(reference_index) {}
void Write(u1 *&p) {
put_u1(p, tag_);
put_u1(p, reference_kind_);
put_u2be(p, reference_index_);
}
std::string Display() {
return "Constant_MethodHandle::" + ToString(reference_kind_) + "::"
+ constant(reference_index_)->Display();
}
u1 reference_kind_;
u2 reference_index_;
};
// See sec.4.4.9 of JVM spec.
struct Constant_MethodType : Constant
{
Constant_MethodType(u2 descriptor_index) :
Constant(CONSTANT_MethodType),
descriptor_index_(descriptor_index) {}
void Write(u1 *&p) {
put_u1(p, tag_);
put_u2be(p, descriptor_index_);
}
std::string Display() {
return "Constant_MethodType::" + constant(descriptor_index_)->Display();
}
u2 descriptor_index_;
};
// See sec.4.4.10 of JVM spec.
struct Constant_Dynamic : Constant {
Constant_Dynamic(u2 bootstrap_method_attr_index, u2 name_and_type_index)
: Constant(CONSTANT_Dynamic),
bootstrap_method_attr_index_(bootstrap_method_attr_index),
name_and_type_index_(name_and_type_index) {}
void Write(u1 *&p) {
put_u1(p, tag_);
put_u2be(p, bootstrap_method_attr_index_);
put_u2be(p, name_and_type_index_);
}
std::string Display() {
return "Constant_Dynamic::" + ToString(bootstrap_method_attr_index_) +
"::" + constant(name_and_type_index_)->Display();
}
u2 bootstrap_method_attr_index_;
u2 name_and_type_index_;
};
struct Constant_InvokeDynamic : Constant {
Constant_InvokeDynamic(u2 bootstrap_method_attr_index, u2 name_and_type_index)
: Constant(CONSTANT_InvokeDynamic),
bootstrap_method_attr_index_(bootstrap_method_attr_index),
name_and_type_index_(name_and_type_index) {}
void Write(u1 *&p) {
put_u1(p, tag_);
put_u2be(p, bootstrap_method_attr_index_);
put_u2be(p, name_and_type_index_);
}
std::string Display() {
return "Constant_InvokeDynamic::"
+ ToString(bootstrap_method_attr_index_) + "::"
+ constant(name_and_type_index_)->Display();
}
u2 bootstrap_method_attr_index_;
u2 name_and_type_index_;
};
/**********************************************************************
* *
* Attributes *
* *
**********************************************************************/
// See sec.4.7 of JVM spec.
struct Attribute {
virtual ~Attribute() {}
virtual void Write(u1 *&p) = 0;
virtual void ExtractClassNames() {}
virtual bool KeepForCompile() const { return false; }
void WriteProlog(u1 *&p, u2 length) {
put_u2be(p, attribute_name_->slot());
put_u4be(p, length);
}
Constant *attribute_name_;
};
struct HasAttrs {
std::vector<Attribute*> attributes;
void WriteAttrs(u1 *&p);
void ReadAttrs(const u1 *&p);
virtual ~HasAttrs() {
for (const auto *attribute : attributes) {
delete attribute;
}
}
void ExtractClassNames() {
for (auto *attribute : attributes) {
attribute->ExtractClassNames();
}
}
};
// See sec.4.7.5 of JVM spec.
struct ExceptionsAttribute : Attribute {
static ExceptionsAttribute* Read(const u1 *&p, Constant *attribute_name) {
ExceptionsAttribute *attr = new ExceptionsAttribute;
attr->attribute_name_ = attribute_name;
u2 number_of_exceptions = get_u2be(p);
for (int ii = 0; ii < number_of_exceptions; ++ii) {
attr->exceptions_.push_back(constant(get_u2be(p)));
}
return attr;
}
void Write(u1 *&p) {
WriteProlog(p, exceptions_.size() * 2 + 2);
put_u2be(p, exceptions_.size());
for (size_t ii = 0; ii < exceptions_.size(); ++ii) {
put_u2be(p, exceptions_[ii]->slot());
}
}
std::vector<Constant*> exceptions_;
};
// See sec.4.7.6 of JVM spec.
struct InnerClassesAttribute : Attribute {
struct Entry {
Constant *inner_class_info;
Constant *outer_class_info;
Constant *inner_name;
u2 inner_class_access_flags;
};
virtual ~InnerClassesAttribute() {
for (size_t i = 0; i < entries_.size(); i++) {
delete entries_[i];
}
}
static InnerClassesAttribute* Read(const u1 *&p, Constant *attribute_name) {
InnerClassesAttribute *attr = new InnerClassesAttribute;
attr->attribute_name_ = attribute_name;
u2 number_of_classes = get_u2be(p);
for (int ii = 0; ii < number_of_classes; ++ii) {
Entry *entry = new Entry;
entry->inner_class_info = constant(get_u2be(p));
entry->outer_class_info = constant(get_u2be(p));
entry->inner_name = constant(get_u2be(p));
entry->inner_class_access_flags = get_u2be(p);
attr->entries_.push_back(entry);
}
return attr;
}
void Write(u1 *&p) {
std::set<int> kept_entries;
// We keep an entry if the constant referring to the inner class is already
// kept. Then we mark its outer class and its class name as kept, too, then
// iterate until a fixed point is reached.
int entry_count;
do {
entry_count = kept_entries.size();
for (int i_entry = 0; i_entry < static_cast<int>(entries_.size());
++i_entry) {
Entry* entry = entries_[i_entry];
if (entry->inner_class_info->Kept() ||
used_class_names.find(entry->inner_class_info->Display()) !=
used_class_names.end() ||
entry->outer_class_info == class_name) {
if (entry->inner_name == NULL) {
// JVMS 4.7.6: inner_name_index is zero iff the class is anonymous
continue;
}
kept_entries.insert(i_entry);
// JVMS 4.7.6: outer_class_info_index is zero for top-level classes
if (entry->outer_class_info != NULL) {
entry->outer_class_info->slot();
}
entry->inner_name->slot();
}
}
} while (entry_count != static_cast<int>(kept_entries.size()));
if (kept_entries.empty()) {
return;
}
WriteProlog(p, 2 + kept_entries.size() * 8);
put_u2be(p, kept_entries.size());
for (std::set<int>::iterator it = kept_entries.begin();
it != kept_entries.end();
++it) {
Entry *entry = entries_[*it];
put_u2be(p, entry->inner_class_info == NULL
? 0
: entry->inner_class_info->slot());
put_u2be(p, entry->outer_class_info == NULL
? 0
: entry->outer_class_info->slot());
put_u2be(p, entry->inner_name == NULL
? 0
: entry->inner_name->slot());
put_u2be(p, entry->inner_class_access_flags);
}
}
std::vector<Entry*> entries_;
};
// See sec.4.7.7 of JVM spec.
// We preserve EnclosingMethod attributes to be able to identify local and
// anonymous classes. These classes will be stripped of most content, as they
// represent implementation details that shoudn't leak into the ijars. Omitting
// EnclosingMethod attributes can lead to type-checking failures in the presence
// of generics (see b/9070939).
struct EnclosingMethodAttribute : Attribute {
static EnclosingMethodAttribute* Read(const u1 *&p,
Constant *attribute_name) {
EnclosingMethodAttribute *attr = new EnclosingMethodAttribute;
attr->attribute_name_ = attribute_name;
attr->class_ = constant(get_u2be(p));
attr->method_ = constant(get_u2be(p));
return attr;
}
void Write(u1 *&p) {
WriteProlog(p, 4);
put_u2be(p, class_->slot());
put_u2be(p, method_ == NULL ? 0 : method_->slot());
}
Constant *class_;
Constant *method_;
};
// See sec.4.7.16.1 of JVM spec.
// Used by AnnotationDefault and other attributes.
struct ElementValue {
virtual ~ElementValue() {}
virtual void Write(u1 *&p) = 0;
virtual void ExtractClassNames() {}
static ElementValue* Read(const u1 *&p);
u1 tag_;
u4 length_;
};
struct BaseTypeElementValue : ElementValue {
void Write(u1 *&p) {
put_u1(p, tag_);
put_u2be(p, const_value_->slot());
}
static BaseTypeElementValue *Read(const u1 *&p) {
BaseTypeElementValue *value = new BaseTypeElementValue;
value->const_value_ = constant(get_u2be(p));
return value;
}
Constant *const_value_;
};
struct EnumTypeElementValue : ElementValue {
void Write(u1 *&p) {
put_u1(p, tag_);
put_u2be(p, type_name_->slot());
put_u2be(p, const_name_->slot());
}
static EnumTypeElementValue *Read(const u1 *&p) {
EnumTypeElementValue *value = new EnumTypeElementValue;
value->type_name_ = constant(get_u2be(p));
value->const_name_ = constant(get_u2be(p));
return value;
}
Constant *type_name_;
Constant *const_name_;
};
struct ClassTypeElementValue : ElementValue {
void Write(u1 *&p) {
put_u1(p, tag_);
put_u2be(p, class_info_->slot());
}
virtual void ExtractClassNames() {
size_t idx = 0;
devtools_ijar::ExtractClassNames(class_info_->Display(), &idx);
}
static ClassTypeElementValue *Read(const u1 *&p) {
ClassTypeElementValue *value = new ClassTypeElementValue;
value->class_info_ = constant(get_u2be(p));
return value;
}
Constant *class_info_;
};
struct ArrayTypeElementValue : ElementValue {
virtual ~ArrayTypeElementValue() {
for (const auto *value : values_) {
delete value;
}
}
virtual void ExtractClassNames() {
for (auto *value : values_) {
value->ExtractClassNames();
}
}
void Write(u1 *&p) {
put_u1(p, tag_);
put_u2be(p, values_.size());
for (auto *value : values_) {
value->Write(p);
}
}
static ArrayTypeElementValue *Read(const u1 *&p) {
ArrayTypeElementValue *value = new ArrayTypeElementValue;
u2 num_values = get_u2be(p);
for (int ii = 0; ii < num_values; ++ii) {
value->values_.push_back(ElementValue::Read(p));
}
return value;
}
std::vector<ElementValue*> values_;
};
// See sec.4.7.16 of JVM spec.
struct Annotation {
virtual ~Annotation() {
for (size_t i = 0; i < element_value_pairs_.size(); i++) {
delete element_value_pairs_[i]->element_value_;
delete element_value_pairs_[i];
}
}
void ExtractClassNames() {
for (size_t i = 0; i < element_value_pairs_.size(); i++) {
element_value_pairs_[i]->element_value_->ExtractClassNames();
}
}
void Write(u1 *&p) {
put_u2be(p, type_->slot());
put_u2be(p, element_value_pairs_.size());
for (size_t ii = 0; ii < element_value_pairs_.size(); ++ii) {
put_u2be(p, element_value_pairs_[ii]->element_name_->slot());
element_value_pairs_[ii]->element_value_->Write(p);
}
}
static Annotation *Read(const u1 *&p) {
Annotation *value = new Annotation;
value->type_ = constant(get_u2be(p));
u2 num_element_value_pairs = get_u2be(p);
for (int ii = 0; ii < num_element_value_pairs; ++ii) {
ElementValuePair *pair = new ElementValuePair;
pair->element_name_ = constant(get_u2be(p));
pair->element_value_ = ElementValue::Read(p);
value->element_value_pairs_.push_back(pair);
}
return value;
}
Constant *type_;
struct ElementValuePair {
Constant *element_name_;
ElementValue *element_value_;
};
std::vector<ElementValuePair*> element_value_pairs_;
};
// See sec 4.7.20 of Java 8 JVM Spec
//
// Each entry in the annotations table represents a single run-time visible
// annotation on a type used in a declaration or expression. The type_annotation
// structure has the following format:
//
// type_annotation {
// u1 target_type;
// union {
// type_parameter_target;
// supertype_target;
// type_parameter_bound_target;
// empty_target;
// method_formal_parameter_target;
// throws_target;
// localvar_target;
// catch_target;
// offset_target;
// type_argument_target;
// } target_info;
// type_path target_path;
// u2 type_index;
// u2 num_element_value_pairs;
// {
// u2 element_name_index;
// element_value value;
// }
// element_value_pairs[num_element_value_pairs];
// }
//
struct TypeAnnotation {
virtual ~TypeAnnotation() {
delete target_info_;
delete type_path_;
delete annotation_;
}
void ExtractClassNames() {
annotation_->ExtractClassNames();
}
void Write(u1 *&p) {
put_u1(p, target_type_);
target_info_->Write(p);
type_path_->Write(p);
annotation_->Write(p);
}
static TypeAnnotation *Read(const u1 *&p) {
TypeAnnotation *value = new TypeAnnotation;
value->target_type_ = get_u1(p);
value->target_info_ = ReadTargetInfo(p, value->target_type_);
value->type_path_ = TypePath::Read(p);
value->annotation_ = Annotation::Read(p);
return value;
}
struct TargetInfo {
virtual ~TargetInfo() {}
virtual void Write(u1 *&p) = 0;
};
struct TypeParameterTargetInfo : TargetInfo {
void Write(u1 *&p) {
put_u1(p, type_parameter_index_);
}
static TypeParameterTargetInfo *Read(const u1 *&p) {
TypeParameterTargetInfo *value = new TypeParameterTargetInfo;
value->type_parameter_index_ = get_u1(p);
return value;
}
u1 type_parameter_index_;
};
struct ClassExtendsInfo : TargetInfo {
void Write(u1 *&p) {
put_u2be(p, supertype_index_);
}
static ClassExtendsInfo *Read(const u1 *&p) {
ClassExtendsInfo *value = new ClassExtendsInfo;
value->supertype_index_ = get_u2be(p);
return value;
}
u2 supertype_index_;
};
struct TypeParameterBoundInfo : TargetInfo {
void Write(u1 *&p) {
put_u1(p, type_parameter_index_);
put_u1(p, bound_index_);
}
static TypeParameterBoundInfo *Read(const u1 *&p) {
TypeParameterBoundInfo *value = new TypeParameterBoundInfo;
value->type_parameter_index_ = get_u1(p);
value->bound_index_ = get_u1(p);
return value;
}
u1 type_parameter_index_;
u1 bound_index_;
};
struct EmptyInfo : TargetInfo {
void Write(u1 *& /*p*/) {}
static EmptyInfo *Read(const u1 *& /*p*/) { return new EmptyInfo; }
};
struct MethodFormalParameterInfo : TargetInfo {
void Write(u1 *&p) {
put_u1(p, method_formal_parameter_index_);
}
static MethodFormalParameterInfo *Read(const u1 *&p) {
MethodFormalParameterInfo *value = new MethodFormalParameterInfo;
value->method_formal_parameter_index_ = get_u1(p);
return value;
}
u1 method_formal_parameter_index_;
};
struct ThrowsTypeInfo : TargetInfo {
void Write(u1 *&p) {
put_u2be(p, throws_type_index_);
}
static ThrowsTypeInfo *Read(const u1 *&p) {
ThrowsTypeInfo *value = new ThrowsTypeInfo;
value->throws_type_index_ = get_u2be(p);
return value;
}
u2 throws_type_index_;
};
static TargetInfo *ReadTargetInfo(const u1 *&p, u1 target_type) {
switch (target_type) {
case CLASS_TYPE_PARAMETER:
case METHOD_TYPE_PARAMETER:
return TypeParameterTargetInfo::Read(p);
case CLASS_EXTENDS:
return ClassExtendsInfo::Read(p);
case CLASS_TYPE_PARAMETER_BOUND:
case METHOD_TYPE_PARAMETER_BOUND:
return TypeParameterBoundInfo::Read(p);
case FIELD:
case METHOD_RETURN:
case METHOD_RECEIVER:
return new EmptyInfo;
case METHOD_FORMAL_PARAMETER:
return MethodFormalParameterInfo::Read(p);
case THROWS:
return ThrowsTypeInfo::Read(p);
default:
fprintf(stderr, "Illegal type annotation target type: %d\n",
target_type);
abort();
}
}
struct TypePath {
void Write(u1 *&p) {
put_u1(p, path_.size());
for (TypePathEntry entry : path_) {
put_u1(p, entry.type_path_kind_);
put_u1(p, entry.type_argument_index_);
}
}
static TypePath *Read(const u1 *&p) {
TypePath *value = new TypePath;
u1 path_length = get_u1(p);
for (int ii = 0; ii < path_length; ++ii) {
TypePathEntry entry;
entry.type_path_kind_ = get_u1(p);
entry.type_argument_index_ = get_u1(p);
value->path_.push_back(entry);
}
return value;
}
struct TypePathEntry {
u1 type_path_kind_;
u1 type_argument_index_;
};
std::vector<TypePathEntry> path_;
};
u1 target_type_;
TargetInfo *target_info_;
TypePath *type_path_;
Annotation *annotation_;
};
struct AnnotationTypeElementValue : ElementValue {
virtual ~AnnotationTypeElementValue() {
delete annotation_;
}
void Write(u1 *&p) {
put_u1(p, tag_);
annotation_->Write(p);
}
static AnnotationTypeElementValue *Read(const u1 *&p) {
AnnotationTypeElementValue *value = new AnnotationTypeElementValue;
value->annotation_ = Annotation::Read(p);
return value;
}
Annotation *annotation_;
};
ElementValue* ElementValue::Read(const u1 *&p) {
const u1* start = p;
ElementValue *result;
u1 tag = get_u1(p);
if (tag != 0 && strchr("BCDFIJSZs", (char) tag) != NULL) {
result = BaseTypeElementValue::Read(p);
} else if ((char) tag == 'e') {
result = EnumTypeElementValue::Read(p);
} else if ((char) tag == 'c') {
result = ClassTypeElementValue::Read(p);
} else if ((char) tag == '[') {
result = ArrayTypeElementValue::Read(p);
} else if ((char) tag == '@') {
result = AnnotationTypeElementValue::Read(p);
} else {
fprintf(stderr, "Illegal element_value::tag: %d\n", tag);
abort();
}
result->tag_ = tag;
result->length_ = p - start;
return result;
}
// See sec.4.7.20 of JVM spec.
// We preserve AnnotationDefault attributes because they are required
// in order to make use of an annotation in new code.
struct AnnotationDefaultAttribute : Attribute {
virtual ~AnnotationDefaultAttribute() {
delete default_value_;
}
static AnnotationDefaultAttribute* Read(const u1 *&p,
Constant *attribute_name) {
AnnotationDefaultAttribute *attr = new AnnotationDefaultAttribute;
attr->attribute_name_ = attribute_name;
attr->default_value_ = ElementValue::Read(p);
return attr;
}
void Write(u1 *&p) {
WriteProlog(p, default_value_->length_);
default_value_->Write(p);
}
virtual void ExtractClassNames() {
default_value_->ExtractClassNames();
}
ElementValue *default_value_;
};
// See sec.4.7.2 of JVM spec.
// We preserve ConstantValue attributes because they are required for
// compile-time constant propagation.
struct ConstantValueAttribute : Attribute {
static ConstantValueAttribute* Read(const u1 *&p, Constant *attribute_name) {
ConstantValueAttribute *attr = new ConstantValueAttribute;
attr->attribute_name_ = attribute_name;
attr->constantvalue_ = constant(get_u2be(p));
return attr;
}
void Write(u1 *&p) {
WriteProlog(p, 2);
put_u2be(p, constantvalue_->slot());
}
Constant *constantvalue_;
};
// See sec.4.7.9 of JVM spec.
// We preserve Signature attributes because they are required by the
// compiler for type-checking of generics.
struct SignatureAttribute : Attribute {
static SignatureAttribute* Read(const u1 *&p, Constant *attribute_name) {
SignatureAttribute *attr = new SignatureAttribute;
attr->attribute_name_ = attribute_name;
attr->signature_ = constant(get_u2be(p));
return attr;
}
void Write(u1 *&p) {
WriteProlog(p, 2);
put_u2be(p, signature_->slot());
}
virtual void ExtractClassNames() {
size_t signature_idx = 0;
devtools_ijar::ExtractClassNames(signature_->Display(), &signature_idx);
}
Constant *signature_;
};
// See sec.4.7.15 of JVM spec.
// We preserve Deprecated attributes because they are required by the
// compiler to generate warning messages.
struct DeprecatedAttribute : Attribute {
static DeprecatedAttribute *Read(const u1 *& /*p*/,
Constant *attribute_name) {
DeprecatedAttribute *attr = new DeprecatedAttribute;
attr->attribute_name_ = attribute_name;
return attr;
}
void Write(u1 *&p) {
WriteProlog(p, 0);
}
};
// See sec.4.7.16-17 of JVM spec v3. Includes RuntimeVisible and
// RuntimeInvisible.
//
// We preserve all annotations.
struct AnnotationsAttribute : Attribute {
virtual ~AnnotationsAttribute() {
for (size_t i = 0; i < annotations_.size(); i++) {
delete annotations_[i];
}
}
static AnnotationsAttribute* Read(const u1 *&p, Constant *attribute_name) {
AnnotationsAttribute *attr = new AnnotationsAttribute;
attr->attribute_name_ = attribute_name;
u2 num_annotations = get_u2be(p);
for (int ii = 0; ii < num_annotations; ++ii) {
Annotation *annotation = Annotation::Read(p);
attr->annotations_.push_back(annotation);
}
return attr;
}
virtual void ExtractClassNames() {
for (auto *annotation : annotations_) {
annotation->ExtractClassNames();
}
}
virtual bool KeepForCompile() const {
for (auto *annotation : annotations_) {
if (annotation->type_->Display() == "Lkotlin/Metadata;") {
return true;
}
}
return false;
}
void Write(u1 *&p) {
WriteProlog(p, -1);
u1 *payload_start = p - 4;
put_u2be(p, annotations_.size());
for (auto *annotation : annotations_) {
annotation->Write(p);
}
put_u4be(payload_start, p - 4 - payload_start); // backpatch length
}
std::vector<Annotation*> annotations_;
};
// See sec.4.7.18-19 of JVM spec. Includes RuntimeVisible and
// RuntimeInvisible.
//
// We preserve all annotations.
struct ParameterAnnotationsAttribute : Attribute {
static ParameterAnnotationsAttribute* Read(const u1 *&p,
Constant *attribute_name) {
ParameterAnnotationsAttribute *attr = new ParameterAnnotationsAttribute;
attr->attribute_name_ = attribute_name;
u1 num_parameters = get_u1(p);
for (int ii = 0; ii < num_parameters; ++ii) {
std::vector<Annotation*> annotations;
u2 num_annotations = get_u2be(p);
for (int ii = 0; ii < num_annotations; ++ii) {
Annotation *annotation = Annotation::Read(p);
annotations.push_back(annotation);
}
attr->parameter_annotations_.push_back(annotations);
}
return attr;
}
virtual void ExtractClassNames() {
for (size_t i = 0; i < parameter_annotations_.size(); i++) {
const std::vector<Annotation*>& annotations = parameter_annotations_[i];
for (size_t j = 0; j < annotations.size(); j++) {
annotations[j]->ExtractClassNames();
}
}
}
void Write(u1 *&p) {
WriteProlog(p, -1);
u1 *payload_start = p - 4;
put_u1(p, parameter_annotations_.size());
for (size_t ii = 0; ii < parameter_annotations_.size(); ++ii) {
std::vector<Annotation *> &annotations = parameter_annotations_[ii];
put_u2be(p, annotations.size());
for (size_t jj = 0; jj < annotations.size(); ++jj) {
annotations[jj]->Write(p);
}
}
put_u4be(payload_start, p - 4 - payload_start); // backpatch length
}
std::vector<std::vector<Annotation*> > parameter_annotations_;
};
// See sec.4.7.20 of Java 8 JVM spec. Includes RuntimeVisibleTypeAnnotations
// and RuntimeInvisibleTypeAnnotations.
struct TypeAnnotationsAttribute : Attribute {
static TypeAnnotationsAttribute *Read(const u1 *&p, Constant *attribute_name,
u4 /*attribute_length*/) {
auto attr = new TypeAnnotationsAttribute;
attr->attribute_name_ = attribute_name;
u2 num_annotations = get_u2be(p);
for (int ii = 0; ii < num_annotations; ++ii) {
TypeAnnotation *annotation = TypeAnnotation::Read(p);
attr->type_annotations_.push_back(annotation);
}
return attr;
}
virtual void ExtractClassNames() {
for (auto *type_annotation : type_annotations_) {
type_annotation->ExtractClassNames();
}
}
void Write(u1 *&p) {
WriteProlog(p, -1);
u1 *payload_start = p - 4;
put_u2be(p, type_annotations_.size());
for (TypeAnnotation *annotation : type_annotations_) {
annotation->Write(p);
}
put_u4be(payload_start, p - 4 - payload_start); // backpatch length
}
std::vector<TypeAnnotation*> type_annotations_;
};
// See JVMS §4.7.24
struct MethodParametersAttribute : Attribute {
static MethodParametersAttribute *Read(const u1 *&p, Constant *attribute_name,
u4 /*attribute_length*/) {
auto attr = new MethodParametersAttribute;
attr->attribute_name_ = attribute_name;
u1 parameters_count = get_u1(p);
for (int ii = 0; ii < parameters_count; ++ii) {
MethodParameter* parameter = new MethodParameter;
int name_id = get_u2be(p);
parameter->name_ = name_id == 0 ? NULL : constant(name_id);
parameter->access_flags_ = get_u2be(p);
attr->parameters_.push_back(parameter);
}
return attr;
}
void Write(u1 *&p) {
WriteProlog(p, -1);
u1 *payload_start = p - 4;
put_u1(p, parameters_.size());
for (MethodParameter* parameter : parameters_) {
put_u2be(p, parameter->name_ == NULL ? 0 : parameter->name_->slot());
put_u2be(p, parameter->access_flags_);
}
put_u4be(payload_start, p - 4 - payload_start); // backpatch length
}
struct MethodParameter {
Constant *name_;
u2 access_flags_;
};
std::vector<MethodParameter*> parameters_;
};
// See JVMS §4.7.28
struct NestHostAttribute : Attribute {
static NestHostAttribute *Read(const u1 *&p, Constant *attribute_name,
u4 /*attribute_length*/) {
auto attr = new NestHostAttribute;
attr->attribute_name_ = attribute_name;
attr->host_class_index_ = constant(get_u2be(p));
return attr;
}
void Write(u1 *&p) {
WriteProlog(p, 2);
put_u2be(p, host_class_index_->slot());
}
Constant *host_class_index_;
};
// See JVMS §4.7.29
struct NestMembersAttribute : Attribute {
static NestMembersAttribute *Read(const u1 *&p, Constant *attribute_name,
u4 /*attribute_length*/) {
auto attr = new NestMembersAttribute;
attr->attribute_name_ = attribute_name;
u2 number_of_classes = get_u2be(p);
for (int ii = 0; ii < number_of_classes; ++ii) {
attr->classes_.push_back(constant(get_u2be(p)));
}
return attr;
}
void Write(u1 *&p) {
std::set<int> kept_entries;
for (size_t ii = 0; ii < classes_.size(); ++ii) {
Constant *class_ = classes_[ii];
if (class_->Kept() || (used_class_names.find(class_->Display()) !=
used_class_names.end())) {
kept_entries.insert(ii);
}
}
if (kept_entries.empty()) {
return;
}
WriteProlog(p, kept_entries.size() * 2 + 2);
put_u2be(p, kept_entries.size());
for (std::set<int>::iterator it = kept_entries.begin();
it != kept_entries.end(); ++it) {
put_u2be(p, classes_[*it]->slot());
}
}
std::vector<Constant *> classes_;
};
// See JVMS §4.7.30
struct RecordAttribute : Attribute {
static RecordAttribute *Read(const u1 *&p, Constant *attribute_name,
u4 attribute_length) {
auto attr = new RecordAttribute;
attr->attribute_name_ = attribute_name;
attr->attribute_length_ = attribute_length;
u2 components_length = get_u2be(p);
for (int i = 0; i < components_length; ++i) {
attr->components_.push_back(RecordComponentInfo::Read(p));
}
return attr;
}
void Write(u1 *&p) {
u1 *tmp = new u1[attribute_length_];
u1 *start = tmp;
put_u2be(tmp, components_.size());
for (size_t i = 0; i < components_.size(); ++i) {
components_[i]->Write(tmp);
}
u2 length = tmp - start;
WriteProlog(p, length);
memcpy(p, start, length);
p += length;
}
struct RecordComponentInfo : HasAttrs {
void Write(u1 *&p) {
put_u2be(p, name_->slot());
put_u2be(p, descriptor_->slot());
WriteAttrs(p);
}
static RecordComponentInfo *Read(const u1 *&p) {
RecordComponentInfo *value = new RecordComponentInfo;
value->name_ = constant(get_u2be(p));
value->descriptor_ = constant(get_u2be(p));
value->ReadAttrs(p);
return value;
}
Constant *name_;
Constant *descriptor_;
};
u4 attribute_length_;
std::vector<RecordComponentInfo *> components_;
};
// See JVMS §4.7.31
struct PermittedSubclassesAttribute : Attribute {
static PermittedSubclassesAttribute *Read(const u1 *&p,
Constant *attribute_name) {
PermittedSubclassesAttribute *attr = new PermittedSubclassesAttribute;
attr->attribute_name_ = attribute_name;
u2 number_of_exceptions = get_u2be(p);
for (int ii = 0; ii < number_of_exceptions; ++ii) {
attr->permitted_subclasses_.push_back(constant(get_u2be(p)));
}
return attr;
}
void Write(u1 *&p) {
WriteProlog(p, permitted_subclasses_.size() * 2 + 2);
put_u2be(p, permitted_subclasses_.size());
for (size_t ii = 0; ii < permitted_subclasses_.size(); ++ii) {
put_u2be(p, permitted_subclasses_[ii]->slot());
}
}
std::vector<Constant *> permitted_subclasses_;
};
struct GeneralAttribute : Attribute {
static GeneralAttribute* Read(const u1 *&p, Constant *attribute_name,
u4 attribute_length) {
auto attr = new GeneralAttribute;
attr->attribute_name_ = attribute_name;
attr->attribute_length_ = attribute_length;
attr->attribute_content_ = p;
p += attribute_length;
return attr;
}
void Write(u1 *&p) {
WriteProlog(p, attribute_length_);
put_n(p, attribute_content_, attribute_length_);
}
u4 attribute_length_;
const u1 *attribute_content_;
};
/**********************************************************************
* *
* ClassFile *
* *
**********************************************************************/
// A field or method.
// See sec.4.5 and 4.6 of JVM spec.
struct Member : HasAttrs {
u2 access_flags;
Constant *name;
Constant *descriptor;
static Member* Read(const u1 *&p) {
Member *m = new Member;
m->access_flags = get_u2be(p);
m->name = constant(get_u2be(p));
m->descriptor = constant(get_u2be(p));
m->ReadAttrs(p);
return m;
}
void Write(u1 *&p) {
put_u2be(p, access_flags);
put_u2be(p, name->slot());
put_u2be(p, descriptor->slot());
WriteAttrs(p);
}
};
// See sec.4.1 of JVM spec.
struct ClassFile : HasAttrs {
size_t length;
// Header:
u4 magic;
u2 major;
u2 minor;
// Body:
u2 access_flags;
Constant *this_class;
Constant *super_class;
std::vector<Constant*> interfaces;
std::vector<Member*> fields;
std::vector<Member*> methods;
virtual ~ClassFile() {
for (size_t i = 0; i < fields.size(); i++) {
delete fields[i];
}
for (size_t i = 0; i < methods.size(); i++) {
delete methods[i];
}
// Constants do not need to be deleted; they are owned by the constant pool.
}
void WriteClass(u1 *&p);
bool ReadConstantPool(const u1 *&p);
bool KeepForCompile();
bool IsLocalOrAnonymous();
void WriteHeader(u1 *&p) {
put_u4be(p, magic);
put_u2be(p, major);
put_u2be(p, minor);
put_u2be(p, const_pool_out.size());
for (u2 ii = 1; ii < const_pool_out.size(); ++ii) {
if (const_pool_out[ii] != NULL) { // NB: NULLs appear after long/double.
const_pool_out[ii]->Write(p);
}
}
}
void WriteBody(u1 *&p) {
put_u2be(p, access_flags);
put_u2be(p, this_class->slot());
put_u2be(p, super_class == NULL ? 0 : super_class->slot());
put_u2be(p, interfaces.size());
for (size_t ii = 0; ii < interfaces.size(); ++ii) {
put_u2be(p, interfaces[ii]->slot());
}
put_u2be(p, fields.size());
for (size_t ii = 0; ii < fields.size(); ++ii) {
fields[ii]->Write(p);
}
put_u2be(p, methods.size());
for (size_t ii = 0; ii < methods.size(); ++ii) {
methods[ii]->Write(p);
}
Attribute* inner_classes = NULL;
// Make the inner classes attribute the last, so that it can know which
// constants were needed
for (size_t ii = 0; ii < attributes.size(); ii++) {
if (attributes[ii]->attribute_name_->Display() == "InnerClasses") {
inner_classes = attributes[ii];
attributes.erase(attributes.begin() + ii);
break;
}
}
if (inner_classes != NULL) {
attributes.push_back(inner_classes);
}
Attribute* nest_members = NULL;
for (size_t ii = 0; ii < attributes.size(); ii++) {
if (attributes[ii]->attribute_name_->Display() == "NestMembers") {
nest_members = attributes[ii];
attributes.erase(attributes.begin() + ii);
break;
}
}
if (nest_members != NULL) {
attributes.push_back(nest_members);
}
WriteAttrs(p);
}
};
void HasAttrs::ReadAttrs(const u1 *&p) {
u2 attributes_count = get_u2be(p);
for (int ii = 0; ii < attributes_count; ii++) {
Constant *attribute_name = constant(get_u2be(p));
u4 attribute_length = get_u4be(p);
std::string attr_name = attribute_name->Display();
if (attr_name == "SourceFile" ||
attr_name == "StackMapTable" ||
attr_name == "LineNumberTable" ||
attr_name == "LocalVariableTable" ||
attr_name == "LocalVariableTypeTable" ||
attr_name == "Code" ||
attr_name == "Synthetic" ||
attr_name == "BootstrapMethods" ||
attr_name == "SourceDebugExtension") {
p += attribute_length; // drop these attributes
} else if (attr_name == "Exceptions") {
attributes.push_back(ExceptionsAttribute::Read(p, attribute_name));
} else if (attr_name == "Signature") {
attributes.push_back(SignatureAttribute::Read(p, attribute_name));
} else if (attr_name == "Deprecated") {
attributes.push_back(DeprecatedAttribute::Read(p, attribute_name));
} else if (attr_name == "EnclosingMethod") {
attributes.push_back(EnclosingMethodAttribute::Read(p, attribute_name));
} else if (attr_name == "InnerClasses") {
// TODO(bazel-team): omit private inner classes
attributes.push_back(InnerClassesAttribute::Read(p, attribute_name));
} else if (attr_name == "AnnotationDefault") {
attributes.push_back(AnnotationDefaultAttribute::Read(p, attribute_name));
} else if (attr_name == "ConstantValue") {
attributes.push_back(ConstantValueAttribute::Read(p, attribute_name));
} else if (attr_name == "RuntimeVisibleAnnotations" ||
attr_name == "RuntimeInvisibleAnnotations") {
attributes.push_back(AnnotationsAttribute::Read(p, attribute_name));
} else if (attr_name == "RuntimeVisibleParameterAnnotations" ||
attr_name == "RuntimeInvisibleParameterAnnotations") {
attributes.push_back(
ParameterAnnotationsAttribute::Read(p, attribute_name));
} else if (attr_name == "Scala" ||
attr_name == "ScalaSig" ||
attr_name == "ScalaInlineInfo" ||
attr_name == "TurbineTransitiveJar") {
// These are opaque blobs, so can be handled with a general
// attribute handler
attributes.push_back(GeneralAttribute::Read(p, attribute_name,
attribute_length));
} else if (attr_name == "RuntimeVisibleTypeAnnotations" ||
attr_name == "RuntimeInvisibleTypeAnnotations") {
attributes.push_back(TypeAnnotationsAttribute::Read(p, attribute_name,
attribute_length));
} else if (attr_name == "MethodParameters") {
attributes.push_back(
MethodParametersAttribute::Read(p, attribute_name, attribute_length));
} else if (attr_name == "NestHost") {
attributes.push_back(
NestHostAttribute::Read(p, attribute_name, attribute_length));
} else if (attr_name == "NestMembers") {
attributes.push_back(
NestMembersAttribute::Read(p, attribute_name, attribute_length));
} else if (attr_name == "Record") {
attributes.push_back(
RecordAttribute::Read(p, attribute_name, attribute_length));
} else if (attr_name == "PermittedSubclasses") {
attributes.push_back(
PermittedSubclassesAttribute::Read(p, attribute_name));
} else {
// Skip over unknown attributes with a warning. The JVM spec
// says this is ok, so long as we handle the mandatory attributes.
// Don't even warn for the D8 desugar SynthesizedClass attribute. It is
// not relevant for ijar.
if (attr_name != "com.android.tools.r8.SynthesizedClass" &&
attr_name != "com.android.tools.r8.SynthesizedClassV2") {
// Only warn about the first occurrence of each unknown attribute.
if (unknown_attributes.insert(attr_name).second) {
fprintf(stderr, "ijar: skipping unknown attribute: \"%s\".\n",
attr_name.c_str());
}
}
p += attribute_length;
}
}
}
void HasAttrs::WriteAttrs(u1 *&p) {
u1* p_size = p;
put_u2be(p, 0);
int n_written_attrs = 0;
for (size_t ii = 0; ii < attributes.size(); ii++) {
u1* before = p;
attributes[ii]->Write(p);
if (p != before) {
n_written_attrs++;
}
}
put_u2be(p_size, n_written_attrs);
}
// See sec.4.4 of JVM spec.
bool ClassFile::ReadConstantPool(const u1 *&p) {
const_pool_in.clear();
const_pool_in.push_back(NULL); // dummy first item
u2 cp_count = get_u2be(p);
for (int ii = 1; ii < cp_count; ++ii) {
u1 tag = get_u1(p);
if (devtools_ijar::verbose) {
fprintf(stderr, "cp[%d/%d] = tag %d\n", ii, cp_count, tag);
}
switch(tag) {
case CONSTANT_Class: {
u2 name_index = get_u2be(p);
const_pool_in.push_back(new Constant_Class(name_index));
break;
}
case CONSTANT_FieldRef:
case CONSTANT_Methodref:
case CONSTANT_Interfacemethodref: {
u2 class_index = get_u2be(p);
u2 nti = get_u2be(p);
const_pool_in.push_back(new Constant_FMIref(tag, class_index, nti));
break;
}
case CONSTANT_String: {
u2 string_index = get_u2be(p);
const_pool_in.push_back(new Constant_String(string_index));
break;
}
case CONSTANT_NameAndType: {
u2 name_index = get_u2be(p);
u2 descriptor_index = get_u2be(p);
const_pool_in.push_back(
new Constant_NameAndType(name_index, descriptor_index));
break;
}
case CONSTANT_Utf8: {
u2 length = get_u2be(p);
if (devtools_ijar::verbose) {
fprintf(stderr, "Utf8: \"%s\" (%d)\n",
std::string((const char*) p, length).c_str(), length);
}
const_pool_in.push_back(new Constant_Utf8(length, p));
p += length;
break;
}
case CONSTANT_Integer:
case CONSTANT_Float: {
u4 bytes = get_u4be(p);
const_pool_in.push_back(new Constant_IntegerOrFloat(tag, bytes));
break;
}
case CONSTANT_Long:
case CONSTANT_Double: {
u4 high_bytes = get_u4be(p);
u4 low_bytes = get_u4be(p);
const_pool_in.push_back(
new Constant_LongOrDouble(tag, high_bytes, low_bytes));
// Longs and doubles occupy two constant pool slots.
// ("In retrospect, making 8-byte constants take two "constant
// pool entries was a poor choice." --JVM Spec.)
const_pool_in.push_back(NULL);
ii++;
break;
}
case CONSTANT_MethodHandle: {
u1 reference_kind = get_u1(p);
u2 reference_index = get_u2be(p);
const_pool_in.push_back(
new Constant_MethodHandle(reference_kind, reference_index));
break;
}
case CONSTANT_MethodType: {
u2 descriptor_index = get_u2be(p);
const_pool_in.push_back(new Constant_MethodType(descriptor_index));
break;
}
case CONSTANT_Dynamic: {
u2 bootstrap_method_attr = get_u2be(p);
u2 name_name_type_index = get_u2be(p);
const_pool_in.push_back(
new Constant_Dynamic(bootstrap_method_attr, name_name_type_index));
break;
}
case CONSTANT_InvokeDynamic: {
u2 bootstrap_method_attr = get_u2be(p);
u2 name_name_type_index = get_u2be(p);
const_pool_in.push_back(new Constant_InvokeDynamic(
bootstrap_method_attr, name_name_type_index));
break;
}
default: {
fprintf(stderr, "Unknown constant: %hhu. Passing class through.\n",
tag);
return false;
}
}
}
return true;
}
bool ClassFile::IsLocalOrAnonymous() {
for (const Attribute *attribute : attributes) {
if (attribute->attribute_name_->Display() == "EnclosingMethod") {
// JVMS 4.7.6: a class must has EnclosingMethod attribute iff it
// represents a local class or an anonymous class
return true;
}
}
return false;
}
static bool HasKeepForCompile(const std::vector<Attribute *> attributes) {
for (const Attribute *attribute : attributes) {
if (attribute->KeepForCompile()) {
return true;
}
}
return false;
}
bool ClassFile::KeepForCompile() {
if (HasKeepForCompile(attributes)) {
return true;
}
return false;
}
static ClassFile *ReadClass(const void *classdata, size_t length) {
const u1 *p = (u1*) classdata;
ClassFile *clazz = new ClassFile;
clazz->length = length;
clazz->magic = get_u4be(p);
if (clazz->magic != 0xCAFEBABE) {
fprintf(stderr, "Bad magic %" PRIx32 "\n", clazz->magic);
abort();
}
clazz->major = get_u2be(p);
clazz->minor = get_u2be(p);
if (!clazz->ReadConstantPool(p)) {
delete clazz;
return NULL;
}
clazz->access_flags = get_u2be(p);
clazz->this_class = constant(get_u2be(p));
class_name = clazz->this_class;
u2 super_class_id = get_u2be(p);
clazz->super_class = super_class_id == 0 ? NULL : constant(super_class_id);
u2 interfaces_count = get_u2be(p);
for (int ii = 0; ii < interfaces_count; ++ii) {
clazz->interfaces.push_back(constant(get_u2be(p)));
}
u2 fields_count = get_u2be(p);
for (int ii = 0; ii < fields_count; ++ii) {
Member *field = Member::Read(p);
if ((field->access_flags & ACC_PRIVATE) == ACC_PRIVATE) {
// drop private fields
continue;
}
clazz->fields.push_back(field);
}
u2 methods_count = get_u2be(p);
for (int ii = 0; ii < methods_count; ++ii) {
Member *method = Member::Read(p);
// drop class initializers
if (method->name->Display() == "<clinit>") continue;
if ((method->access_flags & ACC_PRIVATE) == ACC_PRIVATE) {
// drop private methods
continue;
}
if ((method->access_flags & (ACC_SYNTHETIC | ACC_BRIDGE | ACC_PUBLIC |
ACC_PROTECTED)) == ACC_SYNTHETIC) {
// drop package-private non-bridge synthetic methods, e.g. synthetic
// constructors used to instantiate private nested classes within their
// declaring compilation unit
continue;
}
clazz->methods.push_back(method);
}
clazz->ReadAttrs(p);
return clazz;
}
// In theory, '/' is also reserved, but it's okay if we just parse package
// identifiers as part of the class name. Note that signatures are UTF-8, but
// this works just as well as in plain ASCII.
static const char *SIGNATURE_NON_IDENTIFIER_CHARS = ".;[<>:";
void Expect(const std::string& desc, size_t* p, char expected) {
if (desc[*p] != expected) {
fprintf(stderr, "Expected '%c' in '%s' at %zd in signature\n",
expected, desc.substr(*p).c_str(), *p);
exit(1);
}
*p += 1;
}
// These functions form a crude recursive descent parser for descriptors and
// signatures in class files (see JVM spec 4.3).
//
// This parser is a bit more liberal than the spec, but this should be fine,
// because it accepts all valid class files and croaks only on invalid ones.
void ParseFromClassTypeSignature(const std::string& desc, size_t* p);
void ParseSimpleClassTypeSignature(const std::string& desc, size_t* p);
void ParseClassTypeSignatureSuffix(const std::string& desc, size_t* p);
void ParseIdentifier(const std::string& desc, size_t* p);
void ParseTypeArgumentsOpt(const std::string& desc, size_t* p);
void ParseMethodDescriptor(const std::string& desc, size_t* p);
void ParseClassTypeSignature(const std::string& desc, size_t* p) {
Expect(desc, p, 'L');
ParseSimpleClassTypeSignature(desc, p);
ParseClassTypeSignatureSuffix(desc, p);
Expect(desc, p, ';');
}
void ParseSimpleClassTypeSignature(const std::string& desc, size_t* p) {
ParseIdentifier(desc, p);
ParseTypeArgumentsOpt(desc, p);
}
void ParseClassTypeSignatureSuffix(const std::string& desc, size_t* p) {
while (desc[*p] == '.') {
*p += 1;
ParseSimpleClassTypeSignature(desc, p);
}
}
void ParseIdentifier(const std::string& desc, size_t* p) {
size_t next = desc.find_first_of(SIGNATURE_NON_IDENTIFIER_CHARS, *p);
std::string id = desc.substr(*p, next - *p);
used_class_names.insert(id);
*p = next;
}
void ParseTypeArgumentsOpt(const std::string& desc, size_t* p) {
if (desc[*p] != '<') {
return;
}
*p += 1;
while (desc[*p] != '>') {
switch (desc[*p]) {
case '*':
*p += 1;
break;
case '+':
case '-':
*p += 1;
ExtractClassNames(desc, p);
break;
default:
ExtractClassNames(desc, p);
break;
}
}
*p += 1;
}
void ParseMethodDescriptor(const std::string& desc, size_t* p) {
Expect(desc, p, '(');
while (desc[*p] != ')') {
ExtractClassNames(desc, p);
}
Expect(desc, p, ')');
ExtractClassNames(desc, p);
}
void ParseFormalTypeParameters(const std::string& desc, size_t* p) {
Expect(desc, p, '<');
while (desc[*p] != '>') {
ParseIdentifier(desc, p);
Expect(desc, p, ':');
if (desc[*p] != ':' && desc[*p] != '>') {
ExtractClassNames(desc, p);
}
while (desc[*p] == ':') {
Expect(desc, p, ':');
ExtractClassNames(desc, p);
}
}
Expect(desc, p, '>');
}
void ExtractClassNames(const std::string& desc, size_t* p) {
switch (desc[*p]) {
case '<':
ParseFormalTypeParameters(desc, p);
ExtractClassNames(desc, p);
break;
case 'L':
ParseClassTypeSignature(desc, p);
break;
case '[':
*p += 1;
ExtractClassNames(desc, p);
break;
case 'T':
*p += 1;
ParseIdentifier(desc, p);
Expect(desc, p, ';');
break;
case '(':
ParseMethodDescriptor(desc, p);
break;
case 'B':
case 'C':
case 'D':
case 'F':
case 'I':
case 'J':
case 'S':
case 'Z':
case 'V':
*p += 1;
break;
default:
fprintf(stderr, "Invalid signature %s\n", desc.substr(*p).c_str());
}
}
void ClassFile::WriteClass(u1 *&p) {
used_class_names.clear();
std::vector<Member *> members;
members.insert(members.end(), fields.begin(), fields.end());
members.insert(members.end(), methods.begin(), methods.end());
ExtractClassNames();
for (auto *member : members) {
size_t idx = 0;
devtools_ijar::ExtractClassNames(member->descriptor->Display(), &idx);
member->ExtractClassNames();
}
// We have to write the body out before the header in order to reference
// the essential constants and populate the output constant pool:
u1 *body = new u1[length];
u1 *q = body;
WriteBody(q); // advances q
u4 body_length = q - body;
WriteHeader(p); // advances p
put_n(p, body, body_length);
delete[] body;
}
bool StripClass(u1 *&classdata_out, const u1 *classdata_in, size_t in_length) {
ClassFile *clazz = ReadClass(classdata_in, in_length);
bool keep = true;
if (clazz == NULL || clazz->KeepForCompile()) {
// Class is invalid or kept. Simply copy it to the output and call it a day.
put_n(classdata_out, classdata_in, in_length);
} else if (clazz->IsLocalOrAnonymous()) {
keep = false;
} else {
// Constant pool item zero is a dummy entry. Setting it marks the
// beginning of the output phase; calls to Constant::slot() will
// fail if called prior to this.
const_pool_out.push_back(NULL);
clazz->WriteClass(classdata_out);
delete clazz;
}
// Now clean up all the mess we left behind.
for (size_t i = 0; i < const_pool_in.size(); i++) {
delete const_pool_in[i];
}
const_pool_in.clear();
const_pool_out.clear();
return keep;
}
} // namespace devtools_ijar