Diffstat (limited to 'runtime/jni/local_reference_table.h')
-rw-r--r-- | runtime/jni/local_reference_table.h | 396
1 file changed, 396 insertions, 0 deletions
diff --git a/runtime/jni/local_reference_table.h b/runtime/jni/local_reference_table.h
new file mode 100644
index 0000000000..debaa8b97a
--- /dev/null
+++ b/runtime/jni/local_reference_table.h
@@ -0,0 +1,396 @@

/*
 * Copyright (C) 2022 The Android Open Source Project
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

#ifndef ART_RUNTIME_JNI_LOCAL_REFERENCE_TABLE_H_
#define ART_RUNTIME_JNI_LOCAL_REFERENCE_TABLE_H_

#include <stdint.h>

#include <iosfwd>
#include <limits>
#include <string>
#include <vector>

#include <android-base/logging.h>

#include "base/bit_utils.h"
#include "base/locks.h"
#include "base/macros.h"
#include "base/mem_map.h"
#include "base/mutex.h"
#include "gc_root.h"
#include "indirect_reference_table.h"
#include "obj_ptr.h"
#include "offsets.h"
#include "read_barrier_option.h"

namespace art {

class RootInfo;

namespace mirror {
class Object;
}  // namespace mirror

namespace jni {

// Maintain a table of local references. Used for local JNI references.
// TODO: Rewrite the implementation so that valid local references are effectively
// `CompressedReference<Object>*` and can be decoded very quickly.
//
// The table contains object references, where the strong (local/global) references are part of the
// GC root set (but not the weak global references). When an object is added we return an
// IndirectRef that is not a valid pointer but can be used to find the original value in O(1) time.
// Conversions to and from indirect references are performed on upcalls and downcalls, so they need
// to be very fast.
//
// To be efficient for JNI local variable storage, we need to provide operations that allow us to
// operate on segments of the table, where segments are pushed and popped as if on a stack. For
// example, deletion of an entry should only succeed if it appears in the current segment, and we
// want to be able to strip off the current segment quickly when a method returns. Additions to the
// table must be made in the current segment even if space is available in an earlier area.
//
// A new segment is created when we call into native code from interpreted code, or when we handle
// the JNI PushLocalFrame function.
//
// The GC must be able to scan the entire table quickly.
//
// In summary, these must be very fast:
// - adding or removing a segment
// - adding references to a new segment
// - converting an indirect reference back to an Object
// These can be a little slower, but must still be pretty quick:
// - adding references to a "mature" segment
// - removing individual references
// - scanning the entire table straight through
//
// If there's more than one segment, we don't guarantee that the table will fill completely before
// we fail due to lack of space. We do ensure that the current segment will pack tightly, which
// should satisfy JNI requirements (e.g. EnsureLocalCapacity).
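The segment push/pop behavior described above is exactly what backs the standard JNI
PushLocalFrame/PopLocalFrame pair (the header's own comment notes that PushLocalFrame creates a new
segment). As a rough illustration of how a native caller exercises it, here is a minimal sketch
using only the standard JNI API; the function name and capacity value are illustrative, nothing
here is specific to this header:

#include <jni.h>

// Processes `n` elements of a Java object array without letting local
// references pile up in the caller's segment. Each PushLocalFrame call
// corresponds to pushing a new segment in the local reference table; the
// matching PopLocalFrame pops that segment, freeing every local reference
// created inside it in one step.
void ProcessArray(JNIEnv* env, jobjectArray array, jsize n) {
  for (jsize i = 0; i < n; ++i) {
    if (env->PushLocalFrame(/*capacity=*/ 4) != JNI_OK) {
      return;  // Out of memory; a pending OutOfMemoryError has been thrown.
    }
    jobject element = env->GetObjectArrayElement(array, i);
    // ... use `element`; any locals created here live in the new segment ...
    env->PopLocalFrame(/*result=*/ nullptr);  // Drops `element` and friends.
  }
}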
// Indirect reference definition. This must be interchangeable with JNI's jobject, and it's
// convenient to let null be null, so we use void*.
//
// We need a (potentially) large table index and a 2-bit reference type (global, local, weak
// global). We also reserve some bits to be used to detect stale indirect references: we put a
// serial number in the extra bits, and keep a copy of the serial number in the table. This requires
// more memory and additional memory accesses on add/get, but is moving-GC safe. It will catch
// additional problems, e.g.: create iref1 for obj, delete iref1, create iref2 for the same obj,
// look up iref1. A pattern based on object bits will miss this.

// Table definition.
//
// For the global reference table, the expected common operations are adding a new entry and
// removing a recently-added entry (usually the most-recently-added entry). For JNI local
// references, the common operations are adding a new entry and removing an entire table segment.
//
// If we delete entries from the middle of the list, we will be left with "holes". We track the
// number of holes so that, when adding new elements, we can quickly decide to do a trivial append
// or go slot-hunting.
//
// When the top-most entry is removed, any holes immediately below it are also removed. Thus,
// deletion of an entry may reduce "top_index" by more than one.
//
// To get the desired behavior for JNI locals, we need to know the bottom and top of the current
// "segment". The top is managed internally, and the bottom is passed in as a function argument.
// When we call a native method or push a local frame, the current top index gets pushed on, and
// serves as the new bottom. When we pop a frame off, the value from the stack becomes the new top
// index, and the value stored in the previous frame becomes the new bottom.
//
// Holes are cached locally for the current segment. Otherwise we would have to pass both the
// bottom index and the number of holes, which would restrict us to 16 bits for the top index. The
// value is cached within the table. To avoid code in generated JNI transitions, which implicitly
// form segments, the code for adding and removing references needs to detect the change of a
// segment. Helper fields are used for this detection.
//
// Common alternative implementation: make IndirectRef a pointer to the actual reference slot.
// Instead of getting a table and doing a lookup, the lookup can be done instantly. Operations like
// determining the type and deleting the reference are more expensive because the table must be
// hunted for (i.e. you have to do a pointer comparison to see which table it's in), you can't move
// the table when expanding it (so realloc() is out), and tricks like serial number checking to
// detect stale references aren't possible (though we may be able to get similar benefits with other
// approaches).
//
// TODO: consider a "lastDeleteIndex" for quick hole-filling when an add immediately follows a
// delete; must invalidate it after a segment pop. Might be worth only using it for JNI globals.
//
// TODO: may want completely different add/remove algorithms for global and local refs to improve
// performance. A large circular buffer might reduce the amortized cost of adding global
// references.

// The state of the current segment. We only store the index. Splitting it into an index and a
// hole count would restrict the range too much.
struct LRTSegmentState {
  uint32_t top_index;
};
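To see what the serial-number scheme described above buys, here is a small self-contained sketch.
The constants mirror the description (3 serial bits, 2 kind bits, index above serial above kind,
matching the EncodeIndex/EncodeSerial/EncodeIndirectRefKind helpers declared later in this header),
but the function names and the 16-slot table are hypothetical:

#include <cassert>
#include <cstdint>

// Toy model: pack a table index, a 3-bit serial number, and a 2-bit kind
// into one word, in the layout described above (index | serial | kind).
constexpr unsigned kKindBits = 2;
constexpr unsigned kSerialBits = 3;

constexpr uintptr_t Encode(uint32_t index, uint32_t serial, uint32_t kind) {
  return (static_cast<uintptr_t>(index) << (kSerialBits + kKindBits)) |
         (serial << kKindBits) | kind;
}
constexpr uint32_t DecodeIndex(uintptr_t ref) {
  return static_cast<uint32_t>(ref >> (kSerialBits + kKindBits));
}
constexpr uint32_t DecodeSerial(uintptr_t ref) {
  return static_cast<uint32_t>(ref >> kKindBits) & ((1u << kSerialBits) - 1u);
}

int main() {
  uint32_t table_serial[16] = {};  // Serial number stored alongside each slot.
  // Create iref1 for slot 4, then "delete" it and reuse the slot: the stored
  // serial is bumped, so the stale iref1 no longer matches the table.
  uintptr_t iref1 = Encode(/*index=*/ 4, table_serial[4], /*kind=*/ 1);
  table_serial[4] = (table_serial[4] + 1) & ((1u << kSerialBits) - 1u);  // Slot reused.
  uintptr_t iref2 = Encode(4, table_serial[4], 1);
  assert(DecodeIndex(iref1) == DecodeIndex(iref2));  // Same slot...
  assert(DecodeSerial(iref1) != table_serial[4]);    // ...but iref1 is now stale.
  assert(DecodeSerial(iref2) == table_serial[4]);    // iref2 is current.
  return 0;
}

A lookup scheme based only on the object's bits would return the reused slot's new object for
iref1 without complaint; the serial mismatch is what turns that into a detectable error.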
// Use as the initial value for "cookie", and when the table has only one segment.
static constexpr LRTSegmentState kLRTFirstSegment = { 0 };

// We associate a few bits of serial number with each reference, for error checking.
static constexpr unsigned int kLRTSerialBits = 3;
static constexpr uint32_t kLRTMaxSerial = ((1 << kLRTSerialBits) - 1);

class LrtEntry {
 public:
  void Add(ObjPtr<mirror::Object> obj) REQUIRES_SHARED(Locks::mutator_lock_);

  GcRoot<mirror::Object>* GetReference() {
    DCHECK_LE(serial_, kLRTMaxSerial);
    return &reference_;
  }

  const GcRoot<mirror::Object>* GetReference() const {
    DCHECK_LE(serial_, kLRTMaxSerial);
    return &reference_;
  }

  uint32_t GetSerial() const {
    return serial_;
  }

  void SetReference(ObjPtr<mirror::Object> obj) REQUIRES_SHARED(Locks::mutator_lock_);

 private:
  uint32_t serial_;  // Incremented for each reuse; checked against the reference.
  GcRoot<mirror::Object> reference_;
};
static_assert(sizeof(LrtEntry) == 2 * sizeof(uint32_t), "Unexpected sizeof(LrtEntry)");
static_assert(IsPowerOfTwo(sizeof(LrtEntry)), "Unexpected sizeof(LrtEntry)");

// We initially allocate local reference tables with a very small number of entries, packing
// multiple tables into a single page. If we need to expand one, we allocate it in units of
// pages.
// TODO: We should allocate all LRT tables as nonmovable Java objects. That in turn works better
// if we break up each table into 2 parallel arrays, one for the Java reference, and one for the
// serial number. The current scheme page-aligns regions containing LRT tables, and so allows them
// to be identified and page-protected in the future.
constexpr size_t kInitialLrtBytes = 512;  // Number of bytes in an initial local table.
constexpr size_t kSmallLrtEntries = kInitialLrtBytes / sizeof(LrtEntry);
static_assert(kPageSize % kInitialLrtBytes == 0);
static_assert(kInitialLrtBytes % sizeof(LrtEntry) == 0);
static_assert(kInitialLrtBytes % sizeof(void*) == 0);

// A minimal stopgap allocator for initial small local reference tables.
class SmallLrtAllocator {
 public:
  SmallLrtAllocator();

  // Allocate an LRT table of kSmallLrtEntries entries.
  LrtEntry* Allocate(std::string* error_msg) REQUIRES(!lock_);

  void Deallocate(LrtEntry* unneeded) REQUIRES(!lock_);

 private:
  // A free list of kInitialLrtBytes chunks linked through the first word.
  LrtEntry* small_lrt_freelist_;

  // Repository of MemMaps used for small LRT tables.
  std::vector<MemMap> shared_lrt_maps_;

  Mutex lock_;  // Level kGenericBottomLock; acquired before mem_map_lock_, which is a C++ mutex.
};
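The `small_lrt_freelist_` comment describes a classic allocator trick: free chunks need no
separate node type because the first word of each free chunk stores the link to the next one. A
minimal sketch of that idea, under the same assumption of fixed-size chunks (the `ChunkFreeList`
name and its interface are hypothetical, not the allocator above):

// Each free chunk's first word is reused as the "next" pointer, so the
// free list costs no memory beyond the chunks themselves.
class ChunkFreeList {
 public:
  void Push(void* chunk) {
    *static_cast<void**>(chunk) = head_;  // Link through the first word.
    head_ = chunk;
  }
  void* Pop() {
    void* chunk = head_;
    if (chunk != nullptr) {
      head_ = *static_cast<void**>(chunk);  // Follow the stored link.
    }
    return chunk;  // Caller reinitializes the chunk; the link word is overwritten.
  }
 private:
  void* head_ = nullptr;
};

The chunk must be at least pointer-sized for this to work, which is what the
`kInitialLrtBytes % sizeof(void*) == 0` static_assert above guarantees here.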
class LocalReferenceTable {
 public:
  // Constructs an uninitialized local reference table. Use `Initialize()` to initialize it.
  LocalReferenceTable();

  // Initialize the local reference table.
  //
  // `max_count` is the minimum initial capacity (resizable).
  // A value of 1 indicates an implementation-convenient small size.
  bool Initialize(size_t max_count, std::string* error_msg);

  ~LocalReferenceTable();

  /*
   * Checks whether construction of the LocalReferenceTable succeeded.
   *
   * This object must only be used if IsValid() returns true. It is safe to
   * call IsValid from multiple threads without locking or other explicit
   * synchronization.
   */
  bool IsValid() const;

  // Add a new entry. "obj" must be a valid non-null object reference. This function will
  // return null if an error happened (with an appropriate error message set).
  IndirectRef Add(LRTSegmentState previous_state,
                  ObjPtr<mirror::Object> obj,
                  std::string* error_msg)
      REQUIRES_SHARED(Locks::mutator_lock_);

  // Given an IndirectRef in the table, return the Object it refers to.
  //
  // This function may abort under error conditions.
  template<ReadBarrierOption kReadBarrierOption = kWithReadBarrier>
  ObjPtr<mirror::Object> Get(IndirectRef iref) const REQUIRES_SHARED(Locks::mutator_lock_)
      ALWAYS_INLINE;

  // Updates an existing indirect reference to point to a new object.
  void Update(IndirectRef iref, ObjPtr<mirror::Object> obj) REQUIRES_SHARED(Locks::mutator_lock_);

  // Remove an existing entry.
  //
  // If the entry is not between the current top index and the bottom index
  // specified by the cookie, we don't remove anything. This is the behavior
  // required by JNI's DeleteLocalRef function.
  //
  // Returns "false" if nothing was removed.
  bool Remove(LRTSegmentState previous_state, IndirectRef iref);

  void AssertEmpty() REQUIRES_SHARED(Locks::mutator_lock_);

  void Dump(std::ostream& os) const
      REQUIRES_SHARED(Locks::mutator_lock_)
      REQUIRES(!Locks::alloc_tracker_lock_);

  IndirectRefKind GetKind() const {
    return kLocal;
  }

  // Return the number of entries in the entire table. This includes holes,
  // and so may be larger than the actual number of "live" entries.
  size_t Capacity() const {
    return segment_state_.top_index;
  }

  // Return the number of non-null entries in the table. Only reliable for a
  // single-segment table.
  int32_t NEntriesForGlobal() {
    return segment_state_.top_index - current_num_holes_;
  }

  // Ensure that at least `free_capacity` elements are available, or return false.
  // The caller ensures free_capacity > 0.
  bool EnsureFreeCapacity(size_t free_capacity, std::string* error_msg)
      REQUIRES_SHARED(Locks::mutator_lock_);
  // See the implementation of EnsureFreeCapacity. We only state here how much is trivially free,
  // without recovering holes. Thus this is a conservative estimate.
  size_t FreeCapacity() const;

  void VisitRoots(RootVisitor* visitor, const RootInfo& root_info)
      REQUIRES_SHARED(Locks::mutator_lock_);

  LRTSegmentState GetSegmentState() const {
    return segment_state_;
  }

  void SetSegmentState(LRTSegmentState new_state);

  static Offset SegmentStateOffset(size_t pointer_size ATTRIBUTE_UNUSED) {
    // Note: Currently segment_state_ is at offset 0. We're testing the expected value in
    // jni_internal_test to make sure it stays correct. It is not OFFSETOF_MEMBER, as that
    // is not pointer-size-safe.
    return Offset(0);
  }

  // Release pages past the end of the table that may have previously held references.
  void Trim() REQUIRES_SHARED(Locks::mutator_lock_);

  // Determine what kind of indirect reference this is. Opposite of EncodeIndirectRefKind.
  ALWAYS_INLINE static inline IndirectRefKind GetIndirectRefKind(IndirectRef iref) {
    return DecodeIndirectRefKind(reinterpret_cast<uintptr_t>(iref));
  }

  /* Reference validation for CheckJNI. */
  bool IsValidReference(IndirectRef, /*out*/std::string* error_msg) const
      REQUIRES_SHARED(Locks::mutator_lock_);

 private:
  static constexpr uint32_t kShiftedSerialMask = (1u << kLRTSerialBits) - 1;

  static constexpr size_t kKindBits = MinimumBitsToStore(
      static_cast<uint32_t>(IndirectRefKind::kLastKind));
  static constexpr uint32_t kKindMask = (1u << kKindBits) - 1;

  static constexpr uintptr_t EncodeIndex(uint32_t table_index) {
    static_assert(sizeof(IndirectRef) == sizeof(uintptr_t), "Unexpected IndirectRef size");
    DCHECK_LE(MinimumBitsToStore(table_index), BitSizeOf<uintptr_t>() - kLRTSerialBits - kKindBits);
    return (static_cast<uintptr_t>(table_index) << kKindBits << kLRTSerialBits);
  }
  static constexpr uint32_t DecodeIndex(uintptr_t uref) {
    return static_cast<uint32_t>((uref >> kKindBits) >> kLRTSerialBits);
  }

  static constexpr uintptr_t EncodeIndirectRefKind(IndirectRefKind kind) {
    return static_cast<uintptr_t>(kind);
  }
  static constexpr IndirectRefKind DecodeIndirectRefKind(uintptr_t uref) {
    return static_cast<IndirectRefKind>(uref & kKindMask);
  }

  static constexpr uintptr_t EncodeSerial(uint32_t serial) {
    DCHECK_LE(MinimumBitsToStore(serial), kLRTSerialBits);
    return serial << kKindBits;
  }
  static constexpr uint32_t DecodeSerial(uintptr_t uref) {
    return static_cast<uint32_t>(uref >> kKindBits) & kShiftedSerialMask;
  }

  constexpr uintptr_t EncodeIndirectRef(uint32_t table_index, uint32_t serial) const {
    DCHECK_LT(table_index, max_entries_);
    return EncodeIndex(table_index) | EncodeSerial(serial) | EncodeIndirectRefKind(kLocal);
  }

  static void ConstexprChecks();

  // Extract the table index from an indirect reference.
  ALWAYS_INLINE static uint32_t ExtractIndex(IndirectRef iref) {
    return DecodeIndex(reinterpret_cast<uintptr_t>(iref));
  }

  IndirectRef ToIndirectRef(uint32_t table_index) const {
    DCHECK_LT(table_index, max_entries_);
    uint32_t serial = table_[table_index].GetSerial();
    return reinterpret_cast<IndirectRef>(EncodeIndirectRef(table_index, serial));
  }

  // Resize the backing table to hold at least `new_size` elements. `new_size` must be
  // larger than the current size. After returning, max_entries_ >= new_size.
  bool Resize(size_t new_size, std::string* error_msg);

  void RecoverHoles(LRTSegmentState from);

  // Abort if check_jni is not enabled. Otherwise, just log as an error.
  static void AbortIfNoCheckJNI(const std::string& msg);

  /* extra debugging checks */
  bool CheckEntry(const char*, IndirectRef, uint32_t) const;

  // Semi-public: read/written by JNI down calls.
  LRTSegmentState segment_state_;

  // Mem map where we store the indirect refs. If it's invalid but table_ is non-null, then
  // table_ is valid and was allocated via `SmallLrtAllocator`.
  MemMap table_mem_map_;
  // Bottom of the stack. Do not directly access the object references in this,
  // as they are roots. Use Get(), which has a read barrier.
  LrtEntry* table_;

  // Maximum number of entries allowed (modulo resizing).
  size_t max_entries_;

  // Some values to retain old behavior with holes. A description of the algorithm is in the .cc
  // file.
  // TODO: Consider other data structures for compact tables, e.g., free lists.
  size_t current_num_holes_;  // Number of holes in the current / top segment.
  LRTSegmentState last_known_previous_state_;
};

}  // namespace jni
}  // namespace art

#endif  // ART_RUNTIME_JNI_LOCAL_REFERENCE_TABLE_H_
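To make the segment-cookie discipline concrete, here is a small standalone model of how Add,
Remove, and a segment pop interact with holes, as described in the table-definition comment above.
This is a sketch, not the real implementation: plain `int` slots stand in for `LrtEntry`, indices
stand in for `IndirectRef`, and hole reuse on Add is deliberately ignored.

#include <cassert>
#include <cstdint>
#include <vector>

// Toy model of the segment/hole behavior: slot value 0 means "hole"; nonzero
// means a live entry. The cookie is the segment's bottom index, playing the
// role of LRTSegmentState.
class ToySegmentTable {
 public:
  uint32_t Add(uint32_t bottom, int value) {
    (void)bottom;  // Additions always go to the current segment, at/after `bottom`.
    slots_.push_back(value);
    return static_cast<uint32_t>(slots_.size() - 1);  // "Reference" = table index.
  }
  bool Remove(uint32_t bottom, uint32_t index) {
    if (index < bottom || index >= slots_.size() || slots_[index] == 0) {
      return false;  // Outside the current segment, or already a hole.
    }
    slots_[index] = 0;
    if (index == slots_.size() - 1) {
      // Removing the top-most entry also strips the holes directly below it,
      // so the top index can drop by more than one.
      while (!slots_.empty() && slots_.back() == 0) slots_.pop_back();
    }
    return true;
  }
  uint32_t TopIndex() const { return static_cast<uint32_t>(slots_.size()); }
  void PopSegment(uint32_t bottom) { slots_.resize(bottom); }  // Drop the whole segment.

 private:
  std::vector<int> slots_;
};

int main() {
  ToySegmentTable t;
  uint32_t cookie = t.TopIndex();  // Push a segment: remember the bottom.
  uint32_t a = t.Add(cookie, 10);
  uint32_t b = t.Add(cookie, 20);
  uint32_t c = t.Add(cookie, 30);
  assert(t.Remove(cookie, b));     // Leaves a hole at `b`.
  assert(t.TopIndex() == 3);       // A hole in the middle keeps the top in place.
  assert(t.Remove(cookie, c));     // Top entry: the hole below is stripped too...
  assert(t.TopIndex() == 1);       // ...so the top drops by two, not one.
  t.PopSegment(cookie);            // Method return: the whole segment is gone.
  assert(t.TopIndex() == 0 && a == 0);
  return 0;
}

This is why Remove takes the `previous_state` cookie: DeleteLocalRef may only remove entries from
the current segment, and a segment pop is a single truncation rather than a walk over the entries.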