• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1 /*
2  * Copyright 2014 The Android Open Source Project
3  *
4  * Licensed under the Apache License, Version 2.0 (the "License");
5  * you may not use this file except in compliance with the License.
6  * You may obtain a copy of the License at
7  *
8  *      http://www.apache.org/licenses/LICENSE-2.0
9  *
10  * Unless required by applicable law or agreed to in writing, software
11  * distributed under the License is distributed on an "AS IS" BASIS,
12  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13  * See the License for the specific language governing permissions and
14  * limitations under the License.
15  */
16 
17 #include "jit_code_cache.h"
18 
19 #include <sstream>
20 
21 #include "art_method-inl.h"
22 #include "base/stl_util.h"
23 #include "base/systrace.h"
24 #include "base/time_utils.h"
25 #include "debugger_interface.h"
26 #include "entrypoints/runtime_asm_entrypoints.h"
27 #include "gc/accounting/bitmap-inl.h"
28 #include "gc/scoped_gc_critical_section.h"
29 #include "jit/jit.h"
30 #include "jit/profiling_info.h"
31 #include "linear_alloc.h"
32 #include "mem_map.h"
33 #include "oat_file-inl.h"
34 #include "scoped_thread_state_change.h"
35 #include "thread_list.h"
36 
37 namespace art {
38 namespace jit {
39 
40 static constexpr int kProtAll = PROT_READ | PROT_WRITE | PROT_EXEC;
41 static constexpr int kProtData = PROT_READ | PROT_WRITE;
42 static constexpr int kProtCode = PROT_READ | PROT_EXEC;
43 
44 static constexpr size_t kCodeSizeLogThreshold = 50 * KB;
45 static constexpr size_t kStackMapSizeLogThreshold = 50 * KB;
46 
47 #define CHECKED_MPROTECT(memory, size, prot)                \
48   do {                                                      \
49     int rc = mprotect(memory, size, prot);                  \
50     if (UNLIKELY(rc != 0)) {                                \
51       errno = rc;                                           \
52       PLOG(FATAL) << "Failed to mprotect jit code cache";   \
53     }                                                       \
54   } while (false)                                           \
55 
Create(size_t initial_capacity,size_t max_capacity,bool generate_debug_info,std::string * error_msg)56 JitCodeCache* JitCodeCache::Create(size_t initial_capacity,
57                                    size_t max_capacity,
58                                    bool generate_debug_info,
59                                    std::string* error_msg) {
60   ScopedTrace trace(__PRETTY_FUNCTION__);
61   CHECK_GE(max_capacity, initial_capacity);
62 
63   // Generating debug information is mostly for using the 'perf' tool, which does
64   // not work with ashmem.
65   bool use_ashmem = !generate_debug_info;
66   // With 'perf', we want a 1-1 mapping between an address and a method.
67   bool garbage_collect_code = !generate_debug_info;
68 
69   // We need to have 32 bit offsets from method headers in code cache which point to things
70   // in the data cache. If the maps are more than 4G apart, having multiple maps wouldn't work.
71   // Ensure we're below 1 GB to be safe.
72   if (max_capacity > 1 * GB) {
73     std::ostringstream oss;
74     oss << "Maxium code cache capacity is limited to 1 GB, "
75         << PrettySize(max_capacity) << " is too big";
76     *error_msg = oss.str();
77     return nullptr;
78   }
79 
80   std::string error_str;
81   // Map name specific for android_os_Debug.cpp accounting.
82   MemMap* data_map = MemMap::MapAnonymous(
83       "data-code-cache", nullptr, max_capacity, kProtAll, false, false, &error_str, use_ashmem);
84   if (data_map == nullptr) {
85     std::ostringstream oss;
86     oss << "Failed to create read write execute cache: " << error_str << " size=" << max_capacity;
87     *error_msg = oss.str();
88     return nullptr;
89   }
90 
91   // Align both capacities to page size, as that's the unit mspaces use.
92   initial_capacity = RoundDown(initial_capacity, 2 * kPageSize);
93   max_capacity = RoundDown(max_capacity, 2 * kPageSize);
94 
95   // Data cache is 1 / 2 of the map.
96   // TODO: Make this variable?
97   size_t data_size = max_capacity / 2;
98   size_t code_size = max_capacity - data_size;
99   DCHECK_EQ(code_size + data_size, max_capacity);
100   uint8_t* divider = data_map->Begin() + data_size;
101 
102   MemMap* code_map =
103       data_map->RemapAtEnd(divider, "jit-code-cache", kProtAll, &error_str, use_ashmem);
104   if (code_map == nullptr) {
105     std::ostringstream oss;
106     oss << "Failed to create read write execute cache: " << error_str << " size=" << max_capacity;
107     *error_msg = oss.str();
108     return nullptr;
109   }
110   DCHECK_EQ(code_map->Begin(), divider);
111   data_size = initial_capacity / 2;
112   code_size = initial_capacity - data_size;
113   DCHECK_EQ(code_size + data_size, initial_capacity);
114   return new JitCodeCache(
115       code_map, data_map, code_size, data_size, max_capacity, garbage_collect_code);
116 }
117 
JitCodeCache(MemMap * code_map,MemMap * data_map,size_t initial_code_capacity,size_t initial_data_capacity,size_t max_capacity,bool garbage_collect_code)118 JitCodeCache::JitCodeCache(MemMap* code_map,
119                            MemMap* data_map,
120                            size_t initial_code_capacity,
121                            size_t initial_data_capacity,
122                            size_t max_capacity,
123                            bool garbage_collect_code)
124     : lock_("Jit code cache", kJitCodeCacheLock),
125       lock_cond_("Jit code cache variable", lock_),
126       collection_in_progress_(false),
127       code_map_(code_map),
128       data_map_(data_map),
129       max_capacity_(max_capacity),
130       current_capacity_(initial_code_capacity + initial_data_capacity),
131       code_end_(initial_code_capacity),
132       data_end_(initial_data_capacity),
133       last_collection_increased_code_cache_(false),
134       last_update_time_ns_(0),
135       garbage_collect_code_(garbage_collect_code),
136       used_memory_for_data_(0),
137       used_memory_for_code_(0),
138       number_of_compilations_(0),
139       number_of_osr_compilations_(0),
140       number_of_deoptimizations_(0),
141       number_of_collections_(0),
142       histogram_stack_map_memory_use_("Memory used for stack maps", 16),
143       histogram_code_memory_use_("Memory used for compiled code", 16),
144       histogram_profiling_info_memory_use_("Memory used for profiling info", 16) {
145 
146   DCHECK_GE(max_capacity, initial_code_capacity + initial_data_capacity);
147   code_mspace_ = create_mspace_with_base(code_map_->Begin(), code_end_, false /*locked*/);
148   data_mspace_ = create_mspace_with_base(data_map_->Begin(), data_end_, false /*locked*/);
149 
150   if (code_mspace_ == nullptr || data_mspace_ == nullptr) {
151     PLOG(FATAL) << "create_mspace_with_base failed";
152   }
153 
154   SetFootprintLimit(current_capacity_);
155 
156   CHECKED_MPROTECT(code_map_->Begin(), code_map_->Size(), kProtCode);
157   CHECKED_MPROTECT(data_map_->Begin(), data_map_->Size(), kProtData);
158 
159   VLOG(jit) << "Created jit code cache: initial data size="
160             << PrettySize(initial_data_capacity)
161             << ", initial code size="
162             << PrettySize(initial_code_capacity);
163 }
164 
ContainsPc(const void * ptr) const165 bool JitCodeCache::ContainsPc(const void* ptr) const {
166   return code_map_->Begin() <= ptr && ptr < code_map_->End();
167 }
168 
ContainsMethod(ArtMethod * method)169 bool JitCodeCache::ContainsMethod(ArtMethod* method) {
170   MutexLock mu(Thread::Current(), lock_);
171   for (auto& it : method_code_map_) {
172     if (it.second == method) {
173       return true;
174     }
175   }
176   return false;
177 }
178 
179 class ScopedCodeCacheWrite : ScopedTrace {
180  public:
ScopedCodeCacheWrite(MemMap * code_map)181   explicit ScopedCodeCacheWrite(MemMap* code_map)
182       : ScopedTrace("ScopedCodeCacheWrite"),
183         code_map_(code_map) {
184     ScopedTrace trace("mprotect all");
185     CHECKED_MPROTECT(code_map_->Begin(), code_map_->Size(), kProtAll);
186   }
~ScopedCodeCacheWrite()187   ~ScopedCodeCacheWrite() {
188     ScopedTrace trace("mprotect code");
189     CHECKED_MPROTECT(code_map_->Begin(), code_map_->Size(), kProtCode);
190   }
191  private:
192   MemMap* const code_map_;
193 
194   DISALLOW_COPY_AND_ASSIGN(ScopedCodeCacheWrite);
195 };
196 
CommitCode(Thread * self,ArtMethod * method,const uint8_t * vmap_table,size_t frame_size_in_bytes,size_t core_spill_mask,size_t fp_spill_mask,const uint8_t * code,size_t code_size,bool osr)197 uint8_t* JitCodeCache::CommitCode(Thread* self,
198                                   ArtMethod* method,
199                                   const uint8_t* vmap_table,
200                                   size_t frame_size_in_bytes,
201                                   size_t core_spill_mask,
202                                   size_t fp_spill_mask,
203                                   const uint8_t* code,
204                                   size_t code_size,
205                                   bool osr) {
206   uint8_t* result = CommitCodeInternal(self,
207                                        method,
208                                        vmap_table,
209                                        frame_size_in_bytes,
210                                        core_spill_mask,
211                                        fp_spill_mask,
212                                        code,
213                                        code_size,
214                                        osr);
215   if (result == nullptr) {
216     // Retry.
217     GarbageCollectCache(self);
218     result = CommitCodeInternal(self,
219                                 method,
220                                 vmap_table,
221                                 frame_size_in_bytes,
222                                 core_spill_mask,
223                                 fp_spill_mask,
224                                 code,
225                                 code_size,
226                                 osr);
227   }
228   return result;
229 }
230 
WaitForPotentialCollectionToComplete(Thread * self)231 bool JitCodeCache::WaitForPotentialCollectionToComplete(Thread* self) {
232   bool in_collection = false;
233   while (collection_in_progress_) {
234     in_collection = true;
235     lock_cond_.Wait(self);
236   }
237   return in_collection;
238 }
239 
FromCodeToAllocation(const void * code)240 static uintptr_t FromCodeToAllocation(const void* code) {
241   size_t alignment = GetInstructionSetAlignment(kRuntimeISA);
242   return reinterpret_cast<uintptr_t>(code) - RoundUp(sizeof(OatQuickMethodHeader), alignment);
243 }
244 
FreeCode(const void * code_ptr,ArtMethod * method ATTRIBUTE_UNUSED)245 void JitCodeCache::FreeCode(const void* code_ptr, ArtMethod* method ATTRIBUTE_UNUSED) {
246   uintptr_t allocation = FromCodeToAllocation(code_ptr);
247   const OatQuickMethodHeader* method_header = OatQuickMethodHeader::FromCodePointer(code_ptr);
248   // Notify native debugger that we are about to remove the code.
249   // It does nothing if we are not using native debugger.
250   DeleteJITCodeEntryForAddress(reinterpret_cast<uintptr_t>(code_ptr));
251 
252   // Use the offset directly to prevent sanity check that the method is
253   // compiled with optimizing.
254   // TODO(ngeoffray): Clean up.
255   if (method_header->vmap_table_offset_ != 0) {
256     const uint8_t* data = method_header->code_ - method_header->vmap_table_offset_;
257     FreeData(const_cast<uint8_t*>(data));
258   }
259   FreeCode(reinterpret_cast<uint8_t*>(allocation));
260 }
261 
RemoveMethodsIn(Thread * self,const LinearAlloc & alloc)262 void JitCodeCache::RemoveMethodsIn(Thread* self, const LinearAlloc& alloc) {
263   ScopedTrace trace(__PRETTY_FUNCTION__);
264   MutexLock mu(self, lock_);
265   // We do not check if a code cache GC is in progress, as this method comes
266   // with the classlinker_classes_lock_ held, and suspending ourselves could
267   // lead to a deadlock.
268   {
269     ScopedCodeCacheWrite scc(code_map_.get());
270     for (auto it = method_code_map_.begin(); it != method_code_map_.end();) {
271       if (alloc.ContainsUnsafe(it->second)) {
272         FreeCode(it->first, it->second);
273         it = method_code_map_.erase(it);
274       } else {
275         ++it;
276       }
277     }
278   }
279   for (auto it = osr_code_map_.begin(); it != osr_code_map_.end();) {
280     if (alloc.ContainsUnsafe(it->first)) {
281       // Note that the code has already been removed in the loop above.
282       it = osr_code_map_.erase(it);
283     } else {
284       ++it;
285     }
286   }
287   for (auto it = profiling_infos_.begin(); it != profiling_infos_.end();) {
288     ProfilingInfo* info = *it;
289     if (alloc.ContainsUnsafe(info->GetMethod())) {
290       info->GetMethod()->SetProfilingInfo(nullptr);
291       FreeData(reinterpret_cast<uint8_t*>(info));
292       it = profiling_infos_.erase(it);
293     } else {
294       ++it;
295     }
296   }
297 }
298 
ClearGcRootsInInlineCaches(Thread * self)299 void JitCodeCache::ClearGcRootsInInlineCaches(Thread* self) {
300   MutexLock mu(self, lock_);
301   for (ProfilingInfo* info : profiling_infos_) {
302     if (!info->IsInUseByCompiler()) {
303       info->ClearGcRootsInInlineCaches();
304     }
305   }
306 }
307 
CommitCodeInternal(Thread * self,ArtMethod * method,const uint8_t * vmap_table,size_t frame_size_in_bytes,size_t core_spill_mask,size_t fp_spill_mask,const uint8_t * code,size_t code_size,bool osr)308 uint8_t* JitCodeCache::CommitCodeInternal(Thread* self,
309                                           ArtMethod* method,
310                                           const uint8_t* vmap_table,
311                                           size_t frame_size_in_bytes,
312                                           size_t core_spill_mask,
313                                           size_t fp_spill_mask,
314                                           const uint8_t* code,
315                                           size_t code_size,
316                                           bool osr) {
317   size_t alignment = GetInstructionSetAlignment(kRuntimeISA);
318   // Ensure the header ends up at expected instruction alignment.
319   size_t header_size = RoundUp(sizeof(OatQuickMethodHeader), alignment);
320   size_t total_size = header_size + code_size;
321 
322   OatQuickMethodHeader* method_header = nullptr;
323   uint8_t* code_ptr = nullptr;
324   uint8_t* memory = nullptr;
325   {
326     ScopedThreadSuspension sts(self, kSuspended);
327     MutexLock mu(self, lock_);
328     WaitForPotentialCollectionToComplete(self);
329     {
330       ScopedCodeCacheWrite scc(code_map_.get());
331       memory = AllocateCode(total_size);
332       if (memory == nullptr) {
333         return nullptr;
334       }
335       code_ptr = memory + header_size;
336 
337       std::copy(code, code + code_size, code_ptr);
338       method_header = OatQuickMethodHeader::FromCodePointer(code_ptr);
339       new (method_header) OatQuickMethodHeader(
340           (vmap_table == nullptr) ? 0 : code_ptr - vmap_table,
341           frame_size_in_bytes,
342           core_spill_mask,
343           fp_spill_mask,
344           code_size);
345     }
346 
347     FlushInstructionCache(reinterpret_cast<char*>(code_ptr),
348                           reinterpret_cast<char*>(code_ptr + code_size));
349     number_of_compilations_++;
350   }
351   // We need to update the entry point in the runnable state for the instrumentation.
352   {
353     MutexLock mu(self, lock_);
354     method_code_map_.Put(code_ptr, method);
355     if (osr) {
356       number_of_osr_compilations_++;
357       osr_code_map_.Put(method, code_ptr);
358     } else {
359       Runtime::Current()->GetInstrumentation()->UpdateMethodsCode(
360           method, method_header->GetEntryPoint());
361     }
362     if (collection_in_progress_) {
363       // We need to update the live bitmap if there is a GC to ensure it sees this new
364       // code.
365       GetLiveBitmap()->AtomicTestAndSet(FromCodeToAllocation(code_ptr));
366     }
367     last_update_time_ns_.StoreRelease(NanoTime());
368     VLOG(jit)
369         << "JIT added (osr=" << std::boolalpha << osr << std::noboolalpha << ") "
370         << PrettyMethod(method) << "@" << method
371         << " ccache_size=" << PrettySize(CodeCacheSizeLocked()) << ": "
372         << " dcache_size=" << PrettySize(DataCacheSizeLocked()) << ": "
373         << reinterpret_cast<const void*>(method_header->GetEntryPoint()) << ","
374         << reinterpret_cast<const void*>(method_header->GetEntryPoint() + method_header->code_size_);
375     histogram_code_memory_use_.AddValue(code_size);
376     if (code_size > kCodeSizeLogThreshold) {
377       LOG(INFO) << "JIT allocated "
378                 << PrettySize(code_size)
379                 << " for compiled code of "
380                 << PrettyMethod(method);
381     }
382   }
383 
384   return reinterpret_cast<uint8_t*>(method_header);
385 }
386 
CodeCacheSize()387 size_t JitCodeCache::CodeCacheSize() {
388   MutexLock mu(Thread::Current(), lock_);
389   return CodeCacheSizeLocked();
390 }
391 
CodeCacheSizeLocked()392 size_t JitCodeCache::CodeCacheSizeLocked() {
393   return used_memory_for_code_;
394 }
395 
DataCacheSize()396 size_t JitCodeCache::DataCacheSize() {
397   MutexLock mu(Thread::Current(), lock_);
398   return DataCacheSizeLocked();
399 }
400 
DataCacheSizeLocked()401 size_t JitCodeCache::DataCacheSizeLocked() {
402   return used_memory_for_data_;
403 }
404 
ClearData(Thread * self,void * data)405 void JitCodeCache::ClearData(Thread* self, void* data) {
406   MutexLock mu(self, lock_);
407   FreeData(reinterpret_cast<uint8_t*>(data));
408 }
409 
ReserveData(Thread * self,size_t size,ArtMethod * method)410 uint8_t* JitCodeCache::ReserveData(Thread* self, size_t size, ArtMethod* method) {
411   size = RoundUp(size, sizeof(void*));
412   uint8_t* result = nullptr;
413 
414   {
415     ScopedThreadSuspension sts(self, kSuspended);
416     MutexLock mu(self, lock_);
417     WaitForPotentialCollectionToComplete(self);
418     result = AllocateData(size);
419   }
420 
421   if (result == nullptr) {
422     // Retry.
423     GarbageCollectCache(self);
424     ScopedThreadSuspension sts(self, kSuspended);
425     MutexLock mu(self, lock_);
426     WaitForPotentialCollectionToComplete(self);
427     result = AllocateData(size);
428   }
429 
430   MutexLock mu(self, lock_);
431   histogram_stack_map_memory_use_.AddValue(size);
432   if (size > kStackMapSizeLogThreshold) {
433     LOG(INFO) << "JIT allocated "
434               << PrettySize(size)
435               << " for stack maps of "
436               << PrettyMethod(method);
437   }
438   return result;
439 }
440 
441 class MarkCodeVisitor FINAL : public StackVisitor {
442  public:
MarkCodeVisitor(Thread * thread_in,JitCodeCache * code_cache_in)443   MarkCodeVisitor(Thread* thread_in, JitCodeCache* code_cache_in)
444       : StackVisitor(thread_in, nullptr, StackVisitor::StackWalkKind::kSkipInlinedFrames),
445         code_cache_(code_cache_in),
446         bitmap_(code_cache_->GetLiveBitmap()) {}
447 
VisitFrame()448   bool VisitFrame() OVERRIDE SHARED_REQUIRES(Locks::mutator_lock_) {
449     const OatQuickMethodHeader* method_header = GetCurrentOatQuickMethodHeader();
450     if (method_header == nullptr) {
451       return true;
452     }
453     const void* code = method_header->GetCode();
454     if (code_cache_->ContainsPc(code)) {
455       // Use the atomic set version, as multiple threads are executing this code.
456       bitmap_->AtomicTestAndSet(FromCodeToAllocation(code));
457     }
458     return true;
459   }
460 
461  private:
462   JitCodeCache* const code_cache_;
463   CodeCacheBitmap* const bitmap_;
464 };
465 
466 class MarkCodeClosure FINAL : public Closure {
467  public:
MarkCodeClosure(JitCodeCache * code_cache,Barrier * barrier)468   MarkCodeClosure(JitCodeCache* code_cache, Barrier* barrier)
469       : code_cache_(code_cache), barrier_(barrier) {}
470 
Run(Thread * thread)471   void Run(Thread* thread) OVERRIDE SHARED_REQUIRES(Locks::mutator_lock_) {
472     ScopedTrace trace(__PRETTY_FUNCTION__);
473     DCHECK(thread == Thread::Current() || thread->IsSuspended());
474     MarkCodeVisitor visitor(thread, code_cache_);
475     visitor.WalkStack();
476     if (kIsDebugBuild) {
477       // The stack walking code queries the side instrumentation stack if it
478       // sees an instrumentation exit pc, so the JIT code of methods in that stack
479       // must have been seen. We sanity check this below.
480       for (const instrumentation::InstrumentationStackFrame& frame
481               : *thread->GetInstrumentationStack()) {
482         // The 'method_' in InstrumentationStackFrame is the one that has return_pc_ in
483         // its stack frame, it is not the method owning return_pc_. We just pass null to
484         // LookupMethodHeader: the method is only checked against in debug builds.
485         OatQuickMethodHeader* method_header =
486             code_cache_->LookupMethodHeader(frame.return_pc_, nullptr);
487         if (method_header != nullptr) {
488           const void* code = method_header->GetCode();
489           CHECK(code_cache_->GetLiveBitmap()->Test(FromCodeToAllocation(code)));
490         }
491       }
492     }
493     barrier_->Pass(Thread::Current());
494   }
495 
496  private:
497   JitCodeCache* const code_cache_;
498   Barrier* const barrier_;
499 };
500 
NotifyCollectionDone(Thread * self)501 void JitCodeCache::NotifyCollectionDone(Thread* self) {
502   collection_in_progress_ = false;
503   lock_cond_.Broadcast(self);
504 }
505 
SetFootprintLimit(size_t new_footprint)506 void JitCodeCache::SetFootprintLimit(size_t new_footprint) {
507   size_t per_space_footprint = new_footprint / 2;
508   DCHECK(IsAlignedParam(per_space_footprint, kPageSize));
509   DCHECK_EQ(per_space_footprint * 2, new_footprint);
510   mspace_set_footprint_limit(data_mspace_, per_space_footprint);
511   {
512     ScopedCodeCacheWrite scc(code_map_.get());
513     mspace_set_footprint_limit(code_mspace_, per_space_footprint);
514   }
515 }
516 
IncreaseCodeCacheCapacity()517 bool JitCodeCache::IncreaseCodeCacheCapacity() {
518   if (current_capacity_ == max_capacity_) {
519     return false;
520   }
521 
522   // Double the capacity if we're below 1MB, or increase it by 1MB if
523   // we're above.
524   if (current_capacity_ < 1 * MB) {
525     current_capacity_ *= 2;
526   } else {
527     current_capacity_ += 1 * MB;
528   }
529   if (current_capacity_ > max_capacity_) {
530     current_capacity_ = max_capacity_;
531   }
532 
533   if (!kIsDebugBuild || VLOG_IS_ON(jit)) {
534     LOG(INFO) << "Increasing code cache capacity to " << PrettySize(current_capacity_);
535   }
536 
537   SetFootprintLimit(current_capacity_);
538 
539   return true;
540 }
541 
MarkCompiledCodeOnThreadStacks(Thread * self)542 void JitCodeCache::MarkCompiledCodeOnThreadStacks(Thread* self) {
543   Barrier barrier(0);
544   size_t threads_running_checkpoint = 0;
545   MarkCodeClosure closure(this, &barrier);
546   threads_running_checkpoint = Runtime::Current()->GetThreadList()->RunCheckpoint(&closure);
547   // Now that we have run our checkpoint, move to a suspended state and wait
548   // for other threads to run the checkpoint.
549   ScopedThreadSuspension sts(self, kSuspended);
550   if (threads_running_checkpoint != 0) {
551     barrier.Increment(self, threads_running_checkpoint);
552   }
553 }
554 
ShouldDoFullCollection()555 bool JitCodeCache::ShouldDoFullCollection() {
556   if (current_capacity_ == max_capacity_) {
557     // Always do a full collection when the code cache is full.
558     return true;
559   } else if (current_capacity_ < kReservedCapacity) {
560     // Always do partial collection when the code cache size is below the reserved
561     // capacity.
562     return false;
563   } else if (last_collection_increased_code_cache_) {
564     // This time do a full collection.
565     return true;
566   } else {
567     // This time do a partial collection.
568     return false;
569   }
570 }
571 
GarbageCollectCache(Thread * self)572 void JitCodeCache::GarbageCollectCache(Thread* self) {
573   ScopedTrace trace(__FUNCTION__);
574   if (!garbage_collect_code_) {
575     MutexLock mu(self, lock_);
576     IncreaseCodeCacheCapacity();
577     return;
578   }
579 
580   // Wait for an existing collection, or let everyone know we are starting one.
581   {
582     ScopedThreadSuspension sts(self, kSuspended);
583     MutexLock mu(self, lock_);
584     if (WaitForPotentialCollectionToComplete(self)) {
585       return;
586     } else {
587       number_of_collections_++;
588       live_bitmap_.reset(CodeCacheBitmap::Create(
589           "code-cache-bitmap",
590           reinterpret_cast<uintptr_t>(code_map_->Begin()),
591           reinterpret_cast<uintptr_t>(code_map_->Begin() + current_capacity_ / 2)));
592       collection_in_progress_ = true;
593     }
594   }
595 
596   TimingLogger logger("JIT code cache timing logger", true, VLOG_IS_ON(jit));
597   {
598     TimingLogger::ScopedTiming st("Code cache collection", &logger);
599 
600     bool do_full_collection = false;
601     {
602       MutexLock mu(self, lock_);
603       do_full_collection = ShouldDoFullCollection();
604     }
605 
606     if (!kIsDebugBuild || VLOG_IS_ON(jit)) {
607       LOG(INFO) << "Do "
608                 << (do_full_collection ? "full" : "partial")
609                 << " code cache collection, code="
610                 << PrettySize(CodeCacheSize())
611                 << ", data=" << PrettySize(DataCacheSize());
612     }
613 
614     DoCollection(self, /* collect_profiling_info */ do_full_collection);
615 
616     if (!kIsDebugBuild || VLOG_IS_ON(jit)) {
617       LOG(INFO) << "After code cache collection, code="
618                 << PrettySize(CodeCacheSize())
619                 << ", data=" << PrettySize(DataCacheSize());
620     }
621 
622     {
623       MutexLock mu(self, lock_);
624 
625       // Increase the code cache only when we do partial collections.
626       // TODO: base this strategy on how full the code cache is?
627       if (do_full_collection) {
628         last_collection_increased_code_cache_ = false;
629       } else {
630         last_collection_increased_code_cache_ = true;
631         IncreaseCodeCacheCapacity();
632       }
633 
634       bool next_collection_will_be_full = ShouldDoFullCollection();
635 
636       // Start polling the liveness of compiled code to prepare for the next full collection.
637       if (next_collection_will_be_full) {
638         // Save the entry point of methods we have compiled, and update the entry
639         // point of those methods to the interpreter. If the method is invoked, the
640         // interpreter will update its entry point to the compiled code and call it.
641         for (ProfilingInfo* info : profiling_infos_) {
642           const void* entry_point = info->GetMethod()->GetEntryPointFromQuickCompiledCode();
643           if (ContainsPc(entry_point)) {
644             info->SetSavedEntryPoint(entry_point);
645             Runtime::Current()->GetInstrumentation()->UpdateMethodsCode(
646                 info->GetMethod(), GetQuickToInterpreterBridge());
647           }
648         }
649 
650         DCHECK(CheckLiveCompiledCodeHasProfilingInfo());
651       }
652       live_bitmap_.reset(nullptr);
653       NotifyCollectionDone(self);
654     }
655   }
656   Runtime::Current()->GetJit()->AddTimingLogger(logger);
657 }
658 
RemoveUnmarkedCode(Thread * self)659 void JitCodeCache::RemoveUnmarkedCode(Thread* self) {
660   ScopedTrace trace(__FUNCTION__);
661   MutexLock mu(self, lock_);
662   ScopedCodeCacheWrite scc(code_map_.get());
663   // Iterate over all compiled code and remove entries that are not marked.
664   for (auto it = method_code_map_.begin(); it != method_code_map_.end();) {
665     const void* code_ptr = it->first;
666     ArtMethod* method = it->second;
667     uintptr_t allocation = FromCodeToAllocation(code_ptr);
668     if (GetLiveBitmap()->Test(allocation)) {
669       ++it;
670     } else {
671       FreeCode(code_ptr, method);
672       it = method_code_map_.erase(it);
673     }
674   }
675 }
676 
DoCollection(Thread * self,bool collect_profiling_info)677 void JitCodeCache::DoCollection(Thread* self, bool collect_profiling_info) {
678   ScopedTrace trace(__FUNCTION__);
679   {
680     MutexLock mu(self, lock_);
681     if (collect_profiling_info) {
682       // Clear the profiling info of methods that do not have compiled code as entrypoint.
683       // Also remove the saved entry point from the ProfilingInfo objects.
684       for (ProfilingInfo* info : profiling_infos_) {
685         const void* ptr = info->GetMethod()->GetEntryPointFromQuickCompiledCode();
686         if (!ContainsPc(ptr) && !info->IsInUseByCompiler()) {
687           info->GetMethod()->SetProfilingInfo(nullptr);
688         }
689 
690         if (info->GetSavedEntryPoint() != nullptr) {
691           info->SetSavedEntryPoint(nullptr);
692           // We are going to move this method back to interpreter. Clear the counter now to
693           // give it a chance to be hot again.
694           info->GetMethod()->ClearCounter();
695         }
696       }
697     } else if (kIsDebugBuild) {
698       // Sanity check that the profiling infos do not have a dangling entry point.
699       for (ProfilingInfo* info : profiling_infos_) {
700         DCHECK(info->GetSavedEntryPoint() == nullptr);
701       }
702     }
703 
704     // Mark compiled code that are entrypoints of ArtMethods. Compiled code that is not
705     // an entry point is either:
706     // - an osr compiled code, that will be removed if not in a thread call stack.
707     // - discarded compiled code, that will be removed if not in a thread call stack.
708     for (const auto& it : method_code_map_) {
709       ArtMethod* method = it.second;
710       const void* code_ptr = it.first;
711       const OatQuickMethodHeader* method_header = OatQuickMethodHeader::FromCodePointer(code_ptr);
712       if (method_header->GetEntryPoint() == method->GetEntryPointFromQuickCompiledCode()) {
713         GetLiveBitmap()->AtomicTestAndSet(FromCodeToAllocation(code_ptr));
714       }
715     }
716 
717     // Empty osr method map, as osr compiled code will be deleted (except the ones
718     // on thread stacks).
719     osr_code_map_.clear();
720   }
721 
722   // Run a checkpoint on all threads to mark the JIT compiled code they are running.
723   MarkCompiledCodeOnThreadStacks(self);
724 
725   // At this point, mutator threads are still running, and entrypoints of methods can
726   // change. We do know they cannot change to a code cache entry that is not marked,
727   // therefore we can safely remove those entries.
728   RemoveUnmarkedCode(self);
729 
730   if (collect_profiling_info) {
731     ScopedThreadSuspension sts(self, kSuspended);
732     gc::ScopedGCCriticalSection gcs(
733         self, gc::kGcCauseJitCodeCache, gc::kCollectorTypeJitCodeCache);
734     MutexLock mu(self, lock_);
735     // Free all profiling infos of methods not compiled nor being compiled.
736     auto profiling_kept_end = std::remove_if(profiling_infos_.begin(), profiling_infos_.end(),
737       [this] (ProfilingInfo* info) NO_THREAD_SAFETY_ANALYSIS {
738         const void* ptr = info->GetMethod()->GetEntryPointFromQuickCompiledCode();
739         // We have previously cleared the ProfilingInfo pointer in the ArtMethod in the hope
740         // that the compiled code would not get revived. As mutator threads run concurrently,
741         // they may have revived the compiled code, and now we are in the situation where
742         // a method has compiled code but no ProfilingInfo.
743         // We make sure compiled methods have a ProfilingInfo object. It is needed for
744         // code cache collection.
745         if (ContainsPc(ptr) && info->GetMethod()->GetProfilingInfo(sizeof(void*)) == nullptr) {
746           // We clear the inline caches as classes in it might be stalled.
747           info->ClearGcRootsInInlineCaches();
748           // Do a fence to make sure the clearing is seen before attaching to the method.
749           QuasiAtomic::ThreadFenceRelease();
750           info->GetMethod()->SetProfilingInfo(info);
751         } else if (info->GetMethod()->GetProfilingInfo(sizeof(void*)) != info) {
752           // No need for this ProfilingInfo object anymore.
753           FreeData(reinterpret_cast<uint8_t*>(info));
754           return true;
755         }
756         return false;
757       });
758     profiling_infos_.erase(profiling_kept_end, profiling_infos_.end());
759     DCHECK(CheckLiveCompiledCodeHasProfilingInfo());
760   }
761 }
762 
CheckLiveCompiledCodeHasProfilingInfo()763 bool JitCodeCache::CheckLiveCompiledCodeHasProfilingInfo() {
764   ScopedTrace trace(__FUNCTION__);
765   // Check that methods we have compiled do have a ProfilingInfo object. We would
766   // have memory leaks of compiled code otherwise.
767   for (const auto& it : method_code_map_) {
768     ArtMethod* method = it.second;
769     if (method->GetProfilingInfo(sizeof(void*)) == nullptr) {
770       const void* code_ptr = it.first;
771       const OatQuickMethodHeader* method_header = OatQuickMethodHeader::FromCodePointer(code_ptr);
772       if (method_header->GetEntryPoint() == method->GetEntryPointFromQuickCompiledCode()) {
773         // If the code is not dead, then we have a problem. Note that this can even
774         // happen just after a collection, as mutator threads are running in parallel
775         // and could deoptimize an existing compiled code.
776         return false;
777       }
778     }
779   }
780   return true;
781 }
782 
LookupMethodHeader(uintptr_t pc,ArtMethod * method)783 OatQuickMethodHeader* JitCodeCache::LookupMethodHeader(uintptr_t pc, ArtMethod* method) {
784   static_assert(kRuntimeISA != kThumb2, "kThumb2 cannot be a runtime ISA");
785   if (kRuntimeISA == kArm) {
786     // On Thumb-2, the pc is offset by one.
787     --pc;
788   }
789   if (!ContainsPc(reinterpret_cast<const void*>(pc))) {
790     return nullptr;
791   }
792 
793   MutexLock mu(Thread::Current(), lock_);
794   if (method_code_map_.empty()) {
795     return nullptr;
796   }
797   auto it = method_code_map_.lower_bound(reinterpret_cast<const void*>(pc));
798   --it;
799 
800   const void* code_ptr = it->first;
801   OatQuickMethodHeader* method_header = OatQuickMethodHeader::FromCodePointer(code_ptr);
802   if (!method_header->Contains(pc)) {
803     return nullptr;
804   }
805   if (kIsDebugBuild && method != nullptr) {
806     DCHECK_EQ(it->second, method)
807         << PrettyMethod(method) << " " << PrettyMethod(it->second) << " " << std::hex << pc;
808   }
809   return method_header;
810 }
811 
LookupOsrMethodHeader(ArtMethod * method)812 OatQuickMethodHeader* JitCodeCache::LookupOsrMethodHeader(ArtMethod* method) {
813   MutexLock mu(Thread::Current(), lock_);
814   auto it = osr_code_map_.find(method);
815   if (it == osr_code_map_.end()) {
816     return nullptr;
817   }
818   return OatQuickMethodHeader::FromCodePointer(it->second);
819 }
820 
AddProfilingInfo(Thread * self,ArtMethod * method,const std::vector<uint32_t> & entries,bool retry_allocation)821 ProfilingInfo* JitCodeCache::AddProfilingInfo(Thread* self,
822                                               ArtMethod* method,
823                                               const std::vector<uint32_t>& entries,
824                                               bool retry_allocation)
825     // No thread safety analysis as we are using TryLock/Unlock explicitly.
826     NO_THREAD_SAFETY_ANALYSIS {
827   ProfilingInfo* info = nullptr;
828   if (!retry_allocation) {
829     // If we are allocating for the interpreter, just try to lock, to avoid
830     // lock contention with the JIT.
831     if (lock_.ExclusiveTryLock(self)) {
832       info = AddProfilingInfoInternal(self, method, entries);
833       lock_.ExclusiveUnlock(self);
834     }
835   } else {
836     {
837       MutexLock mu(self, lock_);
838       info = AddProfilingInfoInternal(self, method, entries);
839     }
840 
841     if (info == nullptr) {
842       GarbageCollectCache(self);
843       MutexLock mu(self, lock_);
844       info = AddProfilingInfoInternal(self, method, entries);
845     }
846   }
847   return info;
848 }
849 
AddProfilingInfoInternal(Thread * self ATTRIBUTE_UNUSED,ArtMethod * method,const std::vector<uint32_t> & entries)850 ProfilingInfo* JitCodeCache::AddProfilingInfoInternal(Thread* self ATTRIBUTE_UNUSED,
851                                                       ArtMethod* method,
852                                                       const std::vector<uint32_t>& entries) {
853   size_t profile_info_size = RoundUp(
854       sizeof(ProfilingInfo) + sizeof(InlineCache) * entries.size(),
855       sizeof(void*));
856 
857   // Check whether some other thread has concurrently created it.
858   ProfilingInfo* info = method->GetProfilingInfo(sizeof(void*));
859   if (info != nullptr) {
860     return info;
861   }
862 
863   uint8_t* data = AllocateData(profile_info_size);
864   if (data == nullptr) {
865     return nullptr;
866   }
867   info = new (data) ProfilingInfo(method, entries);
868 
869   // Make sure other threads see the data in the profiling info object before the
870   // store in the ArtMethod's ProfilingInfo pointer.
871   QuasiAtomic::ThreadFenceRelease();
872 
873   method->SetProfilingInfo(info);
874   profiling_infos_.push_back(info);
875   histogram_profiling_info_memory_use_.AddValue(profile_info_size);
876   return info;
877 }
878 
879 // NO_THREAD_SAFETY_ANALYSIS as this is called from mspace code, at which point the lock
880 // is already held.
MoreCore(const void * mspace,intptr_t increment)881 void* JitCodeCache::MoreCore(const void* mspace, intptr_t increment) NO_THREAD_SAFETY_ANALYSIS {
882   if (code_mspace_ == mspace) {
883     size_t result = code_end_;
884     code_end_ += increment;
885     return reinterpret_cast<void*>(result + code_map_->Begin());
886   } else {
887     DCHECK_EQ(data_mspace_, mspace);
888     size_t result = data_end_;
889     data_end_ += increment;
890     return reinterpret_cast<void*>(result + data_map_->Begin());
891   }
892 }
893 
GetProfiledMethods(const std::set<std::string> & dex_base_locations,std::vector<MethodReference> & methods)894 void JitCodeCache::GetProfiledMethods(const std::set<std::string>& dex_base_locations,
895                                       std::vector<MethodReference>& methods) {
896   ScopedTrace trace(__FUNCTION__);
897   MutexLock mu(Thread::Current(), lock_);
898   for (const ProfilingInfo* info : profiling_infos_) {
899     ArtMethod* method = info->GetMethod();
900     const DexFile* dex_file = method->GetDexFile();
901     if (ContainsElement(dex_base_locations, dex_file->GetBaseLocation())) {
902       methods.emplace_back(dex_file,  method->GetDexMethodIndex());
903     }
904   }
905 }
906 
GetLastUpdateTimeNs() const907 uint64_t JitCodeCache::GetLastUpdateTimeNs() const {
908   return last_update_time_ns_.LoadAcquire();
909 }
910 
IsOsrCompiled(ArtMethod * method)911 bool JitCodeCache::IsOsrCompiled(ArtMethod* method) {
912   MutexLock mu(Thread::Current(), lock_);
913   return osr_code_map_.find(method) != osr_code_map_.end();
914 }
915 
NotifyCompilationOf(ArtMethod * method,Thread * self,bool osr)916 bool JitCodeCache::NotifyCompilationOf(ArtMethod* method, Thread* self, bool osr) {
917   if (!osr && ContainsPc(method->GetEntryPointFromQuickCompiledCode())) {
918     return false;
919   }
920 
921   MutexLock mu(self, lock_);
922   if (osr && (osr_code_map_.find(method) != osr_code_map_.end())) {
923     return false;
924   }
925 
926   ProfilingInfo* info = method->GetProfilingInfo(sizeof(void*));
927   if (info == nullptr) {
928     VLOG(jit) << PrettyMethod(method) << " needs a ProfilingInfo to be compiled";
929     // Because the counter is not atomic, there are some rare cases where we may not
930     // hit the threshold for creating the ProfilingInfo. Reset the counter now to
931     // "correct" this.
932     method->ClearCounter();
933     return false;
934   }
935 
936   if (info->IsMethodBeingCompiled(osr)) {
937     return false;
938   }
939 
940   info->SetIsMethodBeingCompiled(true, osr);
941   return true;
942 }
943 
NotifyCompilerUse(ArtMethod * method,Thread * self)944 ProfilingInfo* JitCodeCache::NotifyCompilerUse(ArtMethod* method, Thread* self) {
945   MutexLock mu(self, lock_);
946   ProfilingInfo* info = method->GetProfilingInfo(sizeof(void*));
947   if (info != nullptr) {
948     info->IncrementInlineUse();
949   }
950   return info;
951 }
952 
DoneCompilerUse(ArtMethod * method,Thread * self)953 void JitCodeCache::DoneCompilerUse(ArtMethod* method, Thread* self) {
954   MutexLock mu(self, lock_);
955   ProfilingInfo* info = method->GetProfilingInfo(sizeof(void*));
956   DCHECK(info != nullptr);
957   info->DecrementInlineUse();
958 }
959 
DoneCompiling(ArtMethod * method,Thread * self ATTRIBUTE_UNUSED,bool osr)960 void JitCodeCache::DoneCompiling(ArtMethod* method, Thread* self ATTRIBUTE_UNUSED, bool osr) {
961   ProfilingInfo* info = method->GetProfilingInfo(sizeof(void*));
962   DCHECK(info->IsMethodBeingCompiled(osr));
963   info->SetIsMethodBeingCompiled(false, osr);
964 }
965 
GetMemorySizeOfCodePointer(const void * ptr)966 size_t JitCodeCache::GetMemorySizeOfCodePointer(const void* ptr) {
967   MutexLock mu(Thread::Current(), lock_);
968   return mspace_usable_size(reinterpret_cast<const void*>(FromCodeToAllocation(ptr)));
969 }
970 
InvalidateCompiledCodeFor(ArtMethod * method,const OatQuickMethodHeader * header)971 void JitCodeCache::InvalidateCompiledCodeFor(ArtMethod* method,
972                                              const OatQuickMethodHeader* header) {
973   ProfilingInfo* profiling_info = method->GetProfilingInfo(sizeof(void*));
974   if ((profiling_info != nullptr) &&
975       (profiling_info->GetSavedEntryPoint() == header->GetEntryPoint())) {
976     // Prevent future uses of the compiled code.
977     profiling_info->SetSavedEntryPoint(nullptr);
978   }
979 
980   if (method->GetEntryPointFromQuickCompiledCode() == header->GetEntryPoint()) {
981     // The entrypoint is the one to invalidate, so we just update
982     // it to the interpreter entry point and clear the counter to get the method
983     // Jitted again.
984     Runtime::Current()->GetInstrumentation()->UpdateMethodsCode(
985         method, GetQuickToInterpreterBridge());
986     method->ClearCounter();
987   } else {
988     MutexLock mu(Thread::Current(), lock_);
989     auto it = osr_code_map_.find(method);
990     if (it != osr_code_map_.end() && OatQuickMethodHeader::FromCodePointer(it->second) == header) {
991       // Remove the OSR method, to avoid using it again.
992       osr_code_map_.erase(it);
993     }
994   }
995   MutexLock mu(Thread::Current(), lock_);
996   number_of_deoptimizations_++;
997 }
998 
AllocateCode(size_t code_size)999 uint8_t* JitCodeCache::AllocateCode(size_t code_size) {
1000   size_t alignment = GetInstructionSetAlignment(kRuntimeISA);
1001   uint8_t* result = reinterpret_cast<uint8_t*>(
1002       mspace_memalign(code_mspace_, alignment, code_size));
1003   size_t header_size = RoundUp(sizeof(OatQuickMethodHeader), alignment);
1004   // Ensure the header ends up at expected instruction alignment.
1005   DCHECK_ALIGNED_PARAM(reinterpret_cast<uintptr_t>(result + header_size), alignment);
1006   used_memory_for_code_ += mspace_usable_size(result);
1007   return result;
1008 }
1009 
FreeCode(uint8_t * code)1010 void JitCodeCache::FreeCode(uint8_t* code) {
1011   used_memory_for_code_ -= mspace_usable_size(code);
1012   mspace_free(code_mspace_, code);
1013 }
1014 
AllocateData(size_t data_size)1015 uint8_t* JitCodeCache::AllocateData(size_t data_size) {
1016   void* result = mspace_malloc(data_mspace_, data_size);
1017   used_memory_for_data_ += mspace_usable_size(result);
1018   return reinterpret_cast<uint8_t*>(result);
1019 }
1020 
FreeData(uint8_t * data)1021 void JitCodeCache::FreeData(uint8_t* data) {
1022   used_memory_for_data_ -= mspace_usable_size(data);
1023   mspace_free(data_mspace_, data);
1024 }
1025 
Dump(std::ostream & os)1026 void JitCodeCache::Dump(std::ostream& os) {
1027   MutexLock mu(Thread::Current(), lock_);
1028   os << "Current JIT code cache size: " << PrettySize(used_memory_for_code_) << "\n"
1029      << "Current JIT data cache size: " << PrettySize(used_memory_for_data_) << "\n"
1030      << "Current JIT capacity: " << PrettySize(current_capacity_) << "\n"
1031      << "Current number of JIT code cache entries: " << method_code_map_.size() << "\n"
1032      << "Total number of JIT compilations: " << number_of_compilations_ << "\n"
1033      << "Total number of JIT compilations for on stack replacement: "
1034         << number_of_osr_compilations_ << "\n"
1035      << "Total number of deoptimizations: " << number_of_deoptimizations_ << "\n"
1036      << "Total number of JIT code cache collections: " << number_of_collections_ << std::endl;
1037   histogram_stack_map_memory_use_.PrintMemoryUse(os);
1038   histogram_code_memory_use_.PrintMemoryUse(os);
1039   histogram_profiling_info_memory_use_.PrintMemoryUse(os);
1040 }
1041 
1042 }  // namespace jit
1043 }  // namespace art
1044