Cache the value of MterpShouldSwitchInterpreters(). Add a field to the Thread object which stores the value instead (negated). Explicitly update the field when relevant state changes (which is rare). This speeds up golem interpreter benchmarks by 3.5% on average, with some benchmarks up to 15% faster. Test: test.py -b -r --interpreter --host Change-Id: If2df0d3bf9e69ab50c30102b2648e997927c34d8

commit: 28f6cff854b61e39f953e69ebf3646ee9826ec82 [log] [tgz]
author: David Srbecky <dsrbecky@google.com> Tue Oct 16 15:07:28 2018 +0100
committer: David Srbecky <dsrbecky@google.com> Mon Oct 22 14:35:07 2018 +0100
tree: a98e2bf1746d93079b7abe54e278ba87f0aef360
parent: 06ef9aa6a562a3a1f7c1f9b91aadda5018f8ba86 [diff] [blame]
diff --git a/runtime/runtime-inl.h b/runtime/runtime-inl.h
index bde0d11..e6cc471 100644
--- a/runtime/runtime-inl.h
+++ b/runtime/runtime-inl.h

@@ -25,7 +25,9 @@
 #include "base/casts.h"
 #include "entrypoints/quick/callee_save_frame.h"
 #include "gc_root-inl.h"
+#include "interpreter/mterp/mterp.h"
 #include "obj_ptr-inl.h"
+#include "thread_list.h"
 
 namespace art {
 
@@ -86,6 +88,15 @@
   return reinterpret_cast64<ArtMethod*>(callee_save_methods_[static_cast<size_t>(type)]);
 }
 
+template<typename Action>
+void Runtime::DoAndMaybeSwitchInterpreter(Action lamda) {
+  MutexLock tll_mu(Thread::Current(), *Locks::thread_list_lock_);
+  lamda();
+  Runtime::Current()->GetThreadList()->ForEach([](Thread* thread, void*) {
+      thread->tls32_.use_mterp.store(interpreter::CanUseMterp());
+  }, nullptr);
+}
+
 }  // namespace art
 
 #endif  // ART_RUNTIME_RUNTIME_INL_H_
commit	28f6cff854b61e39f953e69ebf3646ee9826ec82	[log] [tgz]
author	David Srbecky <dsrbecky@google.com>	Tue Oct 16 15:07:28 2018 +0100
committer	David Srbecky <dsrbecky@google.com>	Mon Oct 22 14:35:07 2018 +0100
tree	a98e2bf1746d93079b7abe54e278ba87f0aef360
parent	06ef9aa6a562a3a1f7c1f9b91aadda5018f8ba86 [diff] [blame]