Make .bss stores atomic release operations.

Rely on architecture-dependent memory ordering for the corresponding
.bss entry loads; on x86-64 the strong memory model makes an explicit
acquire fence unnecessary.

This fixes theoretical races where one thread updates a .bss entry and
another thread uses it immediately thereafter; previously nothing
guaranteed that the data published through the entry was visible to
the second thread.
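
For illustration only (this is not ART code; Resolved, bss_slot,
Publish and TryUse are made-up names), the pattern can be sketched in
portable C++ as a release store on the publishing side paired with an
acquire load on the reading side; on x86-64 both lower to ordinary
movs, which is why the code generator below only documents the
guarantee instead of emitting a fence:

    #include <atomic>

    struct Resolved { int data = 0; };         // stand-in for a resolved entity

    std::atomic<Resolved*> bss_slot{nullptr};  // stand-in for a .bss entry

    // Publisher: initialize the entity, then publish the pointer with a
    // release store so the initialization is ordered before the pointer.
    void Publish(Resolved* r) {
      r->data = 42;
      bss_slot.store(r, std::memory_order_release);
    }

    // Reader: an acquire load pairs with the release store above. On x86-64
    // this lowers to a plain mov, i.e. no explicit memory fence is emitted.
    int TryUse() {
      Resolved* r = bss_slot.load(std::memory_order_acquire);
      return (r != nullptr) ? r->data : -1;    // observes 42 whenever r is seen
    }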

Test: m test-art-host-gtest
Test: testrunner.py --host --optimizing
Test: aosp_taimen-userdebug boots.
Test: run-gtests.sh
Test: testrunner.py --target --optimizing
Change-Id: Ie7b7969eb355025b9c9205f8c936e702861943f4
diff --git a/compiler/optimizing/code_generator_x86_64.cc b/compiler/optimizing/code_generator_x86_64.cc
index bdd080b..17edc74 100644
--- a/compiler/optimizing/code_generator_x86_64.cc
+++ b/compiler/optimizing/code_generator_x86_64.cc
@@ -1015,6 +1015,7 @@
       __ movq(temp.AsRegister<CpuRegister>(),
               Address::Absolute(kDummy32BitOffset, /* no_rip= */ false));
       RecordMethodBssEntryPatch(invoke);
+      // No need for memory fence, thanks to the x86-64 memory model.
       break;
     }
     case HInvokeStaticOrDirect::MethodLoadKind::kJitDirectAddress:
@@ -5980,6 +5981,7 @@
       Label* fixup_label = codegen_->NewTypeBssEntryPatch(cls);
       // /* GcRoot<mirror::Class> */ out = *address  /* PC-relative */
       GenerateGcRootFieldLoad(cls, out_loc, address, fixup_label, read_barrier_option);
+      // No need for memory fence, thanks to the x86-64 memory model.
       generate_null_check = true;
       break;
     }
@@ -6133,6 +6135,7 @@
       Label* fixup_label = codegen_->NewStringBssEntryPatch(load);
       // /* GcRoot<mirror::String> */ out = *address  /* PC-relative */
       GenerateGcRootFieldLoad(load, out_loc, address, fixup_label, kCompilerReadBarrierOption);
+      // No need for memory fence, thanks to the x86-64 memory model.
       SlowPathCode* slow_path = new (codegen_->GetScopedAllocator()) LoadStringSlowPathX86_64(load);
       codegen_->AddSlowPath(slow_path);
       __ testl(out, out);