src/hotspot/os_cpu/linux_arm/orderAccess_linux_arm.inline.hpp - platform/libcore - Gitiles

 /*
  * Copyright (c) 2008, 2017, Oracle and/or its affiliates. All rights reserved.
  * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
  *
  * This code is free software; you can redistribute it and/or modify it
  * under the terms of the GNU General Public License version 2 only, as
  * published by the Free Software Foundation.
  *
  * This code is distributed in the hope that it will be useful, but WITHOUT
  * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
  * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
  * version 2 for more details (a copy is included in the LICENSE file that
  * accompanied this code).
  *
  * You should have received a copy of the GNU General Public License version
  * 2 along with this work; if not, write to the Free Software Foundation,
  * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
  *
  * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
  * or visit www.oracle.com if you need additional information or have any
  * questions.
  *
  */

 #ifndef OS_CPU_LINUX_ARM_VM_ORDERACCESS_LINUX_ARM_INLINE_HPP
 #define OS_CPU_LINUX_ARM_VM_ORDERACCESS_LINUX_ARM_INLINE_HPP

 #include "runtime/orderAccess.hpp"
 #include "runtime/os.hpp"
 #include "vm_version_arm.hpp"

 // Implementation of class OrderAccess.
 // - we define the high level barriers below and use the general
 //   implementation in orderAccess.inline.hpp, with customizations
 //   on AARCH64 via the specialized_* template functions
 #define VM_HAS_GENERALIZED_ORDER_ACCESS 1

 // Memory Ordering on ARM is weak.
 //
 // Implement all 4 memory ordering barriers by DMB, since it is a
 // lighter version of DSB.
 // dmb_sy implies full system shareability domain. RD/WR access type.
 // dmb_st implies full system shareability domain. WR only access type.
 //
 // NOP on < ARMv6 (MP not supported)
 //
 // Non mcr instructions can be used if we build for armv7 or higher arch
 //    __asm__ __volatile__ ("dmb" : : : "memory");
 //    __asm__ __volatile__ ("dsb" : : : "memory");
 //
 // inline void _OrderAccess_dsb() {
 //    volatile intptr_t dummy = 0;
 //    if (os::is_MP()) {
 //      __asm__ volatile (
 //        "mcr p15, 0, %0, c7, c10, 4"
 //        : : "r" (dummy) : "memory");
 //   }
 // }

 inline static void dmb_sy() {
    if (!os::is_MP()) {
      return;
    }
 #ifdef AARCH64
    __asm__ __volatile__ ("dmb sy" : : : "memory");
 #else
    if (VM_Version::arm_arch() >= 7) {
 #ifdef __thumb__
      __asm__ volatile (
      "dmb sy": : : "memory");
 #else
      __asm__ volatile (
      ".word 0xF57FF050 | 0xf" : : : "memory");
 #endif
    } else {
      intptr_t zero = 0;
      __asm__ volatile (
        "mcr p15, 0, %0, c7, c10, 5"
        : : "r" (zero) : "memory");
    }
 #endif
 }

 inline static void dmb_st() {
    if (!os::is_MP()) {
      return;
    }
 #ifdef AARCH64
    __asm__ __volatile__ ("dmb st" : : : "memory");
 #else
    if (VM_Version::arm_arch() >= 7) {
 #ifdef __thumb__
      __asm__ volatile (
      "dmb st": : : "memory");
 #else
      __asm__ volatile (
      ".word 0xF57FF050 | 0xe" : : : "memory");
 #endif
    } else {
      intptr_t zero = 0;
      __asm__ volatile (
        "mcr p15, 0, %0, c7, c10, 5"
        : : "r" (zero) : "memory");
    }
 #endif
 }

 // Load-Load/Store barrier
 inline static void dmb_ld() {
 #ifdef AARCH64
    if (!os::is_MP()) {
      return;
    }
    __asm__ __volatile__ ("dmb ld" : : : "memory");
 #else
    dmb_sy();
 #endif
 }


 inline void OrderAccess::loadload()   { dmb_ld(); }
 inline void OrderAccess::loadstore()  { dmb_ld(); }
 inline void OrderAccess::acquire()    { dmb_ld(); }
 inline void OrderAccess::storestore() { dmb_st(); }
 inline void OrderAccess::storeload()  { dmb_sy(); }
 inline void OrderAccess::release()    { dmb_sy(); }
 inline void OrderAccess::fence()      { dmb_sy(); }

 // specializations for Aarch64
 // TODO-AARCH64: evaluate effectiveness of ldar*/stlr* implementations compared to 32-bit ARM approach

 #ifdef AARCH64

 template<> inline jbyte    OrderAccess::specialized_load_acquire<jbyte>(const volatile jbyte*   p) {
   volatile jbyte result;
   __asm__ volatile(
     "ldarb %w[res], [%[ptr]]"
     : [res] "=&r" (result)
     : [ptr] "r" (p)
     : "memory");
   return result;
 }

 template<> inline jshort   OrderAccess::specialized_load_acquire<jshort>(const volatile jshort*  p) {
   volatile jshort result;
   __asm__ volatile(
     "ldarh %w[res], [%[ptr]]"
     : [res] "=&r" (result)
     : [ptr] "r" (p)
     : "memory");
   return result;
 }

 template<> inline jint     OrderAccess::specialized_load_acquire<jint>(const volatile jint*    p) {
   volatile jint result;
   __asm__ volatile(
     "ldar %w[res], [%[ptr]]"
     : [res] "=&r" (result)
     : [ptr] "r" (p)
     : "memory");
   return result;
 }

 template<> inline jfloat   OrderAccess::specialized_load_acquire<jfloat>(const volatile jfloat*  p) {
   return jfloat_cast(specialized_load_acquire((const volatile jint*)p));
 }

 // This is implicit as jlong and intptr_t are both "long int"
 //template<> inline jlong    OrderAccess::specialized_load_acquire(const volatile jlong*   p) {
 //  return (volatile jlong)specialized_load_acquire((const volatile intptr_t*)p);
 //}

 template<> inline intptr_t OrderAccess::specialized_load_acquire<intptr_t>(const volatile intptr_t*   p) {
   volatile intptr_t result;
   __asm__ volatile(
     "ldar %[res], [%[ptr]]"
     : [res] "=&r" (result)
     : [ptr] "r" (p)
     : "memory");
   return result;
 }

 template<> inline jdouble  OrderAccess::specialized_load_acquire<jdouble>(const volatile jdouble* p) {
   return jdouble_cast(specialized_load_acquire((const volatile intptr_t*)p));
 }


 template<> inline void     OrderAccess::specialized_release_store<jbyte>(volatile jbyte*   p, jbyte   v) {
   __asm__ volatile(
     "stlrb %w[val], [%[ptr]]"
     :
     : [ptr] "r" (p), [val] "r" (v)
     : "memory");
 }

 template<> inline void     OrderAccess::specialized_release_store<jshort>(volatile jshort*  p, jshort  v) {
   __asm__ volatile(
     "stlrh %w[val], [%[ptr]]"
     :
     : [ptr] "r" (p), [val] "r" (v)
     : "memory");
 }

 template<> inline void     OrderAccess::specialized_release_store<jint>(volatile jint*    p, jint    v) {
   __asm__ volatile(
     "stlr %w[val], [%[ptr]]"
     :
     : [ptr] "r" (p), [val] "r" (v)
     : "memory");
 }

 template<> inline void     OrderAccess::specialized_release_store<jlong>(volatile jlong*   p, jlong   v) {
   __asm__ volatile(
     "stlr %[val], [%[ptr]]"
     :
     : [ptr] "r" (p), [val] "r" (v)
     : "memory");
 }
 #endif // AARCH64

 #endif // OS_CPU_LINUX_ARM_VM_ORDERACCESS_LINUX_ARM_INLINE_HPP
	/*
	* Copyright (c) 2008, 2017, Oracle and/or its affiliates. All rights reserved.
	* DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
	*
	* This code is free software; you can redistribute it and/or modify it
	* under the terms of the GNU General Public License version 2 only, as
	* published by the Free Software Foundation.
	*
	* This code is distributed in the hope that it will be useful, but WITHOUT
	* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
	* FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
	* version 2 for more details (a copy is included in the LICENSE file that
	* accompanied this code).
	*
	* You should have received a copy of the GNU General Public License version
	* 2 along with this work; if not, write to the Free Software Foundation,
	* Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
	*
	* Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
	* or visit www.oracle.com if you need additional information or have any
	* questions.
	*
	*/

	#ifndef OS_CPU_LINUX_ARM_VM_ORDERACCESS_LINUX_ARM_INLINE_HPP
	#define OS_CPU_LINUX_ARM_VM_ORDERACCESS_LINUX_ARM_INLINE_HPP

	#include "runtime/orderAccess.hpp"
	#include "runtime/os.hpp"
	#include "vm_version_arm.hpp"

	// Implementation of class OrderAccess.
	// - we define the high level barriers below and use the general
	// implementation in orderAccess.inline.hpp, with customizations
	// on AARCH64 via the specialized_* template functions
	#define VM_HAS_GENERALIZED_ORDER_ACCESS 1

	// Memory Ordering on ARM is weak.
	//
	// Implement all 4 memory ordering barriers by DMB, since it is a
	// lighter version of DSB.
	// dmb_sy implies full system shareability domain. RD/WR access type.
	// dmb_st implies full system shareability domain. WR only access type.
	//
	// NOP on < ARMv6 (MP not supported)
	//
	// Non mcr instructions can be used if we build for armv7 or higher arch
	// __asm__ __volatile__ ("dmb" : : : "memory");
	// __asm__ __volatile__ ("dsb" : : : "memory");
	//
	// inline void _OrderAccess_dsb() {
	// volatile intptr_t dummy = 0;
	// if (os::is_MP()) {
	// __asm__ volatile (
	// "mcr p15, 0, %0, c7, c10, 4"
	// : : "r" (dummy) : "memory");
	// }
	// }

	inline static void dmb_sy() {
	if (!os::is_MP()) {
	return;
	}
	#ifdef AARCH64
	__asm__ __volatile__ ("dmb sy" : : : "memory");
	#else
	if (VM_Version::arm_arch() >= 7) {
	#ifdef __thumb__
	__asm__ volatile (
	"dmb sy": : : "memory");
	#else
	__asm__ volatile (
	".word 0xF57FF050 \| 0xf" : : : "memory");
	#endif
	} else {
	intptr_t zero = 0;
	__asm__ volatile (
	"mcr p15, 0, %0, c7, c10, 5"
	: : "r" (zero) : "memory");
	}
	#endif
	}

	inline static void dmb_st() {
	if (!os::is_MP()) {
	return;
	}
	#ifdef AARCH64
	__asm__ __volatile__ ("dmb st" : : : "memory");
	#else
	if (VM_Version::arm_arch() >= 7) {
	#ifdef __thumb__
	__asm__ volatile (
	"dmb st": : : "memory");
	#else
	__asm__ volatile (
	".word 0xF57FF050 \| 0xe" : : : "memory");
	#endif
	} else {
	intptr_t zero = 0;
	__asm__ volatile (
	"mcr p15, 0, %0, c7, c10, 5"
	: : "r" (zero) : "memory");
	}
	#endif
	}

	// Load-Load/Store barrier
	inline static void dmb_ld() {
	#ifdef AARCH64
	if (!os::is_MP()) {
	return;
	}
	__asm__ __volatile__ ("dmb ld" : : : "memory");
	#else
	dmb_sy();
	#endif
	}


	inline void OrderAccess::loadload() { dmb_ld(); }
	inline void OrderAccess::loadstore() { dmb_ld(); }
	inline void OrderAccess::acquire() { dmb_ld(); }
	inline void OrderAccess::storestore() { dmb_st(); }
	inline void OrderAccess::storeload() { dmb_sy(); }
	inline void OrderAccess::release() { dmb_sy(); }
	inline void OrderAccess::fence() { dmb_sy(); }

	// specializations for Aarch64
	// TODO-AARCH64: evaluate effectiveness of ldar/stlr implementations compared to 32-bit ARM approach

	#ifdef AARCH64

	template<> inline jbyte OrderAccess::specialized_load_acquire<jbyte>(const volatile jbyte* p) {
	volatile jbyte result;
	__asm__ volatile(
	"ldarb %w[res], [%[ptr]]"
	: [res] "=&r" (result)
	: [ptr] "r" (p)
	: "memory");
	return result;
	}

	template<> inline jshort OrderAccess::specialized_load_acquire<jshort>(const volatile jshort* p) {
	volatile jshort result;
	__asm__ volatile(
	"ldarh %w[res], [%[ptr]]"
	: [res] "=&r" (result)
	: [ptr] "r" (p)
	: "memory");
	return result;
	}

	template<> inline jint OrderAccess::specialized_load_acquire<jint>(const volatile jint* p) {
	volatile jint result;
	__asm__ volatile(
	"ldar %w[res], [%[ptr]]"
	: [res] "=&r" (result)
	: [ptr] "r" (p)
	: "memory");
	return result;
	}

	template<> inline jfloat OrderAccess::specialized_load_acquire<jfloat>(const volatile jfloat* p) {
	return jfloat_cast(specialized_load_acquire((const volatile jint*)p));
	}

	// This is implicit as jlong and intptr_t are both "long int"
	//template<> inline jlong OrderAccess::specialized_load_acquire(const volatile jlong* p) {
	// return (volatile jlong)specialized_load_acquire((const volatile intptr_t*)p);
	//}

	template<> inline intptr_t OrderAccess::specialized_load_acquire<intptr_t>(const volatile intptr_t* p) {
	volatile intptr_t result;
	__asm__ volatile(
	"ldar %[res], [%[ptr]]"
	: [res] "=&r" (result)
	: [ptr] "r" (p)
	: "memory");
	return result;
	}

	template<> inline jdouble OrderAccess::specialized_load_acquire<jdouble>(const volatile jdouble* p) {
	return jdouble_cast(specialized_load_acquire((const volatile intptr_t*)p));
	}


	template<> inline void OrderAccess::specialized_release_store<jbyte>(volatile jbyte* p, jbyte v) {
	__asm__ volatile(
	"stlrb %w[val], [%[ptr]]"
	:
	: [ptr] "r" (p), [val] "r" (v)
	: "memory");
	}

	template<> inline void OrderAccess::specialized_release_store<jshort>(volatile jshort* p, jshort v) {
	__asm__ volatile(
	"stlrh %w[val], [%[ptr]]"
	:
	: [ptr] "r" (p), [val] "r" (v)
	: "memory");
	}

	template<> inline void OrderAccess::specialized_release_store<jint>(volatile jint* p, jint v) {
	__asm__ volatile(
	"stlr %w[val], [%[ptr]]"
	:
	: [ptr] "r" (p), [val] "r" (v)
	: "memory");
	}

	template<> inline void OrderAccess::specialized_release_store<jlong>(volatile jlong* p, jlong v) {
	__asm__ volatile(
	"stlr %[val], [%[ptr]]"
	:
	: [ptr] "r" (p), [val] "r" (v)
	: "memory");
	}
	#endif // AARCH64

	#endif // OS_CPU_LINUX_ARM_VM_ORDERACCESS_LINUX_ARM_INLINE_HPP