[PATCH]: Add Hygon Dhyana support
David Holmes
david.holmes at oracle.com
Sat Apr 6 03:55:19 UTC 2019
Hi Fanjinke,
Sorry for the delay in getting to this. I'll help sponsor this for you.
I'll file a bug, import the patch and generate a webrev so that it can
be reviewed more easily (the webrev on github can't be used as it must
be hosted on an OpenJDK site for legal reasons).
Cheers,
David
On 3/04/2019 5:20 pm, Jinke Fan wrote:
> Hello All,
>
> This patch is used to support Hygon Dhyana x86 vendor id (HygonGenuine).
> As Hygon Dhyana CPU share most architecture feature same as AMD Family
> 17h, the patch adds Hygon CPU Vendor ID check to reuse AMD code paths.
>
> Background:
> Chengdu Haiguang IC Design Co., Ltd (Hygon) is a Joint Venture
> between AMD and Haiguang Information Technology Co.,Ltd., aims at
> providing high performance x86 processor for China server market.
> Its first generation processor codename is Dhyana, which
> originates from AMD technology and shares most of the
> architecture with AMD's family 17h, but with different CPU Vendor
> ID("HygonGenuine")/Family series number(Family 18h).
>
> The patch is based on the original repository:
> hg.openjdk.java.net/jdk/jdk
>
> changeset: 54384:cd3b7ad53265
> tag: tip
> user: kvn
> date: Tue Apr 02 09:45:52 2019 -0700
> summary: 8221782: [Graal] Module jdk.internal.vm.compiler.management
> has not been granted accessClassInPackage.jdk.vm.ci.services
>
> Please help me with the commit process.
> Thank you very much!
>
> *patch
> Webrev:
> https://fjkbo.github.io/openjdk/webrev/index.html
>
> The output of hg diff -g:
> diff --git a/src/hotspot/cpu/x86/assembler_x86.cpp
> b/src/hotspot/cpu/x86/assembler_x86.cpp
> --- a/src/hotspot/cpu/x86/assembler_x86.cpp
> +++ b/src/hotspot/cpu/x86/assembler_x86.cpp
> @@ -3099,7 +3099,7 @@
> }
> return;
> }
> - if (UseAddressNop && VM_Version::is_amd()) {
> + if (UseAddressNop && (VM_Version::is_amd() || VM_Version::is_hygon())) {
> //
> // Using multi-bytes nops "0x0F 0x1F [address]" for AMD.
> // 1: 0x90
> diff --git a/src/hotspot/cpu/x86/vm_version_ext_x86.cpp
> b/src/hotspot/cpu/x86/vm_version_ext_x86.cpp
> --- a/src/hotspot/cpu/x86/vm_version_ext_x86.cpp
> +++ b/src/hotspot/cpu/x86/vm_version_ext_x86.cpp
> @@ -340,6 +340,10 @@
> return !is_amd_Barcelona();
> }
>
> + if (is_hygon()) {
> + return true;
> + }
> +
> return false;
> }
>
> diff --git a/src/hotspot/cpu/x86/vm_version_x86.cpp
> b/src/hotspot/cpu/x86/vm_version_x86.cpp
> --- a/src/hotspot/cpu/x86/vm_version_x86.cpp
> +++ b/src/hotspot/cpu/x86/vm_version_x86.cpp
> @@ -1165,7 +1165,7 @@
> }
> }
>
> - if( is_amd() ) { // AMD cpus specific settings
> + if( is_amd() || is_hygon() ) { // AMD cpus specific settings
> if( supports_sse2() && FLAG_IS_DEFAULT(UseAddressNop) ) {
> // Use it on new AMD cpus starting from Opteron.
> UseAddressNop = true;
> @@ -1239,8 +1239,8 @@
> }
> #endif // COMPILER2
>
> - // Some defaults for AMD family 17h
> - if ( cpu_family() == 0x17 ) {
> + // Some defaults for AMD family 17h || Hygon family 18h
> + if ( cpu_family() == 0x17 || cpu_family() == 0x18 ) {
> // On family 17h processors use XMM and UnalignedLoadStores for
> Array Copy
> if (supports_sse2() && FLAG_IS_DEFAULT(UseXMMForArrayCopy)) {
> FLAG_SET_DEFAULT(UseXMMForArrayCopy, true);
> diff --git a/src/hotspot/cpu/x86/vm_version_x86.hpp
> b/src/hotspot/cpu/x86/vm_version_x86.hpp
> --- a/src/hotspot/cpu/x86/vm_version_x86.hpp
> +++ b/src/hotspot/cpu/x86/vm_version_x86.hpp
> @@ -495,13 +495,13 @@
> result |= CPU_CX8;
> if (_cpuid_info.std_cpuid1_edx.bits.cmov != 0)
> result |= CPU_CMOV;
> - if (_cpuid_info.std_cpuid1_edx.bits.fxsr != 0 || (is_amd() &&
> + if (_cpuid_info.std_cpuid1_edx.bits.fxsr != 0 || ((is_amd() ||
> is_hygon()) &&
> _cpuid_info.ext_cpuid1_edx.bits.fxsr != 0))
> result |= CPU_FXSR;
> // HT flag is set for multi-core processors also.
> if (threads_per_core() > 1)
> result |= CPU_HT;
> - if (_cpuid_info.std_cpuid1_edx.bits.mmx != 0 || (is_amd() &&
> + if (_cpuid_info.std_cpuid1_edx.bits.mmx != 0 || ((is_amd() ||
> is_hygon()) &&
> _cpuid_info.ext_cpuid1_edx.bits.mmx != 0))
> result |= CPU_MMX;
> if (_cpuid_info.std_cpuid1_edx.bits.sse != 0)
> @@ -576,8 +576,8 @@
> if (_cpuid_info.std_cpuid1_ecx.bits.fma != 0)
> result |= CPU_FMA;
>
> - // AMD features.
> - if (is_amd()) {
> + // AMD|Hygon features.
> + if (is_amd() || is_hygon()) {
> if ((_cpuid_info.ext_cpuid1_edx.bits.tdnow != 0) ||
> (_cpuid_info.ext_cpuid1_ecx.bits.prefetchw != 0))
> result |= CPU_3DNOW_PREFETCH;
> @@ -711,6 +711,7 @@
> static int cpu_family() { return _cpu;}
> static bool is_P6() { return cpu_family() >= 6; }
> static bool is_amd() { assert_is_initialized(); return
> _cpuid_info.std_vendor_name_0 == 0x68747541; } // 'htuA'
> + static bool is_hygon() { assert_is_initialized(); return
> _cpuid_info.std_vendor_name_0 == 0x6F677948; } // 'ogyH'
> static bool is_intel() { assert_is_initialized(); return
> _cpuid_info.std_vendor_name_0 == 0x756e6547; } // 'uneG'
> static bool is_zx() { assert_is_initialized(); return
> (_cpuid_info.std_vendor_name_0 == 0x746e6543) ||
> (_cpuid_info.std_vendor_name_0 == 0x68532020); } // 'tneC'||'hS '
> static bool is_atom_family() { return ((cpu_family() == 0x06) &&
> ((extended_cpu_model() == 0x36) || (extended_cpu_model() == 0x37) ||
> (extended_cpu_model() == 0x4D))); } //Silvermont and Centerton
> @@ -734,7 +735,7 @@
> if (!supports_topology || result == 0) {
> result = (_cpuid_info.dcp_cpuid4_eax.bits.cores_per_cpu + 1);
> }
> - } else if (is_amd()) {
> + } else if (is_amd() || is_hygon()) {
> result = (_cpuid_info.ext_cpuid8_ecx.bits.cores_per_cpu + 1);
> } else if (is_zx()) {
> bool supports_topology = supports_processor_topology();
> @@ -770,7 +771,7 @@
> intx result = 0;
> if (is_intel()) {
> result = (_cpuid_info.dcp_cpuid4_ebx.bits.L1_line_size + 1);
> - } else if (is_amd()) {
> + } else if (is_amd() || is_hygon()) {
> result = _cpuid_info.ext_cpuid5_ecx.bits.L1_line_size;
> } else if (is_zx()) {
> result = (_cpuid_info.dcp_cpuid4_ebx.bits.L1_line_size + 1);
> @@ -857,7 +858,7 @@
>
> // AMD features
> static bool supports_3dnow_prefetch() { return (_features &
> CPU_3DNOW_PREFETCH) != 0; }
> - static bool supports_mmx_ext() { return is_amd() &&
> _cpuid_info.ext_cpuid1_edx.bits.mmx_amd != 0; }
> + static bool supports_mmx_ext() { return (is_amd()||is_hygon()) &&
> _cpuid_info.ext_cpuid1_edx.bits.mmx_amd != 0; }
> static bool supports_lzcnt() { return (_features & CPU_LZCNT) !=
> 0; }
> static bool supports_sse4a() { return (_features & CPU_SSE4A) !=
> 0; }
>
> @@ -870,7 +871,7 @@
> }
> static bool supports_tscinv() {
> return supports_tscinv_bit() &&
> - ( (is_amd() && !is_amd_Barcelona()) ||
> + ( ((is_amd()||is_hygon()) && !is_amd_Barcelona()) ||
> is_intel_tsc_synched_at_init() );
> }
>
> @@ -896,7 +897,7 @@
> // Core - 256 / prefetchnta
> // It will be used only when AllocatePrefetchStyle > 0
>
> - if (is_amd()) { // AMD
> + if (is_amd() || is_hygon()) { // AMD
> if (supports_sse2()) {
> return 256; // Opteron
> } else {
>
> *test
> I tested it with jtreg and found no regressions.
>
> Base Run:
> ==============================
> Test summary
> ==============================
> TEST TOTAL PASS FAIL ERROR
> jtreg:test/hotspot/jtreg:tier1 1396 1396 0 0
>>> jtreg:test/jdk:tier1 1867 1866 1 0 <<
>>> jtreg:test/langtools:tier1 3920 3919 1 0 <<
> jtreg:test/nashorn:tier1 0 0 0 0
> jtreg:test/jaxp:tier1 0 0 0 0
> ==============================
> TEST FAILURE
>
> And The result of after patching is the same as the before.
> ==============================
> Test summary
> ==============================
> TEST TOTAL PASS FAIL ERROR
> jtreg:test/hotspot/jtreg:tier1 1396 1396 0 0
>>> jtreg:test/jdk:tier1 1867 1866 1 0 <<
>>> jtreg:test/langtools:tier1 3920 3919 1 0 <<
> jtreg:test/nashorn:tier1 0 0 0 0
> jtreg:test/jaxp:tier1 0 0 0 0
> ==============================
> TEST FAILURE
>
> Is there anything incorrectly?
> Please let me know your comments.
>
> Best Regards!
> Fanjinke.
>
More information about the hotspot-dev
mailing list