src/hotspot/cpu/x86/vm_version_x86.cpp
author rkennke
Tue, 25 Sep 2018 16:41:25 +0200
changeset 51868 92960b0e6191
parent 51857 9978fea8a371
child 51976 390f529f4f22
permissions -rw-r--r--
8211061: Tests fail with assert(VM_Version::supports_sse4_1()) on ThreadRipper CPU Reviewed-by: thartmann, roland
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
     1
/*
48489
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
     2
 * Copyright (c) 1997, 2018, Oracle and/or its affiliates. All rights reserved.
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
     3
 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
     4
 *
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
     5
 * This code is free software; you can redistribute it and/or modify it
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
     6
 * under the terms of the GNU General Public License version 2 only, as
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
     7
 * published by the Free Software Foundation.
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
     8
 *
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
     9
 * This code is distributed in the hope that it will be useful, but WITHOUT
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
    10
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
    11
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
    12
 * version 2 for more details (a copy is included in the LICENSE file that
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
    13
 * accompanied this code).
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
    14
 *
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
    15
 * You should have received a copy of the GNU General Public License version
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
    16
 * 2 along with this work; if not, write to the Free Software Foundation,
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
    17
 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
    18
 *
5547
f4b087cbb361 6941466: Oracle rebranding changes for Hotspot repositories
trims
parents: 4430
diff changeset
    19
 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
f4b087cbb361 6941466: Oracle rebranding changes for Hotspot repositories
trims
parents: 4430
diff changeset
    20
 * or visit www.oracle.com if you need additional information or have any
f4b087cbb361 6941466: Oracle rebranding changes for Hotspot repositories
trims
parents: 4430
diff changeset
    21
 * questions.
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
    22
 *
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
    23
 */
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
    24
7397
5b173b4ca846 6989984: Use standard include model for Hospot
stefank
parents: 6418
diff changeset
    25
#include "precompiled.hpp"
47765
b7c7428eaab9 8189610: Reconcile jvm.h and all jvm_md.h between java.base and hotspot
coleenp
parents: 47582
diff changeset
    26
#include "jvm.h"
14626
0cf4eccf130f 8003240: x86: move MacroAssembler into separate file
twisti
parents: 14394
diff changeset
    27
#include "asm/macroAssembler.hpp"
0cf4eccf130f 8003240: x86: move MacroAssembler into separate file
twisti
parents: 14394
diff changeset
    28
#include "asm/macroAssembler.inline.hpp"
37430
fd743dadef12 8151939: VM_Version_init() print buffer is too small
coleenp
parents: 36561
diff changeset
    29
#include "logging/log.hpp"
46701
f559541c0daa 8181917: Refactor UL LogStreams to avoid using resource area
stuefe
parents: 46698
diff changeset
    30
#include "logging/logStream.hpp"
7397
5b173b4ca846 6989984: Use standard include model for Hospot
stefank
parents: 6418
diff changeset
    31
#include "memory/resourceArea.hpp"
5b173b4ca846 6989984: Use standard include model for Hospot
stefank
parents: 6418
diff changeset
    32
#include "runtime/java.hpp"
25949
34557722059b 6424123: JVM crashes on failed 'strdup' call
zgu
parents: 25932
diff changeset
    33
#include "runtime/os.hpp"
7397
5b173b4ca846 6989984: Use standard include model for Hospot
stefank
parents: 6418
diff changeset
    34
#include "runtime/stubCodeGenerator.hpp"
5b173b4ca846 6989984: Use standard include model for Hospot
stefank
parents: 6418
diff changeset
    35
#include "vm_version_x86.hpp"
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
    36
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
    37
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
    38
int VM_Version::_cpu;
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
    39
int VM_Version::_model;
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
    40
int VM_Version::_stepping;
35148
5cfafc99d791 8143072: [JVMCI] Port JVMCI to AArch64
twisti
parents: 35111
diff changeset
    41
VM_Version::CpuidInfo VM_Version::_cpuid_info = { 0, };
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
    42
23487
0f7e268cd9e3 8037226: compiler/7196199/Test7196199.java fails on 32-bit linux with MaxVectorSize > 16
kvn
parents: 23220
diff changeset
    43
// Address of instruction which causes SEGV
0f7e268cd9e3 8037226: compiler/7196199/Test7196199.java fails on 32-bit linux with MaxVectorSize > 16
kvn
parents: 23220
diff changeset
    44
address VM_Version::_cpuinfo_segv_addr = 0;
0f7e268cd9e3 8037226: compiler/7196199/Test7196199.java fails on 32-bit linux with MaxVectorSize > 16
kvn
parents: 23220
diff changeset
    45
// Address of instruction after the one which causes SEGV
0f7e268cd9e3 8037226: compiler/7196199/Test7196199.java fails on 32-bit linux with MaxVectorSize > 16
kvn
parents: 23220
diff changeset
    46
address VM_Version::_cpuinfo_cont_addr = 0;
0f7e268cd9e3 8037226: compiler/7196199/Test7196199.java fails on 32-bit linux with MaxVectorSize > 16
kvn
parents: 23220
diff changeset
    47
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
    48
static BufferBlob* stub_blob;
47582
fde01e0fccb4 8187219: Newer AMD 17h (EPYC) Processor family defaults
kvn
parents: 47216
diff changeset
    49
static const int stub_size = 1100;
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
    50
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
    51
extern "C" {
23527
397b6816032d 8038633: crash in VM_Version::get_processor_features() on startup
kvn
parents: 23491
diff changeset
    52
  typedef void (*get_cpu_info_stub_t)(void*);
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
    53
}
23527
397b6816032d 8038633: crash in VM_Version::get_processor_features() on startup
kvn
parents: 23491
diff changeset
    54
static get_cpu_info_stub_t get_cpu_info_stub = NULL;
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
    55
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
    56
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
    57
class VM_Version_StubGenerator: public StubCodeGenerator {
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
    58
 public:
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
    59
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
    60
  VM_Version_StubGenerator(CodeBuffer *c) : StubCodeGenerator(c) {}
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
    61
23527
397b6816032d 8038633: crash in VM_Version::get_processor_features() on startup
kvn
parents: 23491
diff changeset
    62
  address generate_get_cpu_info() {
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
    63
    // Flags to test CPU type.
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
    64
    const uint32_t HS_EFL_AC = 0x40000;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
    65
    const uint32_t HS_EFL_ID = 0x200000;
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
    66
    // Values for when we don't have a CPUID instruction.
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
    67
    const int      CPU_FAMILY_SHIFT = 8;
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
    68
    const uint32_t CPU_FAMILY_386 = (3 << CPU_FAMILY_SHIFT);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
    69
    const uint32_t CPU_FAMILY_486 = (4 << CPU_FAMILY_SHIFT);
42586
e14fee6a1839 8170039: Change UseAVX < 3 on SKX/KNL to not emit evex vector check
mcberg
parents: 42076
diff changeset
    70
    bool use_evex = FLAG_IS_DEFAULT(UseAVX) || (UseAVX > 2);
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
    71
5902
ba0c3b725081 6964774: Adjust optimization flags setting
kvn
parents: 5547
diff changeset
    72
    Label detect_486, cpu486, detect_586, std_cpuid1, std_cpuid4;
47582
fde01e0fccb4 8187219: Newer AMD 17h (EPYC) Processor family defaults
kvn
parents: 47216
diff changeset
    73
    Label sef_cpuid, ext_cpuid, ext_cpuid1, ext_cpuid5, ext_cpuid7, ext_cpuid8, done, wrapup;
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
    74
    Label legacy_setup, save_restore_except, legacy_save_restore, start_simd_check;
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
    75
23527
397b6816032d 8038633: crash in VM_Version::get_processor_features() on startup
kvn
parents: 23491
diff changeset
    76
    StubCodeMark mark(this, "VM_Version", "get_cpu_info_stub");
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
    77
#   define __ _masm->
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
    78
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
    79
    address start = __ pc();
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
    80
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
    81
    //
23527
397b6816032d 8038633: crash in VM_Version::get_processor_features() on startup
kvn
parents: 23491
diff changeset
    82
    // void get_cpu_info(VM_Version::CpuidInfo* cpuid_info);
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
    83
    //
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
    84
    // LP64: rcx and rdx are first and second argument registers on windows
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
    85
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
    86
    __ push(rbp);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
    87
#ifdef _LP64
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
    88
    __ mov(rbp, c_rarg0); // cpuid_info address
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
    89
#else
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
    90
    __ movptr(rbp, Address(rsp, 8)); // cpuid_info address
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
    91
#endif
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
    92
    __ push(rbx);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
    93
    __ push(rsi);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
    94
    __ pushf();          // preserve rbx, and flags
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
    95
    __ pop(rax);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
    96
    __ push(rax);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
    97
    __ mov(rcx, rax);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
    98
    //
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
    99
    // if we are unable to change the AC flag, we have a 386
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   100
    //
11881
9642744ae9a5 7132070: Use a mach_port_t as the OSThread thread_id rather than pthread_t on BSD/OSX
sla
parents: 11439
diff changeset
   101
    __ xorl(rax, HS_EFL_AC);
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   102
    __ push(rax);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   103
    __ popf();
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   104
    __ pushf();
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   105
    __ pop(rax);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   106
    __ cmpptr(rax, rcx);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   107
    __ jccb(Assembler::notEqual, detect_486);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   108
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   109
    __ movl(rax, CPU_FAMILY_386);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   110
    __ movl(Address(rbp, in_bytes(VM_Version::std_cpuid1_offset())), rax);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   111
    __ jmp(done);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   112
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   113
    //
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   114
    // If we are unable to change the ID flag, we have a 486 which does
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   115
    // not support the "cpuid" instruction.
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   116
    //
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   117
    __ bind(detect_486);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   118
    __ mov(rax, rcx);
11881
9642744ae9a5 7132070: Use a mach_port_t as the OSThread thread_id rather than pthread_t on BSD/OSX
sla
parents: 11439
diff changeset
   119
    __ xorl(rax, HS_EFL_ID);
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   120
    __ push(rax);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   121
    __ popf();
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   122
    __ pushf();
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   123
    __ pop(rax);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   124
    __ cmpptr(rcx, rax);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   125
    __ jccb(Assembler::notEqual, detect_586);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   126
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   127
    __ bind(cpu486);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   128
    __ movl(rax, CPU_FAMILY_486);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   129
    __ movl(Address(rbp, in_bytes(VM_Version::std_cpuid1_offset())), rax);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   130
    __ jmp(done);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   131
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   132
    //
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   133
    // At this point, we have a chip which supports the "cpuid" instruction
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   134
    //
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   135
    __ bind(detect_586);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   136
    __ xorl(rax, rax);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   137
    __ cpuid();
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   138
    __ orl(rax, rax);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   139
    __ jcc(Assembler::equal, cpu486);   // if cpuid doesn't support an input
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   140
                                        // value of at least 1, we give up and
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   141
                                        // assume a 486
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   142
    __ lea(rsi, Address(rbp, in_bytes(VM_Version::std_cpuid0_offset())));
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   143
    __ movl(Address(rsi, 0), rax);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   144
    __ movl(Address(rsi, 4), rbx);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   145
    __ movl(Address(rsi, 8), rcx);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   146
    __ movl(Address(rsi,12), rdx);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   147
5902
ba0c3b725081 6964774: Adjust optimization flags setting
kvn
parents: 5547
diff changeset
   148
    __ cmpl(rax, 0xa);                  // Is cpuid(0xB) supported?
ba0c3b725081 6964774: Adjust optimization flags setting
kvn
parents: 5547
diff changeset
   149
    __ jccb(Assembler::belowEqual, std_cpuid4);
ba0c3b725081 6964774: Adjust optimization flags setting
kvn
parents: 5547
diff changeset
   150
ba0c3b725081 6964774: Adjust optimization flags setting
kvn
parents: 5547
diff changeset
   151
    //
ba0c3b725081 6964774: Adjust optimization flags setting
kvn
parents: 5547
diff changeset
   152
    // cpuid(0xB) Processor Topology
ba0c3b725081 6964774: Adjust optimization flags setting
kvn
parents: 5547
diff changeset
   153
    //
ba0c3b725081 6964774: Adjust optimization flags setting
kvn
parents: 5547
diff changeset
   154
    __ movl(rax, 0xb);
ba0c3b725081 6964774: Adjust optimization flags setting
kvn
parents: 5547
diff changeset
   155
    __ xorl(rcx, rcx);   // Threads level
ba0c3b725081 6964774: Adjust optimization flags setting
kvn
parents: 5547
diff changeset
   156
    __ cpuid();
ba0c3b725081 6964774: Adjust optimization flags setting
kvn
parents: 5547
diff changeset
   157
ba0c3b725081 6964774: Adjust optimization flags setting
kvn
parents: 5547
diff changeset
   158
    __ lea(rsi, Address(rbp, in_bytes(VM_Version::tpl_cpuidB0_offset())));
ba0c3b725081 6964774: Adjust optimization flags setting
kvn
parents: 5547
diff changeset
   159
    __ movl(Address(rsi, 0), rax);
ba0c3b725081 6964774: Adjust optimization flags setting
kvn
parents: 5547
diff changeset
   160
    __ movl(Address(rsi, 4), rbx);
ba0c3b725081 6964774: Adjust optimization flags setting
kvn
parents: 5547
diff changeset
   161
    __ movl(Address(rsi, 8), rcx);
ba0c3b725081 6964774: Adjust optimization flags setting
kvn
parents: 5547
diff changeset
   162
    __ movl(Address(rsi,12), rdx);
ba0c3b725081 6964774: Adjust optimization flags setting
kvn
parents: 5547
diff changeset
   163
ba0c3b725081 6964774: Adjust optimization flags setting
kvn
parents: 5547
diff changeset
   164
    __ movl(rax, 0xb);
ba0c3b725081 6964774: Adjust optimization flags setting
kvn
parents: 5547
diff changeset
   165
    __ movl(rcx, 1);     // Cores level
ba0c3b725081 6964774: Adjust optimization flags setting
kvn
parents: 5547
diff changeset
   166
    __ cpuid();
ba0c3b725081 6964774: Adjust optimization flags setting
kvn
parents: 5547
diff changeset
   167
    __ push(rax);
ba0c3b725081 6964774: Adjust optimization flags setting
kvn
parents: 5547
diff changeset
   168
    __ andl(rax, 0x1f);  // Determine if valid topology level
ba0c3b725081 6964774: Adjust optimization flags setting
kvn
parents: 5547
diff changeset
   169
    __ orl(rax, rbx);    // eax[4:0] | ebx[0:15] == 0 indicates invalid level
ba0c3b725081 6964774: Adjust optimization flags setting
kvn
parents: 5547
diff changeset
   170
    __ andl(rax, 0xffff);
ba0c3b725081 6964774: Adjust optimization flags setting
kvn
parents: 5547
diff changeset
   171
    __ pop(rax);
ba0c3b725081 6964774: Adjust optimization flags setting
kvn
parents: 5547
diff changeset
   172
    __ jccb(Assembler::equal, std_cpuid4);
ba0c3b725081 6964774: Adjust optimization flags setting
kvn
parents: 5547
diff changeset
   173
ba0c3b725081 6964774: Adjust optimization flags setting
kvn
parents: 5547
diff changeset
   174
    __ lea(rsi, Address(rbp, in_bytes(VM_Version::tpl_cpuidB1_offset())));
ba0c3b725081 6964774: Adjust optimization flags setting
kvn
parents: 5547
diff changeset
   175
    __ movl(Address(rsi, 0), rax);
ba0c3b725081 6964774: Adjust optimization flags setting
kvn
parents: 5547
diff changeset
   176
    __ movl(Address(rsi, 4), rbx);
ba0c3b725081 6964774: Adjust optimization flags setting
kvn
parents: 5547
diff changeset
   177
    __ movl(Address(rsi, 8), rcx);
ba0c3b725081 6964774: Adjust optimization flags setting
kvn
parents: 5547
diff changeset
   178
    __ movl(Address(rsi,12), rdx);
ba0c3b725081 6964774: Adjust optimization flags setting
kvn
parents: 5547
diff changeset
   179
ba0c3b725081 6964774: Adjust optimization flags setting
kvn
parents: 5547
diff changeset
   180
    __ movl(rax, 0xb);
ba0c3b725081 6964774: Adjust optimization flags setting
kvn
parents: 5547
diff changeset
   181
    __ movl(rcx, 2);     // Packages level
ba0c3b725081 6964774: Adjust optimization flags setting
kvn
parents: 5547
diff changeset
   182
    __ cpuid();
ba0c3b725081 6964774: Adjust optimization flags setting
kvn
parents: 5547
diff changeset
   183
    __ push(rax);
ba0c3b725081 6964774: Adjust optimization flags setting
kvn
parents: 5547
diff changeset
   184
    __ andl(rax, 0x1f);  // Determine if valid topology level
ba0c3b725081 6964774: Adjust optimization flags setting
kvn
parents: 5547
diff changeset
   185
    __ orl(rax, rbx);    // eax[4:0] | ebx[0:15] == 0 indicates invalid level
ba0c3b725081 6964774: Adjust optimization flags setting
kvn
parents: 5547
diff changeset
   186
    __ andl(rax, 0xffff);
ba0c3b725081 6964774: Adjust optimization flags setting
kvn
parents: 5547
diff changeset
   187
    __ pop(rax);
ba0c3b725081 6964774: Adjust optimization flags setting
kvn
parents: 5547
diff changeset
   188
    __ jccb(Assembler::equal, std_cpuid4);
ba0c3b725081 6964774: Adjust optimization flags setting
kvn
parents: 5547
diff changeset
   189
ba0c3b725081 6964774: Adjust optimization flags setting
kvn
parents: 5547
diff changeset
   190
    __ lea(rsi, Address(rbp, in_bytes(VM_Version::tpl_cpuidB2_offset())));
ba0c3b725081 6964774: Adjust optimization flags setting
kvn
parents: 5547
diff changeset
   191
    __ movl(Address(rsi, 0), rax);
ba0c3b725081 6964774: Adjust optimization flags setting
kvn
parents: 5547
diff changeset
   192
    __ movl(Address(rsi, 4), rbx);
ba0c3b725081 6964774: Adjust optimization flags setting
kvn
parents: 5547
diff changeset
   193
    __ movl(Address(rsi, 8), rcx);
ba0c3b725081 6964774: Adjust optimization flags setting
kvn
parents: 5547
diff changeset
   194
    __ movl(Address(rsi,12), rdx);
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   195
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   196
    //
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   197
    // cpuid(0x4) Deterministic cache params
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   198
    //
5902
ba0c3b725081 6964774: Adjust optimization flags setting
kvn
parents: 5547
diff changeset
   199
    __ bind(std_cpuid4);
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   200
    __ movl(rax, 4);
5902
ba0c3b725081 6964774: Adjust optimization flags setting
kvn
parents: 5547
diff changeset
   201
    __ cmpl(rax, Address(rbp, in_bytes(VM_Version::std_cpuid0_offset()))); // Is cpuid(0x4) supported?
ba0c3b725081 6964774: Adjust optimization flags setting
kvn
parents: 5547
diff changeset
   202
    __ jccb(Assembler::greater, std_cpuid1);
ba0c3b725081 6964774: Adjust optimization flags setting
kvn
parents: 5547
diff changeset
   203
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   204
    __ xorl(rcx, rcx);   // L1 cache
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   205
    __ cpuid();
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   206
    __ push(rax);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   207
    __ andl(rax, 0x1f);  // Determine if valid cache parameters used
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   208
    __ orl(rax, rax);    // eax[4:0] == 0 indicates invalid cache
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   209
    __ pop(rax);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   210
    __ jccb(Assembler::equal, std_cpuid1);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   211
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   212
    __ lea(rsi, Address(rbp, in_bytes(VM_Version::dcp_cpuid4_offset())));
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   213
    __ movl(Address(rsi, 0), rax);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   214
    __ movl(Address(rsi, 4), rbx);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   215
    __ movl(Address(rsi, 8), rcx);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   216
    __ movl(Address(rsi,12), rdx);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   217
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   218
    //
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   219
    // Standard cpuid(0x1)
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   220
    //
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   221
    __ bind(std_cpuid1);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   222
    __ movl(rax, 1);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   223
    __ cpuid();
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   224
    __ lea(rsi, Address(rbp, in_bytes(VM_Version::std_cpuid1_offset())));
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   225
    __ movl(Address(rsi, 0), rax);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   226
    __ movl(Address(rsi, 4), rbx);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   227
    __ movl(Address(rsi, 8), rcx);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   228
    __ movl(Address(rsi,12), rdx);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   229
11427
bf248009cbbe 7116452: Add support for AVX instructions
kvn
parents: 10565
diff changeset
   230
    //
bf248009cbbe 7116452: Add support for AVX instructions
kvn
parents: 10565
diff changeset
   231
    // Check if OS has enabled XGETBV instruction to access XCR0
bf248009cbbe 7116452: Add support for AVX instructions
kvn
parents: 10565
diff changeset
   232
    // (OSXSAVE feature flag) and CPU supports AVX
bf248009cbbe 7116452: Add support for AVX instructions
kvn
parents: 10565
diff changeset
   233
    //
23487
0f7e268cd9e3 8037226: compiler/7196199/Test7196199.java fails on 32-bit linux with MaxVectorSize > 16
kvn
parents: 23220
diff changeset
   234
    __ andl(rcx, 0x18000000); // cpuid1 bits osxsave | avx
11427
bf248009cbbe 7116452: Add support for AVX instructions
kvn
parents: 10565
diff changeset
   235
    __ cmpl(rcx, 0x18000000);
23487
0f7e268cd9e3 8037226: compiler/7196199/Test7196199.java fails on 32-bit linux with MaxVectorSize > 16
kvn
parents: 23220
diff changeset
   236
    __ jccb(Assembler::notEqual, sef_cpuid); // jump if AVX is not supported
11427
bf248009cbbe 7116452: Add support for AVX instructions
kvn
parents: 10565
diff changeset
   237
bf248009cbbe 7116452: Add support for AVX instructions
kvn
parents: 10565
diff changeset
   238
    //
bf248009cbbe 7116452: Add support for AVX instructions
kvn
parents: 10565
diff changeset
   239
    // XCR0, XFEATURE_ENABLED_MASK register
bf248009cbbe 7116452: Add support for AVX instructions
kvn
parents: 10565
diff changeset
   240
    //
bf248009cbbe 7116452: Add support for AVX instructions
kvn
parents: 10565
diff changeset
   241
    __ xorl(rcx, rcx);   // zero for XCR0 register
bf248009cbbe 7116452: Add support for AVX instructions
kvn
parents: 10565
diff changeset
   242
    __ xgetbv();
bf248009cbbe 7116452: Add support for AVX instructions
kvn
parents: 10565
diff changeset
   243
    __ lea(rsi, Address(rbp, in_bytes(VM_Version::xem_xcr0_offset())));
bf248009cbbe 7116452: Add support for AVX instructions
kvn
parents: 10565
diff changeset
   244
    __ movl(Address(rsi, 0), rax);
bf248009cbbe 7116452: Add support for AVX instructions
kvn
parents: 10565
diff changeset
   245
    __ movl(Address(rsi, 4), rdx);
bf248009cbbe 7116452: Add support for AVX instructions
kvn
parents: 10565
diff changeset
   246
bf248009cbbe 7116452: Add support for AVX instructions
kvn
parents: 10565
diff changeset
   247
    //
bf248009cbbe 7116452: Add support for AVX instructions
kvn
parents: 10565
diff changeset
   248
    // cpuid(0x7) Structured Extended Features
bf248009cbbe 7116452: Add support for AVX instructions
kvn
parents: 10565
diff changeset
   249
    //
bf248009cbbe 7116452: Add support for AVX instructions
kvn
parents: 10565
diff changeset
   250
    __ bind(sef_cpuid);
bf248009cbbe 7116452: Add support for AVX instructions
kvn
parents: 10565
diff changeset
   251
    __ movl(rax, 7);
bf248009cbbe 7116452: Add support for AVX instructions
kvn
parents: 10565
diff changeset
   252
    __ cmpl(rax, Address(rbp, in_bytes(VM_Version::std_cpuid0_offset()))); // Is cpuid(0x7) supported?
bf248009cbbe 7116452: Add support for AVX instructions
kvn
parents: 10565
diff changeset
   253
    __ jccb(Assembler::greater, ext_cpuid);
bf248009cbbe 7116452: Add support for AVX instructions
kvn
parents: 10565
diff changeset
   254
bf248009cbbe 7116452: Add support for AVX instructions
kvn
parents: 10565
diff changeset
   255
    __ xorl(rcx, rcx);
bf248009cbbe 7116452: Add support for AVX instructions
kvn
parents: 10565
diff changeset
   256
    __ cpuid();
bf248009cbbe 7116452: Add support for AVX instructions
kvn
parents: 10565
diff changeset
   257
    __ lea(rsi, Address(rbp, in_bytes(VM_Version::sef_cpuid7_offset())));
bf248009cbbe 7116452: Add support for AVX instructions
kvn
parents: 10565
diff changeset
   258
    __ movl(Address(rsi, 0), rax);
bf248009cbbe 7116452: Add support for AVX instructions
kvn
parents: 10565
diff changeset
   259
    __ movl(Address(rsi, 4), rbx);
49384
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48490
diff changeset
   260
    __ movl(Address(rsi, 8), rcx);
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48490
diff changeset
   261
    __ movl(Address(rsi, 12), rdx);
11427
bf248009cbbe 7116452: Add support for AVX instructions
kvn
parents: 10565
diff changeset
   262
bf248009cbbe 7116452: Add support for AVX instructions
kvn
parents: 10565
diff changeset
   263
    //
bf248009cbbe 7116452: Add support for AVX instructions
kvn
parents: 10565
diff changeset
   264
    // Extended cpuid(0x80000000)
bf248009cbbe 7116452: Add support for AVX instructions
kvn
parents: 10565
diff changeset
   265
    //
bf248009cbbe 7116452: Add support for AVX instructions
kvn
parents: 10565
diff changeset
   266
    __ bind(ext_cpuid);
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   267
    __ movl(rax, 0x80000000);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   268
    __ cpuid();
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   269
    __ cmpl(rax, 0x80000000);     // Is cpuid(0x80000001) supported?
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   270
    __ jcc(Assembler::belowEqual, done);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   271
    __ cmpl(rax, 0x80000004);     // Is cpuid(0x80000005) supported?
47582
fde01e0fccb4 8187219: Newer AMD 17h (EPYC) Processor family defaults
kvn
parents: 47216
diff changeset
   272
    __ jcc(Assembler::belowEqual, ext_cpuid1);
11417
4ecc3253bec4 7125934: Add a fast unordered timestamp capability to Hotspot on x86/x64
phh
parents: 10565
diff changeset
   273
    __ cmpl(rax, 0x80000006);     // Is cpuid(0x80000007) supported?
4ecc3253bec4 7125934: Add a fast unordered timestamp capability to Hotspot on x86/x64
phh
parents: 10565
diff changeset
   274
    __ jccb(Assembler::belowEqual, ext_cpuid5);
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   275
    __ cmpl(rax, 0x80000007);     // Is cpuid(0x80000008) supported?
11417
4ecc3253bec4 7125934: Add a fast unordered timestamp capability to Hotspot on x86/x64
phh
parents: 10565
diff changeset
   276
    __ jccb(Assembler::belowEqual, ext_cpuid7);
47582
fde01e0fccb4 8187219: Newer AMD 17h (EPYC) Processor family defaults
kvn
parents: 47216
diff changeset
   277
    __ cmpl(rax, 0x80000008);     // Is cpuid(0x80000009 and above) supported?
fde01e0fccb4 8187219: Newer AMD 17h (EPYC) Processor family defaults
kvn
parents: 47216
diff changeset
   278
    __ jccb(Assembler::belowEqual, ext_cpuid8);
fde01e0fccb4 8187219: Newer AMD 17h (EPYC) Processor family defaults
kvn
parents: 47216
diff changeset
   279
    __ cmpl(rax, 0x8000001E);     // Is cpuid(0x8000001E) supported?
fde01e0fccb4 8187219: Newer AMD 17h (EPYC) Processor family defaults
kvn
parents: 47216
diff changeset
   280
    __ jccb(Assembler::below, ext_cpuid8);
fde01e0fccb4 8187219: Newer AMD 17h (EPYC) Processor family defaults
kvn
parents: 47216
diff changeset
   281
    //
fde01e0fccb4 8187219: Newer AMD 17h (EPYC) Processor family defaults
kvn
parents: 47216
diff changeset
   282
    // Extended cpuid(0x8000001E)
fde01e0fccb4 8187219: Newer AMD 17h (EPYC) Processor family defaults
kvn
parents: 47216
diff changeset
   283
    //
fde01e0fccb4 8187219: Newer AMD 17h (EPYC) Processor family defaults
kvn
parents: 47216
diff changeset
   284
    __ movl(rax, 0x8000001E);
fde01e0fccb4 8187219: Newer AMD 17h (EPYC) Processor family defaults
kvn
parents: 47216
diff changeset
   285
    __ cpuid();
fde01e0fccb4 8187219: Newer AMD 17h (EPYC) Processor family defaults
kvn
parents: 47216
diff changeset
   286
    __ lea(rsi, Address(rbp, in_bytes(VM_Version::ext_cpuid1E_offset())));
fde01e0fccb4 8187219: Newer AMD 17h (EPYC) Processor family defaults
kvn
parents: 47216
diff changeset
   287
    __ movl(Address(rsi, 0), rax);
fde01e0fccb4 8187219: Newer AMD 17h (EPYC) Processor family defaults
kvn
parents: 47216
diff changeset
   288
    __ movl(Address(rsi, 4), rbx);
fde01e0fccb4 8187219: Newer AMD 17h (EPYC) Processor family defaults
kvn
parents: 47216
diff changeset
   289
    __ movl(Address(rsi, 8), rcx);
fde01e0fccb4 8187219: Newer AMD 17h (EPYC) Processor family defaults
kvn
parents: 47216
diff changeset
   290
    __ movl(Address(rsi,12), rdx);
fde01e0fccb4 8187219: Newer AMD 17h (EPYC) Processor family defaults
kvn
parents: 47216
diff changeset
   291
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   292
    //
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   293
    // Extended cpuid(0x80000008)
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   294
    //
47582
fde01e0fccb4 8187219: Newer AMD 17h (EPYC) Processor family defaults
kvn
parents: 47216
diff changeset
   295
    __ bind(ext_cpuid8);
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   296
    __ movl(rax, 0x80000008);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   297
    __ cpuid();
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   298
    __ lea(rsi, Address(rbp, in_bytes(VM_Version::ext_cpuid8_offset())));
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   299
    __ movl(Address(rsi, 0), rax);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   300
    __ movl(Address(rsi, 4), rbx);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   301
    __ movl(Address(rsi, 8), rcx);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   302
    __ movl(Address(rsi,12), rdx);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   303
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   304
    //
11417
4ecc3253bec4 7125934: Add a fast unordered timestamp capability to Hotspot on x86/x64
phh
parents: 10565
diff changeset
   305
    // Extended cpuid(0x80000007)
4ecc3253bec4 7125934: Add a fast unordered timestamp capability to Hotspot on x86/x64
phh
parents: 10565
diff changeset
   306
    //
4ecc3253bec4 7125934: Add a fast unordered timestamp capability to Hotspot on x86/x64
phh
parents: 10565
diff changeset
   307
    __ bind(ext_cpuid7);
4ecc3253bec4 7125934: Add a fast unordered timestamp capability to Hotspot on x86/x64
phh
parents: 10565
diff changeset
   308
    __ movl(rax, 0x80000007);
4ecc3253bec4 7125934: Add a fast unordered timestamp capability to Hotspot on x86/x64
phh
parents: 10565
diff changeset
   309
    __ cpuid();
4ecc3253bec4 7125934: Add a fast unordered timestamp capability to Hotspot on x86/x64
phh
parents: 10565
diff changeset
   310
    __ lea(rsi, Address(rbp, in_bytes(VM_Version::ext_cpuid7_offset())));
4ecc3253bec4 7125934: Add a fast unordered timestamp capability to Hotspot on x86/x64
phh
parents: 10565
diff changeset
   311
    __ movl(Address(rsi, 0), rax);
4ecc3253bec4 7125934: Add a fast unordered timestamp capability to Hotspot on x86/x64
phh
parents: 10565
diff changeset
   312
    __ movl(Address(rsi, 4), rbx);
4ecc3253bec4 7125934: Add a fast unordered timestamp capability to Hotspot on x86/x64
phh
parents: 10565
diff changeset
   313
    __ movl(Address(rsi, 8), rcx);
4ecc3253bec4 7125934: Add a fast unordered timestamp capability to Hotspot on x86/x64
phh
parents: 10565
diff changeset
   314
    __ movl(Address(rsi,12), rdx);
4ecc3253bec4 7125934: Add a fast unordered timestamp capability to Hotspot on x86/x64
phh
parents: 10565
diff changeset
   315
4ecc3253bec4 7125934: Add a fast unordered timestamp capability to Hotspot on x86/x64
phh
parents: 10565
diff changeset
   316
    //
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   317
    // Extended cpuid(0x80000005)
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   318
    //
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   319
    __ bind(ext_cpuid5);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   320
    __ movl(rax, 0x80000005);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   321
    __ cpuid();
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   322
    __ lea(rsi, Address(rbp, in_bytes(VM_Version::ext_cpuid5_offset())));
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   323
    __ movl(Address(rsi, 0), rax);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   324
    __ movl(Address(rsi, 4), rbx);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   325
    __ movl(Address(rsi, 8), rcx);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   326
    __ movl(Address(rsi,12), rdx);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   327
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   328
    //
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   329
    // Extended cpuid(0x80000001)
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   330
    //
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   331
    __ bind(ext_cpuid1);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   332
    __ movl(rax, 0x80000001);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   333
    __ cpuid();
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   334
    __ lea(rsi, Address(rbp, in_bytes(VM_Version::ext_cpuid1_offset())));
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   335
    __ movl(Address(rsi, 0), rax);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   336
    __ movl(Address(rsi, 4), rbx);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   337
    __ movl(Address(rsi, 8), rcx);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   338
    __ movl(Address(rsi,12), rdx);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   339
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   340
    //
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   341
    // Check if OS has enabled XGETBV instruction to access XCR0
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   342
    // (OSXSAVE feature flag) and CPU supports AVX
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   343
    //
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   344
    __ lea(rsi, Address(rbp, in_bytes(VM_Version::std_cpuid1_offset())));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   345
    __ movl(rcx, 0x18000000); // cpuid1 bits osxsave | avx
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   346
    __ andl(rcx, Address(rsi, 8)); // cpuid1 bits osxsave | avx
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   347
    __ cmpl(rcx, 0x18000000);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   348
    __ jccb(Assembler::notEqual, done); // jump if AVX is not supported
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   349
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   350
    __ movl(rax, 0x6);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   351
    __ andl(rax, Address(rbp, in_bytes(VM_Version::xem_xcr0_offset()))); // xcr0 bits sse | ymm
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   352
    __ cmpl(rax, 0x6);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   353
    __ jccb(Assembler::equal, start_simd_check); // return if AVX is not supported
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   354
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   355
    // we need to bridge farther than imm8, so we use this island as a thunk
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   356
    __ bind(done);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   357
    __ jmp(wrapup);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   358
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   359
    __ bind(start_simd_check);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   360
    //
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   361
    // Some OSs have a bug when upper 128/256bits of YMM/ZMM
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   362
    // registers are not restored after a signal processing.
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   363
    // Generate SEGV here (reference through NULL)
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   364
    // and check upper YMM/ZMM bits after it.
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   365
    //
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   366
    intx saved_useavx = UseAVX;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   367
    intx saved_usesse = UseSSE;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   368
    // check _cpuid_info.sef_cpuid7_ebx.bits.avx512f
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   369
    __ lea(rsi, Address(rbp, in_bytes(VM_Version::sef_cpuid7_offset())));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   370
    __ movl(rax, 0x10000);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   371
    __ andl(rax, Address(rsi, 4)); // xcr0 bits sse | ymm
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   372
    __ cmpl(rax, 0x10000);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   373
    __ jccb(Assembler::notEqual, legacy_setup); // jump if EVEX is not supported
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   374
    // check _cpuid_info.xem_xcr0_eax.bits.opmask
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   375
    // check _cpuid_info.xem_xcr0_eax.bits.zmm512
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   376
    // check _cpuid_info.xem_xcr0_eax.bits.zmm32
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   377
    __ movl(rax, 0xE0);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   378
    __ andl(rax, Address(rbp, in_bytes(VM_Version::xem_xcr0_offset()))); // xcr0 bits sse | ymm
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   379
    __ cmpl(rax, 0xE0);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   380
    __ jccb(Assembler::notEqual, legacy_setup); // jump if EVEX is not supported
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   381
42586
e14fee6a1839 8170039: Change UseAVX < 3 on SKX/KNL to not emit evex vector check
mcberg
parents: 42076
diff changeset
   382
    // If UseAVX is unitialized or is set by the user to include EVEX
e14fee6a1839 8170039: Change UseAVX < 3 on SKX/KNL to not emit evex vector check
mcberg
parents: 42076
diff changeset
   383
    if (use_evex) {
e14fee6a1839 8170039: Change UseAVX < 3 on SKX/KNL to not emit evex vector check
mcberg
parents: 42076
diff changeset
   384
      // EVEX setup: run in lowest evex mode
e14fee6a1839 8170039: Change UseAVX < 3 on SKX/KNL to not emit evex vector check
mcberg
parents: 42076
diff changeset
   385
      VM_Version::set_evex_cpuFeatures(); // Enable temporary to pass asserts
e14fee6a1839 8170039: Change UseAVX < 3 on SKX/KNL to not emit evex vector check
mcberg
parents: 42076
diff changeset
   386
      UseAVX = 3;
e14fee6a1839 8170039: Change UseAVX < 3 on SKX/KNL to not emit evex vector check
mcberg
parents: 42076
diff changeset
   387
      UseSSE = 2;
42076
d6c3ecec1d34 8067744: XMM/SSE float register values corrupted by JNI_CreateVM call in JRE 8 (Windows)
kvn
parents: 42039
diff changeset
   388
#ifdef _WINDOWS
42586
e14fee6a1839 8170039: Change UseAVX < 3 on SKX/KNL to not emit evex vector check
mcberg
parents: 42076
diff changeset
   389
      // xmm5-xmm15 are not preserved by caller on windows
e14fee6a1839 8170039: Change UseAVX < 3 on SKX/KNL to not emit evex vector check
mcberg
parents: 42076
diff changeset
   390
      // https://msdn.microsoft.com/en-us/library/9z1stfyw.aspx
e14fee6a1839 8170039: Change UseAVX < 3 on SKX/KNL to not emit evex vector check
mcberg
parents: 42076
diff changeset
   391
      __ subptr(rsp, 64);
e14fee6a1839 8170039: Change UseAVX < 3 on SKX/KNL to not emit evex vector check
mcberg
parents: 42076
diff changeset
   392
      __ evmovdqul(Address(rsp, 0), xmm7, Assembler::AVX_512bit);
42076
d6c3ecec1d34 8067744: XMM/SSE float register values corrupted by JNI_CreateVM call in JRE 8 (Windows)
kvn
parents: 42039
diff changeset
   393
#ifdef _LP64
42586
e14fee6a1839 8170039: Change UseAVX < 3 on SKX/KNL to not emit evex vector check
mcberg
parents: 42076
diff changeset
   394
      __ subptr(rsp, 64);
e14fee6a1839 8170039: Change UseAVX < 3 on SKX/KNL to not emit evex vector check
mcberg
parents: 42076
diff changeset
   395
      __ evmovdqul(Address(rsp, 0), xmm8, Assembler::AVX_512bit);
e14fee6a1839 8170039: Change UseAVX < 3 on SKX/KNL to not emit evex vector check
mcberg
parents: 42076
diff changeset
   396
      __ subptr(rsp, 64);
e14fee6a1839 8170039: Change UseAVX < 3 on SKX/KNL to not emit evex vector check
mcberg
parents: 42076
diff changeset
   397
      __ evmovdqul(Address(rsp, 0), xmm31, Assembler::AVX_512bit);
42076
d6c3ecec1d34 8067744: XMM/SSE float register values corrupted by JNI_CreateVM call in JRE 8 (Windows)
kvn
parents: 42039
diff changeset
   398
#endif // _LP64
d6c3ecec1d34 8067744: XMM/SSE float register values corrupted by JNI_CreateVM call in JRE 8 (Windows)
kvn
parents: 42039
diff changeset
   399
#endif // _WINDOWS
d6c3ecec1d34 8067744: XMM/SSE float register values corrupted by JNI_CreateVM call in JRE 8 (Windows)
kvn
parents: 42039
diff changeset
   400
42586
e14fee6a1839 8170039: Change UseAVX < 3 on SKX/KNL to not emit evex vector check
mcberg
parents: 42076
diff changeset
   401
      // load value into all 64 bytes of zmm7 register
e14fee6a1839 8170039: Change UseAVX < 3 on SKX/KNL to not emit evex vector check
mcberg
parents: 42076
diff changeset
   402
      __ movl(rcx, VM_Version::ymm_test_value());
e14fee6a1839 8170039: Change UseAVX < 3 on SKX/KNL to not emit evex vector check
mcberg
parents: 42076
diff changeset
   403
      __ movdl(xmm0, rcx);
e14fee6a1839 8170039: Change UseAVX < 3 on SKX/KNL to not emit evex vector check
mcberg
parents: 42076
diff changeset
   404
      __ movl(rcx, 0xffff);
e14fee6a1839 8170039: Change UseAVX < 3 on SKX/KNL to not emit evex vector check
mcberg
parents: 42076
diff changeset
   405
      __ kmovwl(k1, rcx);
51857
9978fea8a371 8210764: Update avx512 implementation
kvn
parents: 50860
diff changeset
   406
      __ vpbroadcastd(xmm0, xmm0, Assembler::AVX_512bit);
42586
e14fee6a1839 8170039: Change UseAVX < 3 on SKX/KNL to not emit evex vector check
mcberg
parents: 42076
diff changeset
   407
      __ evmovdqul(xmm7, xmm0, Assembler::AVX_512bit);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   408
#ifdef _LP64
42586
e14fee6a1839 8170039: Change UseAVX < 3 on SKX/KNL to not emit evex vector check
mcberg
parents: 42076
diff changeset
   409
      __ evmovdqul(xmm8, xmm0, Assembler::AVX_512bit);
e14fee6a1839 8170039: Change UseAVX < 3 on SKX/KNL to not emit evex vector check
mcberg
parents: 42076
diff changeset
   410
      __ evmovdqul(xmm31, xmm0, Assembler::AVX_512bit);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   411
#endif
42586
e14fee6a1839 8170039: Change UseAVX < 3 on SKX/KNL to not emit evex vector check
mcberg
parents: 42076
diff changeset
   412
      VM_Version::clean_cpuFeatures();
e14fee6a1839 8170039: Change UseAVX < 3 on SKX/KNL to not emit evex vector check
mcberg
parents: 42076
diff changeset
   413
      __ jmp(save_restore_except);
e14fee6a1839 8170039: Change UseAVX < 3 on SKX/KNL to not emit evex vector check
mcberg
parents: 42076
diff changeset
   414
    }
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   415
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   416
    __ bind(legacy_setup);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   417
    // AVX setup
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   418
    VM_Version::set_avx_cpuFeatures(); // Enable temporary to pass asserts
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   419
    UseAVX = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   420
    UseSSE = 2;
42076
d6c3ecec1d34 8067744: XMM/SSE float register values corrupted by JNI_CreateVM call in JRE 8 (Windows)
kvn
parents: 42039
diff changeset
   421
#ifdef _WINDOWS
d6c3ecec1d34 8067744: XMM/SSE float register values corrupted by JNI_CreateVM call in JRE 8 (Windows)
kvn
parents: 42039
diff changeset
   422
    __ subptr(rsp, 32);
d6c3ecec1d34 8067744: XMM/SSE float register values corrupted by JNI_CreateVM call in JRE 8 (Windows)
kvn
parents: 42039
diff changeset
   423
    __ vmovdqu(Address(rsp, 0), xmm7);
d6c3ecec1d34 8067744: XMM/SSE float register values corrupted by JNI_CreateVM call in JRE 8 (Windows)
kvn
parents: 42039
diff changeset
   424
#ifdef _LP64
d6c3ecec1d34 8067744: XMM/SSE float register values corrupted by JNI_CreateVM call in JRE 8 (Windows)
kvn
parents: 42039
diff changeset
   425
    __ subptr(rsp, 32);
d6c3ecec1d34 8067744: XMM/SSE float register values corrupted by JNI_CreateVM call in JRE 8 (Windows)
kvn
parents: 42039
diff changeset
   426
    __ vmovdqu(Address(rsp, 0), xmm8);
d6c3ecec1d34 8067744: XMM/SSE float register values corrupted by JNI_CreateVM call in JRE 8 (Windows)
kvn
parents: 42039
diff changeset
   427
    __ subptr(rsp, 32);
d6c3ecec1d34 8067744: XMM/SSE float register values corrupted by JNI_CreateVM call in JRE 8 (Windows)
kvn
parents: 42039
diff changeset
   428
    __ vmovdqu(Address(rsp, 0), xmm15);
d6c3ecec1d34 8067744: XMM/SSE float register values corrupted by JNI_CreateVM call in JRE 8 (Windows)
kvn
parents: 42039
diff changeset
   429
#endif // _LP64
d6c3ecec1d34 8067744: XMM/SSE float register values corrupted by JNI_CreateVM call in JRE 8 (Windows)
kvn
parents: 42039
diff changeset
   430
#endif // _WINDOWS
d6c3ecec1d34 8067744: XMM/SSE float register values corrupted by JNI_CreateVM call in JRE 8 (Windows)
kvn
parents: 42039
diff changeset
   431
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   432
    // load value into all 32 bytes of ymm7 register
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   433
    __ movl(rcx, VM_Version::ymm_test_value());
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   434
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   435
    __ movdl(xmm0, rcx);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   436
    __ pshufd(xmm0, xmm0, 0x00);
36561
b18243f4d955 8151002: Make Assembler methods vextract and vinsert match actual instructions
mikael
parents: 36555
diff changeset
   437
    __ vinsertf128_high(xmm0, xmm0);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   438
    __ vmovdqu(xmm7, xmm0);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   439
#ifdef _LP64
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   440
    __ vmovdqu(xmm8, xmm0);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   441
    __ vmovdqu(xmm15, xmm0);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   442
#endif
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   443
    VM_Version::clean_cpuFeatures();
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   444
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   445
    __ bind(save_restore_except);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   446
    __ xorl(rsi, rsi);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   447
    VM_Version::set_cpuinfo_segv_addr(__ pc());
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   448
    // Generate SEGV
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   449
    __ movl(rax, Address(rsi, 0));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   450
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   451
    VM_Version::set_cpuinfo_cont_addr(__ pc());
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   452
    // Returns here after signal. Save xmm0 to check it later.
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   453
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   454
    // check _cpuid_info.sef_cpuid7_ebx.bits.avx512f
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   455
    __ lea(rsi, Address(rbp, in_bytes(VM_Version::sef_cpuid7_offset())));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   456
    __ movl(rax, 0x10000);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   457
    __ andl(rax, Address(rsi, 4));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   458
    __ cmpl(rax, 0x10000);
46440
61025eecb743 8178811: Minimize the AVX <-> SSE transition penalty through generation of vzeroupper instruction on x86
vdeshpande
parents: 43936
diff changeset
   459
    __ jcc(Assembler::notEqual, legacy_save_restore);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   460
    // check _cpuid_info.xem_xcr0_eax.bits.opmask
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   461
    // check _cpuid_info.xem_xcr0_eax.bits.zmm512
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   462
    // check _cpuid_info.xem_xcr0_eax.bits.zmm32
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   463
    __ movl(rax, 0xE0);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   464
    __ andl(rax, Address(rbp, in_bytes(VM_Version::xem_xcr0_offset()))); // xcr0 bits sse | ymm
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   465
    __ cmpl(rax, 0xE0);
46440
61025eecb743 8178811: Minimize the AVX <-> SSE transition penalty through generation of vzeroupper instruction on x86
vdeshpande
parents: 43936
diff changeset
   466
    __ jcc(Assembler::notEqual, legacy_save_restore);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   467
42586
e14fee6a1839 8170039: Change UseAVX < 3 on SKX/KNL to not emit evex vector check
mcberg
parents: 42076
diff changeset
   468
    // If UseAVX is unitialized or is set by the user to include EVEX
e14fee6a1839 8170039: Change UseAVX < 3 on SKX/KNL to not emit evex vector check
mcberg
parents: 42076
diff changeset
   469
    if (use_evex) {
e14fee6a1839 8170039: Change UseAVX < 3 on SKX/KNL to not emit evex vector check
mcberg
parents: 42076
diff changeset
   470
      // EVEX check: run in lowest evex mode
e14fee6a1839 8170039: Change UseAVX < 3 on SKX/KNL to not emit evex vector check
mcberg
parents: 42076
diff changeset
   471
      VM_Version::set_evex_cpuFeatures(); // Enable temporary to pass asserts
e14fee6a1839 8170039: Change UseAVX < 3 on SKX/KNL to not emit evex vector check
mcberg
parents: 42076
diff changeset
   472
      UseAVX = 3;
e14fee6a1839 8170039: Change UseAVX < 3 on SKX/KNL to not emit evex vector check
mcberg
parents: 42076
diff changeset
   473
      UseSSE = 2;
e14fee6a1839 8170039: Change UseAVX < 3 on SKX/KNL to not emit evex vector check
mcberg
parents: 42076
diff changeset
   474
      __ lea(rsi, Address(rbp, in_bytes(VM_Version::zmm_save_offset())));
e14fee6a1839 8170039: Change UseAVX < 3 on SKX/KNL to not emit evex vector check
mcberg
parents: 42076
diff changeset
   475
      __ evmovdqul(Address(rsi, 0), xmm0, Assembler::AVX_512bit);
e14fee6a1839 8170039: Change UseAVX < 3 on SKX/KNL to not emit evex vector check
mcberg
parents: 42076
diff changeset
   476
      __ evmovdqul(Address(rsi, 64), xmm7, Assembler::AVX_512bit);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   477
#ifdef _LP64
42586
e14fee6a1839 8170039: Change UseAVX < 3 on SKX/KNL to not emit evex vector check
mcberg
parents: 42076
diff changeset
   478
      __ evmovdqul(Address(rsi, 128), xmm8, Assembler::AVX_512bit);
e14fee6a1839 8170039: Change UseAVX < 3 on SKX/KNL to not emit evex vector check
mcberg
parents: 42076
diff changeset
   479
      __ evmovdqul(Address(rsi, 192), xmm31, Assembler::AVX_512bit);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   480
#endif
42076
d6c3ecec1d34 8067744: XMM/SSE float register values corrupted by JNI_CreateVM call in JRE 8 (Windows)
kvn
parents: 42039
diff changeset
   481
d6c3ecec1d34 8067744: XMM/SSE float register values corrupted by JNI_CreateVM call in JRE 8 (Windows)
kvn
parents: 42039
diff changeset
   482
#ifdef _WINDOWS
d6c3ecec1d34 8067744: XMM/SSE float register values corrupted by JNI_CreateVM call in JRE 8 (Windows)
kvn
parents: 42039
diff changeset
   483
#ifdef _LP64
42586
e14fee6a1839 8170039: Change UseAVX < 3 on SKX/KNL to not emit evex vector check
mcberg
parents: 42076
diff changeset
   484
      __ evmovdqul(xmm31, Address(rsp, 0), Assembler::AVX_512bit);
e14fee6a1839 8170039: Change UseAVX < 3 on SKX/KNL to not emit evex vector check
mcberg
parents: 42076
diff changeset
   485
      __ addptr(rsp, 64);
e14fee6a1839 8170039: Change UseAVX < 3 on SKX/KNL to not emit evex vector check
mcberg
parents: 42076
diff changeset
   486
      __ evmovdqul(xmm8, Address(rsp, 0), Assembler::AVX_512bit);
e14fee6a1839 8170039: Change UseAVX < 3 on SKX/KNL to not emit evex vector check
mcberg
parents: 42076
diff changeset
   487
      __ addptr(rsp, 64);
42076
d6c3ecec1d34 8067744: XMM/SSE float register values corrupted by JNI_CreateVM call in JRE 8 (Windows)
kvn
parents: 42039
diff changeset
   488
#endif // _LP64
42586
e14fee6a1839 8170039: Change UseAVX < 3 on SKX/KNL to not emit evex vector check
mcberg
parents: 42076
diff changeset
   489
      __ evmovdqul(xmm7, Address(rsp, 0), Assembler::AVX_512bit);
e14fee6a1839 8170039: Change UseAVX < 3 on SKX/KNL to not emit evex vector check
mcberg
parents: 42076
diff changeset
   490
      __ addptr(rsp, 64);
42076
d6c3ecec1d34 8067744: XMM/SSE float register values corrupted by JNI_CreateVM call in JRE 8 (Windows)
kvn
parents: 42039
diff changeset
   491
#endif // _WINDOWS
46440
61025eecb743 8178811: Minimize the AVX <-> SSE transition penalty through generation of vzeroupper instruction on x86
vdeshpande
parents: 43936
diff changeset
   492
      generate_vzeroupper(wrapup);
42586
e14fee6a1839 8170039: Change UseAVX < 3 on SKX/KNL to not emit evex vector check
mcberg
parents: 42076
diff changeset
   493
      VM_Version::clean_cpuFeatures();
e14fee6a1839 8170039: Change UseAVX < 3 on SKX/KNL to not emit evex vector check
mcberg
parents: 42076
diff changeset
   494
      UseAVX = saved_useavx;
e14fee6a1839 8170039: Change UseAVX < 3 on SKX/KNL to not emit evex vector check
mcberg
parents: 42076
diff changeset
   495
      UseSSE = saved_usesse;
e14fee6a1839 8170039: Change UseAVX < 3 on SKX/KNL to not emit evex vector check
mcberg
parents: 42076
diff changeset
   496
      __ jmp(wrapup);
46440
61025eecb743 8178811: Minimize the AVX <-> SSE transition penalty through generation of vzeroupper instruction on x86
vdeshpande
parents: 43936
diff changeset
   497
   }
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   498
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   499
    __ bind(legacy_save_restore);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   500
    // AVX check
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   501
    VM_Version::set_avx_cpuFeatures(); // Enable temporary to pass asserts
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   502
    UseAVX = 1;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   503
    UseSSE = 2;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   504
    __ lea(rsi, Address(rbp, in_bytes(VM_Version::ymm_save_offset())));
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   505
    __ vmovdqu(Address(rsi, 0), xmm0);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   506
    __ vmovdqu(Address(rsi, 32), xmm7);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   507
#ifdef _LP64
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   508
    __ vmovdqu(Address(rsi, 64), xmm8);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   509
    __ vmovdqu(Address(rsi, 96), xmm15);
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   510
#endif
42076
d6c3ecec1d34 8067744: XMM/SSE float register values corrupted by JNI_CreateVM call in JRE 8 (Windows)
kvn
parents: 42039
diff changeset
   511
d6c3ecec1d34 8067744: XMM/SSE float register values corrupted by JNI_CreateVM call in JRE 8 (Windows)
kvn
parents: 42039
diff changeset
   512
#ifdef _WINDOWS
d6c3ecec1d34 8067744: XMM/SSE float register values corrupted by JNI_CreateVM call in JRE 8 (Windows)
kvn
parents: 42039
diff changeset
   513
#ifdef _LP64
d6c3ecec1d34 8067744: XMM/SSE float register values corrupted by JNI_CreateVM call in JRE 8 (Windows)
kvn
parents: 42039
diff changeset
   514
    __ vmovdqu(xmm15, Address(rsp, 0));
d6c3ecec1d34 8067744: XMM/SSE float register values corrupted by JNI_CreateVM call in JRE 8 (Windows)
kvn
parents: 42039
diff changeset
   515
    __ addptr(rsp, 32);
d6c3ecec1d34 8067744: XMM/SSE float register values corrupted by JNI_CreateVM call in JRE 8 (Windows)
kvn
parents: 42039
diff changeset
   516
    __ vmovdqu(xmm8, Address(rsp, 0));
d6c3ecec1d34 8067744: XMM/SSE float register values corrupted by JNI_CreateVM call in JRE 8 (Windows)
kvn
parents: 42039
diff changeset
   517
    __ addptr(rsp, 32);
d6c3ecec1d34 8067744: XMM/SSE float register values corrupted by JNI_CreateVM call in JRE 8 (Windows)
kvn
parents: 42039
diff changeset
   518
#endif // _LP64
d6c3ecec1d34 8067744: XMM/SSE float register values corrupted by JNI_CreateVM call in JRE 8 (Windows)
kvn
parents: 42039
diff changeset
   519
    __ vmovdqu(xmm7, Address(rsp, 0));
d6c3ecec1d34 8067744: XMM/SSE float register values corrupted by JNI_CreateVM call in JRE 8 (Windows)
kvn
parents: 42039
diff changeset
   520
    __ addptr(rsp, 32);
d6c3ecec1d34 8067744: XMM/SSE float register values corrupted by JNI_CreateVM call in JRE 8 (Windows)
kvn
parents: 42039
diff changeset
   521
#endif // _WINDOWS
46440
61025eecb743 8178811: Minimize the AVX <-> SSE transition penalty through generation of vzeroupper instruction on x86
vdeshpande
parents: 43936
diff changeset
   522
    generate_vzeroupper(wrapup);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   523
    VM_Version::clean_cpuFeatures();
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   524
    UseAVX = saved_useavx;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   525
    UseSSE = saved_usesse;
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   526
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   527
    __ bind(wrapup);
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   528
    __ popf();
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   529
    __ pop(rsi);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   530
    __ pop(rbx);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   531
    __ pop(rbp);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   532
    __ ret(0);
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   533
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   534
#   undef __
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   535
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   536
    return start;
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   537
  };
46440
61025eecb743 8178811: Minimize the AVX <-> SSE transition penalty through generation of vzeroupper instruction on x86
vdeshpande
parents: 43936
diff changeset
   538
  void generate_vzeroupper(Label& L_wrapup) {
61025eecb743 8178811: Minimize the AVX <-> SSE transition penalty through generation of vzeroupper instruction on x86
vdeshpande
parents: 43936
diff changeset
   539
#   define __ _masm->
61025eecb743 8178811: Minimize the AVX <-> SSE transition penalty through generation of vzeroupper instruction on x86
vdeshpande
parents: 43936
diff changeset
   540
    __ lea(rsi, Address(rbp, in_bytes(VM_Version::std_cpuid0_offset())));
61025eecb743 8178811: Minimize the AVX <-> SSE transition penalty through generation of vzeroupper instruction on x86
vdeshpande
parents: 43936
diff changeset
   541
    __ cmpl(Address(rsi, 4), 0x756e6547);  // 'uneG'
61025eecb743 8178811: Minimize the AVX <-> SSE transition penalty through generation of vzeroupper instruction on x86
vdeshpande
parents: 43936
diff changeset
   542
    __ jcc(Assembler::notEqual, L_wrapup);
61025eecb743 8178811: Minimize the AVX <-> SSE transition penalty through generation of vzeroupper instruction on x86
vdeshpande
parents: 43936
diff changeset
   543
    __ movl(rcx, 0x0FFF0FF0);
61025eecb743 8178811: Minimize the AVX <-> SSE transition penalty through generation of vzeroupper instruction on x86
vdeshpande
parents: 43936
diff changeset
   544
    __ lea(rsi, Address(rbp, in_bytes(VM_Version::std_cpuid1_offset())));
61025eecb743 8178811: Minimize the AVX <-> SSE transition penalty through generation of vzeroupper instruction on x86
vdeshpande
parents: 43936
diff changeset
   545
    __ andl(rcx, Address(rsi, 0));
61025eecb743 8178811: Minimize the AVX <-> SSE transition penalty through generation of vzeroupper instruction on x86
vdeshpande
parents: 43936
diff changeset
   546
    __ cmpl(rcx, 0x00050670);              // If it is Xeon Phi 3200/5200/7200
61025eecb743 8178811: Minimize the AVX <-> SSE transition penalty through generation of vzeroupper instruction on x86
vdeshpande
parents: 43936
diff changeset
   547
    __ jcc(Assembler::equal, L_wrapup);
61025eecb743 8178811: Minimize the AVX <-> SSE transition penalty through generation of vzeroupper instruction on x86
vdeshpande
parents: 43936
diff changeset
   548
    __ cmpl(rcx, 0x00080650);              // If it is Future Xeon Phi
61025eecb743 8178811: Minimize the AVX <-> SSE transition penalty through generation of vzeroupper instruction on x86
vdeshpande
parents: 43936
diff changeset
   549
    __ jcc(Assembler::equal, L_wrapup);
61025eecb743 8178811: Minimize the AVX <-> SSE transition penalty through generation of vzeroupper instruction on x86
vdeshpande
parents: 43936
diff changeset
   550
    __ vzeroupper();
61025eecb743 8178811: Minimize the AVX <-> SSE transition penalty through generation of vzeroupper instruction on x86
vdeshpande
parents: 43936
diff changeset
   551
#   undef __
61025eecb743 8178811: Minimize the AVX <-> SSE transition penalty through generation of vzeroupper instruction on x86
vdeshpande
parents: 43936
diff changeset
   552
  }
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   553
};
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   554
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   555
void VM_Version::get_processor_features() {
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   556
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   557
  _cpu = 4; // 486 by default
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   558
  _model = 0;
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   559
  _stepping = 0;
35148
5cfafc99d791 8143072: [JVMCI] Port JVMCI to AArch64
twisti
parents: 35111
diff changeset
   560
  _features = 0;
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   561
  _logical_processors_per_package = 1;
25633
4cd9c4622c8c 8049717: expose L1_data_cache_line_size for diagnostic/sanity checks
dcubed
parents: 25468
diff changeset
   562
  // i486 internal cache is both I&D and has a 16-byte line size
4cd9c4622c8c 8049717: expose L1_data_cache_line_size for diagnostic/sanity checks
dcubed
parents: 25468
diff changeset
   563
  _L1_data_cache_line_size = 16;
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   564
35102
c5f050e1f982 6808665: Use486InstrsOnly aborts 32-bit VM
thartmann
parents: 34207
diff changeset
   565
  // Get raw processor info
23527
397b6816032d 8038633: crash in VM_Version::get_processor_features() on startup
kvn
parents: 23491
diff changeset
   566
35102
c5f050e1f982 6808665: Use486InstrsOnly aborts 32-bit VM
thartmann
parents: 34207
diff changeset
   567
  get_cpu_info_stub(&_cpuid_info);
23527
397b6816032d 8038633: crash in VM_Version::get_processor_features() on startup
kvn
parents: 23491
diff changeset
   568
35102
c5f050e1f982 6808665: Use486InstrsOnly aborts 32-bit VM
thartmann
parents: 34207
diff changeset
   569
  assert_is_initialized();
c5f050e1f982 6808665: Use486InstrsOnly aborts 32-bit VM
thartmann
parents: 34207
diff changeset
   570
  _cpu = extended_cpu_family();
c5f050e1f982 6808665: Use486InstrsOnly aborts 32-bit VM
thartmann
parents: 34207
diff changeset
   571
  _model = extended_cpu_model();
c5f050e1f982 6808665: Use486InstrsOnly aborts 32-bit VM
thartmann
parents: 34207
diff changeset
   572
  _stepping = cpu_stepping();
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   573
35102
c5f050e1f982 6808665: Use486InstrsOnly aborts 32-bit VM
thartmann
parents: 34207
diff changeset
   574
  if (cpu_family() > 4) { // it supports CPUID
35148
5cfafc99d791 8143072: [JVMCI] Port JVMCI to AArch64
twisti
parents: 35111
diff changeset
   575
    _features = feature_flags();
35102
c5f050e1f982 6808665: Use486InstrsOnly aborts 32-bit VM
thartmann
parents: 34207
diff changeset
   576
    // Logical processors are only available on P4s and above,
c5f050e1f982 6808665: Use486InstrsOnly aborts 32-bit VM
thartmann
parents: 34207
diff changeset
   577
    // and only if hyperthreading is available.
c5f050e1f982 6808665: Use486InstrsOnly aborts 32-bit VM
thartmann
parents: 34207
diff changeset
   578
    _logical_processors_per_package = logical_processor_count();
c5f050e1f982 6808665: Use486InstrsOnly aborts 32-bit VM
thartmann
parents: 34207
diff changeset
   579
    _L1_data_cache_line_size = L1_line_size();
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   580
  }
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   581
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   582
  _supports_cx8 = supports_cmpxchg8();
13886
8d82c4dfa722 7023898: Intrinsify AtomicLongFieldUpdater.getAndIncrement()
roland
parents: 13885
diff changeset
   583
  // xchg and xadd instructions
8d82c4dfa722 7023898: Intrinsify AtomicLongFieldUpdater.getAndIncrement()
roland
parents: 13885
diff changeset
   584
  _supports_atomic_getset4 = true;
8d82c4dfa722 7023898: Intrinsify AtomicLongFieldUpdater.getAndIncrement()
roland
parents: 13885
diff changeset
   585
  _supports_atomic_getadd4 = true;
8d82c4dfa722 7023898: Intrinsify AtomicLongFieldUpdater.getAndIncrement()
roland
parents: 13885
diff changeset
   586
  LP64_ONLY(_supports_atomic_getset8 = true);
8d82c4dfa722 7023898: Intrinsify AtomicLongFieldUpdater.getAndIncrement()
roland
parents: 13885
diff changeset
   587
  LP64_ONLY(_supports_atomic_getadd8 = true);
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   588
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   589
#ifdef _LP64
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   590
  // OS should support SSE for x64 and hardware should support at least SSE2.
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   591
  if (!VM_Version::supports_sse2()) {
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   592
    vm_exit_during_initialization("Unknown x64 processor: SSE2 not supported");
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   593
  }
4430
95b539dfa1e8 6769124: various 64-bit fixes for c1
roland
parents: 2862
diff changeset
   594
  // in 64 bit the use of SSE2 is the minimum
95b539dfa1e8 6769124: various 64-bit fixes for c1
roland
parents: 2862
diff changeset
   595
  if (UseSSE < 2) UseSSE = 2;
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   596
#endif
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   597
10010
72de7c910672 6990015: Incorrect Icache line size is used for 64 bit x86
kvn
parents: 9325
diff changeset
   598
#ifdef AMD64
72de7c910672 6990015: Incorrect Icache line size is used for 64 bit x86
kvn
parents: 9325
diff changeset
   599
  // flush_icache_stub have to be generated first.
72de7c910672 6990015: Incorrect Icache line size is used for 64 bit x86
kvn
parents: 9325
diff changeset
   600
  // That is why Icache line size is hard coded in ICache class,
72de7c910672 6990015: Incorrect Icache line size is used for 64 bit x86
kvn
parents: 9325
diff changeset
   601
  // see icache_x86.hpp. It is also the reason why we can't use
72de7c910672 6990015: Incorrect Icache line size is used for 64 bit x86
kvn
parents: 9325
diff changeset
   602
  // clflush instruction in 32-bit VM since it could be running
72de7c910672 6990015: Incorrect Icache line size is used for 64 bit x86
kvn
parents: 9325
diff changeset
   603
  // on CPU which does not support it.
72de7c910672 6990015: Incorrect Icache line size is used for 64 bit x86
kvn
parents: 9325
diff changeset
   604
  //
72de7c910672 6990015: Incorrect Icache line size is used for 64 bit x86
kvn
parents: 9325
diff changeset
   605
  // The only thing we can do is to verify that flushed
72de7c910672 6990015: Incorrect Icache line size is used for 64 bit x86
kvn
parents: 9325
diff changeset
   606
  // ICache::line_size has correct value.
72de7c910672 6990015: Incorrect Icache line size is used for 64 bit x86
kvn
parents: 9325
diff changeset
   607
  guarantee(_cpuid_info.std_cpuid1_edx.bits.clflush != 0, "clflush is not supported");
72de7c910672 6990015: Incorrect Icache line size is used for 64 bit x86
kvn
parents: 9325
diff changeset
   608
  // clflush_size is size in quadwords (8 bytes).
72de7c910672 6990015: Incorrect Icache line size is used for 64 bit x86
kvn
parents: 9325
diff changeset
   609
  guarantee(_cpuid_info.std_cpuid1_ebx.bits.clflush_size == 8, "such clflush size is not supported");
72de7c910672 6990015: Incorrect Icache line size is used for 64 bit x86
kvn
parents: 9325
diff changeset
   610
#endif
72de7c910672 6990015: Incorrect Icache line size is used for 64 bit x86
kvn
parents: 9325
diff changeset
   611
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   612
  // If the OS doesn't support SSE, we can't use this feature even if the HW does
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   613
  if (!os::supports_sse())
35148
5cfafc99d791 8143072: [JVMCI] Port JVMCI to AArch64
twisti
parents: 35111
diff changeset
   614
    _features &= ~(CPU_SSE|CPU_SSE2|CPU_SSE3|CPU_SSSE3|CPU_SSE4A|CPU_SSE4_1|CPU_SSE4_2);
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   615
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   616
  if (UseSSE < 4) {
35148
5cfafc99d791 8143072: [JVMCI] Port JVMCI to AArch64
twisti
parents: 35111
diff changeset
   617
    _features &= ~CPU_SSE4_1;
5cfafc99d791 8143072: [JVMCI] Port JVMCI to AArch64
twisti
parents: 35111
diff changeset
   618
    _features &= ~CPU_SSE4_2;
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   619
  }
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   620
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   621
  if (UseSSE < 3) {
35148
5cfafc99d791 8143072: [JVMCI] Port JVMCI to AArch64
twisti
parents: 35111
diff changeset
   622
    _features &= ~CPU_SSE3;
5cfafc99d791 8143072: [JVMCI] Port JVMCI to AArch64
twisti
parents: 35111
diff changeset
   623
    _features &= ~CPU_SSSE3;
5cfafc99d791 8143072: [JVMCI] Port JVMCI to AArch64
twisti
parents: 35111
diff changeset
   624
    _features &= ~CPU_SSE4A;
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   625
  }
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   626
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   627
  if (UseSSE < 2)
35148
5cfafc99d791 8143072: [JVMCI] Port JVMCI to AArch64
twisti
parents: 35111
diff changeset
   628
    _features &= ~CPU_SSE2;
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   629
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   630
  if (UseSSE < 1)
35148
5cfafc99d791 8143072: [JVMCI] Port JVMCI to AArch64
twisti
parents: 35111
diff changeset
   631
    _features &= ~CPU_SSE;
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   632
48489
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
   633
  //since AVX instructions is slower than SSE in some ZX cpus, force USEAVX=0.
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
   634
  if (is_zx() && ((cpu_family() == 6) || (cpu_family() == 7))) {
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
   635
    UseAVX = 0;
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
   636
  }
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
   637
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   638
  // first try initial setting and detect what we can support
48195
255407049d98 8170244: Update UseAVX after cpu feature detection to use more default mapping
vdeshpande
parents: 47799
diff changeset
   639
  int use_avx_limit = 0;
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   640
  if (UseAVX > 0) {
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   641
    if (UseAVX > 2 && supports_evex()) {
48195
255407049d98 8170244: Update UseAVX after cpu feature detection to use more default mapping
vdeshpande
parents: 47799
diff changeset
   642
      use_avx_limit = 3;
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   643
    } else if (UseAVX > 1 && supports_avx2()) {
48195
255407049d98 8170244: Update UseAVX after cpu feature detection to use more default mapping
vdeshpande
parents: 47799
diff changeset
   644
      use_avx_limit = 2;
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   645
    } else if (UseAVX > 0 && supports_avx()) {
48195
255407049d98 8170244: Update UseAVX after cpu feature detection to use more default mapping
vdeshpande
parents: 47799
diff changeset
   646
      use_avx_limit = 1;
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   647
    } else {
48195
255407049d98 8170244: Update UseAVX after cpu feature detection to use more default mapping
vdeshpande
parents: 47799
diff changeset
   648
      use_avx_limit = 0;
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   649
    }
48195
255407049d98 8170244: Update UseAVX after cpu feature detection to use more default mapping
vdeshpande
parents: 47799
diff changeset
   650
  }
255407049d98 8170244: Update UseAVX after cpu feature detection to use more default mapping
vdeshpande
parents: 47799
diff changeset
   651
  if (FLAG_IS_DEFAULT(UseAVX)) {
255407049d98 8170244: Update UseAVX after cpu feature detection to use more default mapping
vdeshpande
parents: 47799
diff changeset
   652
    FLAG_SET_DEFAULT(UseAVX, use_avx_limit);
255407049d98 8170244: Update UseAVX after cpu feature detection to use more default mapping
vdeshpande
parents: 47799
diff changeset
   653
  } else if (UseAVX > use_avx_limit) {
255407049d98 8170244: Update UseAVX after cpu feature detection to use more default mapping
vdeshpande
parents: 47799
diff changeset
   654
    warning("UseAVX=%d is not supported on this CPU, setting it to UseAVX=%d", (int) UseAVX, use_avx_limit);
255407049d98 8170244: Update UseAVX after cpu feature detection to use more default mapping
vdeshpande
parents: 47799
diff changeset
   655
    FLAG_SET_DEFAULT(UseAVX, use_avx_limit);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   656
  } else if (UseAVX < 0) {
48195
255407049d98 8170244: Update UseAVX after cpu feature detection to use more default mapping
vdeshpande
parents: 47799
diff changeset
   657
    warning("UseAVX=%d is not valid, setting it to UseAVX=0", (int) UseAVX);
255407049d98 8170244: Update UseAVX after cpu feature detection to use more default mapping
vdeshpande
parents: 47799
diff changeset
   658
    FLAG_SET_DEFAULT(UseAVX, 0);
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   659
  }
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   660
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   661
  if (UseAVX < 3) {
35148
5cfafc99d791 8143072: [JVMCI] Port JVMCI to AArch64
twisti
parents: 35111
diff changeset
   662
    _features &= ~CPU_AVX512F;
5cfafc99d791 8143072: [JVMCI] Port JVMCI to AArch64
twisti
parents: 35111
diff changeset
   663
    _features &= ~CPU_AVX512DQ;
5cfafc99d791 8143072: [JVMCI] Port JVMCI to AArch64
twisti
parents: 35111
diff changeset
   664
    _features &= ~CPU_AVX512CD;
5cfafc99d791 8143072: [JVMCI] Port JVMCI to AArch64
twisti
parents: 35111
diff changeset
   665
    _features &= ~CPU_AVX512BW;
5cfafc99d791 8143072: [JVMCI] Port JVMCI to AArch64
twisti
parents: 35111
diff changeset
   666
    _features &= ~CPU_AVX512VL;
49384
b242a1e3f9cf 8199421: Add support for vector popcount
rlupusoru
parents: 48490
diff changeset
   667
    _features &= ~CPU_AVX512_VPOPCNTDQ;
49614
3b1570be8557 8200067: Add support for vpclmulqdq for crc32
srukmannagar
parents: 49384
diff changeset
   668
    _features &= ~CPU_VPCLMULQDQ;
50699
cc7fc46cc8c1 8205398: AES-CBC decryption algorithm using AVX512 instructions
kvn
parents: 50534
diff changeset
   669
    _features &= ~CPU_VAES;
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   670
  }
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   671
11427
bf248009cbbe 7116452: Add support for AVX instructions
kvn
parents: 10565
diff changeset
   672
  if (UseAVX < 2)
35148
5cfafc99d791 8143072: [JVMCI] Port JVMCI to AArch64
twisti
parents: 35111
diff changeset
   673
    _features &= ~CPU_AVX2;
11427
bf248009cbbe 7116452: Add support for AVX instructions
kvn
parents: 10565
diff changeset
   674
46440
61025eecb743 8178811: Minimize the AVX <-> SSE transition penalty through generation of vzeroupper instruction on x86
vdeshpande
parents: 43936
diff changeset
   675
  if (UseAVX < 1) {
35148
5cfafc99d791 8143072: [JVMCI] Port JVMCI to AArch64
twisti
parents: 35111
diff changeset
   676
    _features &= ~CPU_AVX;
46440
61025eecb743 8178811: Minimize the AVX <-> SSE transition penalty through generation of vzeroupper instruction on x86
vdeshpande
parents: 43936
diff changeset
   677
    _features &= ~CPU_VZEROUPPER;
61025eecb743 8178811: Minimize the AVX <-> SSE transition penalty through generation of vzeroupper instruction on x86
vdeshpande
parents: 43936
diff changeset
   678
  }
11427
bf248009cbbe 7116452: Add support for AVX instructions
kvn
parents: 10565
diff changeset
   679
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   680
  if (logical_processors_per_package() == 1) {
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   681
    // HT processor could be installed on a system which doesn't support HT.
35148
5cfafc99d791 8143072: [JVMCI] Port JVMCI to AArch64
twisti
parents: 35111
diff changeset
   682
    _features &= ~CPU_HT;
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   683
  }
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   684
46440
61025eecb743 8178811: Minimize the AVX <-> SSE transition penalty through generation of vzeroupper instruction on x86
vdeshpande
parents: 43936
diff changeset
   685
  if( is_intel() ) { // Intel cpus specific settings
46563
cfca8fbb4051 8182138: Disable generating INC and DEC instructions on Xeon Phi and ATOM CPUs
kvn
parents: 46560
diff changeset
   686
    if (is_knights_family()) {
46440
61025eecb743 8178811: Minimize the AVX <-> SSE transition penalty through generation of vzeroupper instruction on x86
vdeshpande
parents: 43936
diff changeset
   687
      _features &= ~CPU_VZEROUPPER;
61025eecb743 8178811: Minimize the AVX <-> SSE transition penalty through generation of vzeroupper instruction on x86
vdeshpande
parents: 43936
diff changeset
   688
    }
61025eecb743 8178811: Minimize the AVX <-> SSE transition penalty through generation of vzeroupper instruction on x86
vdeshpande
parents: 43936
diff changeset
   689
  }
61025eecb743 8178811: Minimize the AVX <-> SSE transition penalty through generation of vzeroupper instruction on x86
vdeshpande
parents: 43936
diff changeset
   690
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   691
  char buf[256];
41323
ddd5600d4762 8154122: Intrinsify fused mac operations
vdeshpande
parents: 39256
diff changeset
   692
  jio_snprintf(buf, sizeof(buf), "(%u cores per cpu, %u threads per core) family %d model %d stepping %d%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s",
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   693
               cores_per_cpu(), threads_per_core(),
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   694
               cpu_family(), _model, _stepping,
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   695
               (supports_cmov() ? ", cmov" : ""),
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   696
               (supports_cmpxchg8() ? ", cx8" : ""),
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   697
               (supports_fxsr() ? ", fxsr" : ""),
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   698
               (supports_mmx()  ? ", mmx"  : ""),
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   699
               (supports_sse()  ? ", sse"  : ""),
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   700
               (supports_sse2() ? ", sse2" : ""),
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   701
               (supports_sse3() ? ", sse3" : ""),
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   702
               (supports_ssse3()? ", ssse3": ""),
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   703
               (supports_sse4_1() ? ", sse4.1" : ""),
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   704
               (supports_sse4_2() ? ", sse4.2" : ""),
2255
54abdf3e1055 6378821: bitCount() should use POPC on SPARC processors and AMD+10h
twisti
parents: 2111
diff changeset
   705
               (supports_popcnt() ? ", popcnt" : ""),
11427
bf248009cbbe 7116452: Add support for AVX instructions
kvn
parents: 10565
diff changeset
   706
               (supports_avx()    ? ", avx" : ""),
bf248009cbbe 7116452: Add support for AVX instructions
kvn
parents: 10565
diff changeset
   707
               (supports_avx2()   ? ", avx2" : ""),
14132
3c1437abcefd 7184394: add intrinsics to use AES instructions
kvn
parents: 13886
diff changeset
   708
               (supports_aes()    ? ", aes" : ""),
23491
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
   709
               (supports_clmul()  ? ", clmul" : ""),
15114
4074553c678b 8005522: use fast-string instructions on x86 for zeroing
kvn
parents: 14834
diff changeset
   710
               (supports_erms()   ? ", erms" : ""),
23491
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
   711
               (supports_rtm()    ? ", rtm" : ""),
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   712
               (supports_mmx_ext() ? ", mmxext" : ""),
9135
f76543993e9d 7035713: 3DNow Prefetch Instruction Support
kvn
parents: 8921
diff changeset
   713
               (supports_3dnow_prefetch() ? ", 3dnowpref" : ""),
2862
fad636edf18f 6823354: Add intrinsics for {Integer,Long}.{numberOfLeadingZeros,numberOfTrailingZeros}()
twisti
parents: 2348
diff changeset
   714
               (supports_lzcnt()   ? ", lzcnt": ""),
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   715
               (supports_sse4a()   ? ", sse4a": ""),
11417
4ecc3253bec4 7125934: Add a fast unordered timestamp capability to Hotspot on x86/x64
phh
parents: 10565
diff changeset
   716
               (supports_ht() ? ", ht": ""),
4ecc3253bec4 7125934: Add a fast unordered timestamp capability to Hotspot on x86/x64
phh
parents: 10565
diff changeset
   717
               (supports_tsc() ? ", tsc": ""),
4ecc3253bec4 7125934: Add a fast unordered timestamp capability to Hotspot on x86/x64
phh
parents: 10565
diff changeset
   718
               (supports_tscinv_bit() ? ", tscinvbit": ""),
23220
fc827339dc37 8031321: Support Intel bit manipulation instructions
iveresov
parents: 18507
diff changeset
   719
               (supports_tscinv() ? ", tscinv": ""),
fc827339dc37 8031321: Support Intel bit manipulation instructions
iveresov
parents: 18507
diff changeset
   720
               (supports_bmi1() ? ", bmi1" : ""),
26434
09ad55e5f486 8055494: Add C2 x86 intrinsic for BigInteger::multiplyToLen() method
kvn
parents: 26306
diff changeset
   721
               (supports_bmi2() ? ", bmi2" : ""),
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   722
               (supports_adx() ? ", adx" : ""),
36555
4f37fd7a5a09 8150767: Enables SHA Extensions on x86
vdeshpande
parents: 35751
diff changeset
   723
               (supports_evex() ? ", evex" : ""),
41323
ddd5600d4762 8154122: Intrinsify fused mac operations
vdeshpande
parents: 39256
diff changeset
   724
               (supports_sha() ? ", sha" : ""),
ddd5600d4762 8154122: Intrinsify fused mac operations
vdeshpande
parents: 39256
diff changeset
   725
               (supports_fma() ? ", fma" : ""));
35148
5cfafc99d791 8143072: [JVMCI] Port JVMCI to AArch64
twisti
parents: 35111
diff changeset
   726
  _features_string = os::strdup(buf);
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   727
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   728
  // UseSSE is set to the smaller of what hardware supports and what
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   729
  // the command line requires.  I.e., you cannot set UseSSE to 2 on
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   730
  // older Pentiums which do not support it.
48195
255407049d98 8170244: Update UseAVX after cpu feature detection to use more default mapping
vdeshpande
parents: 47799
diff changeset
   731
  int use_sse_limit = 0;
255407049d98 8170244: Update UseAVX after cpu feature detection to use more default mapping
vdeshpande
parents: 47799
diff changeset
   732
  if (UseSSE > 0) {
255407049d98 8170244: Update UseAVX after cpu feature detection to use more default mapping
vdeshpande
parents: 47799
diff changeset
   733
    if (UseSSE > 3 && supports_sse4_1()) {
255407049d98 8170244: Update UseAVX after cpu feature detection to use more default mapping
vdeshpande
parents: 47799
diff changeset
   734
      use_sse_limit = 4;
255407049d98 8170244: Update UseAVX after cpu feature detection to use more default mapping
vdeshpande
parents: 47799
diff changeset
   735
    } else if (UseSSE > 2 && supports_sse3()) {
255407049d98 8170244: Update UseAVX after cpu feature detection to use more default mapping
vdeshpande
parents: 47799
diff changeset
   736
      use_sse_limit = 3;
255407049d98 8170244: Update UseAVX after cpu feature detection to use more default mapping
vdeshpande
parents: 47799
diff changeset
   737
    } else if (UseSSE > 1 && supports_sse2()) {
255407049d98 8170244: Update UseAVX after cpu feature detection to use more default mapping
vdeshpande
parents: 47799
diff changeset
   738
      use_sse_limit = 2;
255407049d98 8170244: Update UseAVX after cpu feature detection to use more default mapping
vdeshpande
parents: 47799
diff changeset
   739
    } else if (UseSSE > 0 && supports_sse()) {
255407049d98 8170244: Update UseAVX after cpu feature detection to use more default mapping
vdeshpande
parents: 47799
diff changeset
   740
      use_sse_limit = 1;
255407049d98 8170244: Update UseAVX after cpu feature detection to use more default mapping
vdeshpande
parents: 47799
diff changeset
   741
    } else {
255407049d98 8170244: Update UseAVX after cpu feature detection to use more default mapping
vdeshpande
parents: 47799
diff changeset
   742
      use_sse_limit = 0;
255407049d98 8170244: Update UseAVX after cpu feature detection to use more default mapping
vdeshpande
parents: 47799
diff changeset
   743
    }
255407049d98 8170244: Update UseAVX after cpu feature detection to use more default mapping
vdeshpande
parents: 47799
diff changeset
   744
  }
255407049d98 8170244: Update UseAVX after cpu feature detection to use more default mapping
vdeshpande
parents: 47799
diff changeset
   745
  if (FLAG_IS_DEFAULT(UseSSE)) {
255407049d98 8170244: Update UseAVX after cpu feature detection to use more default mapping
vdeshpande
parents: 47799
diff changeset
   746
    FLAG_SET_DEFAULT(UseSSE, use_sse_limit);
255407049d98 8170244: Update UseAVX after cpu feature detection to use more default mapping
vdeshpande
parents: 47799
diff changeset
   747
  } else if (UseSSE > use_sse_limit) {
255407049d98 8170244: Update UseAVX after cpu feature detection to use more default mapping
vdeshpande
parents: 47799
diff changeset
   748
    warning("UseSSE=%d is not supported on this CPU, setting it to UseSSE=%d", (int) UseSSE, use_sse_limit);
255407049d98 8170244: Update UseAVX after cpu feature detection to use more default mapping
vdeshpande
parents: 47799
diff changeset
   749
    FLAG_SET_DEFAULT(UseSSE, use_sse_limit);
255407049d98 8170244: Update UseAVX after cpu feature detection to use more default mapping
vdeshpande
parents: 47799
diff changeset
   750
  } else if (UseSSE < 0) {
255407049d98 8170244: Update UseAVX after cpu feature detection to use more default mapping
vdeshpande
parents: 47799
diff changeset
   751
    warning("UseSSE=%d is not valid, setting it to UseSSE=0", (int) UseSSE);
255407049d98 8170244: Update UseAVX after cpu feature detection to use more default mapping
vdeshpande
parents: 47799
diff changeset
   752
    FLAG_SET_DEFAULT(UseSSE, 0);
255407049d98 8170244: Update UseAVX after cpu feature detection to use more default mapping
vdeshpande
parents: 47799
diff changeset
   753
  }
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
   754
14132
3c1437abcefd 7184394: add intrinsics to use AES instructions
kvn
parents: 13886
diff changeset
   755
  // Use AES instructions if available.
3c1437abcefd 7184394: add intrinsics to use AES instructions
kvn
parents: 13886
diff changeset
   756
  if (supports_aes()) {
3c1437abcefd 7184394: add intrinsics to use AES instructions
kvn
parents: 13886
diff changeset
   757
    if (FLAG_IS_DEFAULT(UseAES)) {
34176
c1b52e665b47 8131778: java disables UseAES flag when using VIS=2 on sparc
kshefov
parents: 34162
diff changeset
   758
      FLAG_SET_DEFAULT(UseAES, true);
14132
3c1437abcefd 7184394: add intrinsics to use AES instructions
kvn
parents: 13886
diff changeset
   759
    }
34176
c1b52e665b47 8131778: java disables UseAES flag when using VIS=2 on sparc
kshefov
parents: 34162
diff changeset
   760
    if (!UseAES) {
c1b52e665b47 8131778: java disables UseAES flag when using VIS=2 on sparc
kshefov
parents: 34162
diff changeset
   761
      if (UseAESIntrinsics && !FLAG_IS_DEFAULT(UseAESIntrinsics)) {
c1b52e665b47 8131778: java disables UseAES flag when using VIS=2 on sparc
kshefov
parents: 34162
diff changeset
   762
        warning("AES intrinsics require UseAES flag to be enabled. Intrinsics will be disabled.");
c1b52e665b47 8131778: java disables UseAES flag when using VIS=2 on sparc
kshefov
parents: 34162
diff changeset
   763
      }
c1b52e665b47 8131778: java disables UseAES flag when using VIS=2 on sparc
kshefov
parents: 34162
diff changeset
   764
      FLAG_SET_DEFAULT(UseAESIntrinsics, false);
c1b52e665b47 8131778: java disables UseAES flag when using VIS=2 on sparc
kshefov
parents: 34162
diff changeset
   765
    } else {
c1b52e665b47 8131778: java disables UseAES flag when using VIS=2 on sparc
kshefov
parents: 34162
diff changeset
   766
      if (UseSSE > 2) {
c1b52e665b47 8131778: java disables UseAES flag when using VIS=2 on sparc
kshefov
parents: 34162
diff changeset
   767
        if (FLAG_IS_DEFAULT(UseAESIntrinsics)) {
c1b52e665b47 8131778: java disables UseAES flag when using VIS=2 on sparc
kshefov
parents: 34162
diff changeset
   768
          FLAG_SET_DEFAULT(UseAESIntrinsics, true);
c1b52e665b47 8131778: java disables UseAES flag when using VIS=2 on sparc
kshefov
parents: 34162
diff changeset
   769
        }
c1b52e665b47 8131778: java disables UseAES flag when using VIS=2 on sparc
kshefov
parents: 34162
diff changeset
   770
      } else {
c1b52e665b47 8131778: java disables UseAES flag when using VIS=2 on sparc
kshefov
parents: 34162
diff changeset
   771
        // The AES intrinsic stubs require AES instruction support (of course)
c1b52e665b47 8131778: java disables UseAES flag when using VIS=2 on sparc
kshefov
parents: 34162
diff changeset
   772
        // but also require sse3 mode or higher for instructions it use.
c1b52e665b47 8131778: java disables UseAES flag when using VIS=2 on sparc
kshefov
parents: 34162
diff changeset
   773
        if (UseAESIntrinsics && !FLAG_IS_DEFAULT(UseAESIntrinsics)) {
c1b52e665b47 8131778: java disables UseAES flag when using VIS=2 on sparc
kshefov
parents: 34162
diff changeset
   774
          warning("X86 AES intrinsics require SSE3 instructions or higher. Intrinsics will be disabled.");
c1b52e665b47 8131778: java disables UseAES flag when using VIS=2 on sparc
kshefov
parents: 34162
diff changeset
   775
        }
c1b52e665b47 8131778: java disables UseAES flag when using VIS=2 on sparc
kshefov
parents: 34162
diff changeset
   776
        FLAG_SET_DEFAULT(UseAESIntrinsics, false);
c1b52e665b47 8131778: java disables UseAES flag when using VIS=2 on sparc
kshefov
parents: 34162
diff changeset
   777
      }
35154
a9b3c1984a01 8143925: Enhancing CounterMode.crypt() for AES
kvn
parents: 35148
diff changeset
   778
a9b3c1984a01 8143925: Enhancing CounterMode.crypt() for AES
kvn
parents: 35148
diff changeset
   779
      // --AES-CTR begins--
a9b3c1984a01 8143925: Enhancing CounterMode.crypt() for AES
kvn
parents: 35148
diff changeset
   780
      if (!UseAESIntrinsics) {
a9b3c1984a01 8143925: Enhancing CounterMode.crypt() for AES
kvn
parents: 35148
diff changeset
   781
        if (UseAESCTRIntrinsics && !FLAG_IS_DEFAULT(UseAESCTRIntrinsics)) {
a9b3c1984a01 8143925: Enhancing CounterMode.crypt() for AES
kvn
parents: 35148
diff changeset
   782
          warning("AES-CTR intrinsics require UseAESIntrinsics flag to be enabled. Intrinsics will be disabled.");
a9b3c1984a01 8143925: Enhancing CounterMode.crypt() for AES
kvn
parents: 35148
diff changeset
   783
          FLAG_SET_DEFAULT(UseAESCTRIntrinsics, false);
a9b3c1984a01 8143925: Enhancing CounterMode.crypt() for AES
kvn
parents: 35148
diff changeset
   784
        }
a9b3c1984a01 8143925: Enhancing CounterMode.crypt() for AES
kvn
parents: 35148
diff changeset
   785
      } else {
39256
ac12f57c6d9c 8158214: Crash with "assert(VM_Version::supports_sse4_1()) failed" if UseSSE < 4 is set
thartmann
parents: 38135
diff changeset
   786
        if(supports_sse4_1()) {
35154
a9b3c1984a01 8143925: Enhancing CounterMode.crypt() for AES
kvn
parents: 35148
diff changeset
   787
          if (FLAG_IS_DEFAULT(UseAESCTRIntrinsics)) {
a9b3c1984a01 8143925: Enhancing CounterMode.crypt() for AES
kvn
parents: 35148
diff changeset
   788
            FLAG_SET_DEFAULT(UseAESCTRIntrinsics, true);
a9b3c1984a01 8143925: Enhancing CounterMode.crypt() for AES
kvn
parents: 35148
diff changeset
   789
          }
a9b3c1984a01 8143925: Enhancing CounterMode.crypt() for AES
kvn
parents: 35148
diff changeset
   790
        } else {
a9b3c1984a01 8143925: Enhancing CounterMode.crypt() for AES
kvn
parents: 35148
diff changeset
   791
           // The AES-CTR intrinsic stubs require AES instruction support (of course)
a9b3c1984a01 8143925: Enhancing CounterMode.crypt() for AES
kvn
parents: 35148
diff changeset
   792
           // but also require sse4.1 mode or higher for instructions it use.
a9b3c1984a01 8143925: Enhancing CounterMode.crypt() for AES
kvn
parents: 35148
diff changeset
   793
          if (UseAESCTRIntrinsics && !FLAG_IS_DEFAULT(UseAESCTRIntrinsics)) {
a9b3c1984a01 8143925: Enhancing CounterMode.crypt() for AES
kvn
parents: 35148
diff changeset
   794
             warning("X86 AES-CTR intrinsics require SSE4.1 instructions or higher. Intrinsics will be disabled.");
a9b3c1984a01 8143925: Enhancing CounterMode.crypt() for AES
kvn
parents: 35148
diff changeset
   795
           }
a9b3c1984a01 8143925: Enhancing CounterMode.crypt() for AES
kvn
parents: 35148
diff changeset
   796
           FLAG_SET_DEFAULT(UseAESCTRIntrinsics, false);
a9b3c1984a01 8143925: Enhancing CounterMode.crypt() for AES
kvn
parents: 35148
diff changeset
   797
        }
a9b3c1984a01 8143925: Enhancing CounterMode.crypt() for AES
kvn
parents: 35148
diff changeset
   798
      }
a9b3c1984a01 8143925: Enhancing CounterMode.crypt() for AES
kvn
parents: 35148
diff changeset
   799
      // --AES-CTR ends--
34176
c1b52e665b47 8131778: java disables UseAES flag when using VIS=2 on sparc
kshefov
parents: 34162
diff changeset
   800
    }
35537
bed5e2dc57a1 8146581: Minor corrections to the patch submitted for earlier bug id - 8143925
kvn
parents: 35154
diff changeset
   801
  } else if (UseAES || UseAESIntrinsics || UseAESCTRIntrinsics) {
34176
c1b52e665b47 8131778: java disables UseAES flag when using VIS=2 on sparc
kshefov
parents: 34162
diff changeset
   802
    if (UseAES && !FLAG_IS_DEFAULT(UseAES)) {
23491
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
   803
      warning("AES instructions are not available on this CPU");
34176
c1b52e665b47 8131778: java disables UseAES flag when using VIS=2 on sparc
kshefov
parents: 34162
diff changeset
   804
      FLAG_SET_DEFAULT(UseAES, false);
c1b52e665b47 8131778: java disables UseAES flag when using VIS=2 on sparc
kshefov
parents: 34162
diff changeset
   805
    }
c1b52e665b47 8131778: java disables UseAES flag when using VIS=2 on sparc
kshefov
parents: 34162
diff changeset
   806
    if (UseAESIntrinsics && !FLAG_IS_DEFAULT(UseAESIntrinsics)) {
c1b52e665b47 8131778: java disables UseAES flag when using VIS=2 on sparc
kshefov
parents: 34162
diff changeset
   807
      warning("AES intrinsics are not available on this CPU");
c1b52e665b47 8131778: java disables UseAES flag when using VIS=2 on sparc
kshefov
parents: 34162
diff changeset
   808
      FLAG_SET_DEFAULT(UseAESIntrinsics, false);
c1b52e665b47 8131778: java disables UseAES flag when using VIS=2 on sparc
kshefov
parents: 34162
diff changeset
   809
    }
35154
a9b3c1984a01 8143925: Enhancing CounterMode.crypt() for AES
kvn
parents: 35148
diff changeset
   810
    if (UseAESCTRIntrinsics && !FLAG_IS_DEFAULT(UseAESCTRIntrinsics)) {
a9b3c1984a01 8143925: Enhancing CounterMode.crypt() for AES
kvn
parents: 35148
diff changeset
   811
      warning("AES-CTR intrinsics are not available on this CPU");
a9b3c1984a01 8143925: Enhancing CounterMode.crypt() for AES
kvn
parents: 35148
diff changeset
   812
      FLAG_SET_DEFAULT(UseAESCTRIntrinsics, false);
a9b3c1984a01 8143925: Enhancing CounterMode.crypt() for AES
kvn
parents: 35148
diff changeset
   813
    }
14132
3c1437abcefd 7184394: add intrinsics to use AES instructions
kvn
parents: 13886
diff changeset
   814
  }
3c1437abcefd 7184394: add intrinsics to use AES instructions
kvn
parents: 13886
diff changeset
   815
18507
61bfc8995bb3 7088419: Use x86 Hardware CRC32 Instruction with java.util.zip.CRC32
drchase
parents: 15243
diff changeset
   816
  // Use CLMUL instructions if available.
61bfc8995bb3 7088419: Use x86 Hardware CRC32 Instruction with java.util.zip.CRC32
drchase
parents: 15243
diff changeset
   817
  if (supports_clmul()) {
61bfc8995bb3 7088419: Use x86 Hardware CRC32 Instruction with java.util.zip.CRC32
drchase
parents: 15243
diff changeset
   818
    if (FLAG_IS_DEFAULT(UseCLMUL)) {
61bfc8995bb3 7088419: Use x86 Hardware CRC32 Instruction with java.util.zip.CRC32
drchase
parents: 15243
diff changeset
   819
      UseCLMUL = true;
61bfc8995bb3 7088419: Use x86 Hardware CRC32 Instruction with java.util.zip.CRC32
drchase
parents: 15243
diff changeset
   820
    }
61bfc8995bb3 7088419: Use x86 Hardware CRC32 Instruction with java.util.zip.CRC32
drchase
parents: 15243
diff changeset
   821
  } else if (UseCLMUL) {
61bfc8995bb3 7088419: Use x86 Hardware CRC32 Instruction with java.util.zip.CRC32
drchase
parents: 15243
diff changeset
   822
    if (!FLAG_IS_DEFAULT(UseCLMUL))
61bfc8995bb3 7088419: Use x86 Hardware CRC32 Instruction with java.util.zip.CRC32
drchase
parents: 15243
diff changeset
   823
      warning("CLMUL instructions not available on this CPU (AVX may also be required)");
61bfc8995bb3 7088419: Use x86 Hardware CRC32 Instruction with java.util.zip.CRC32
drchase
parents: 15243
diff changeset
   824
    FLAG_SET_DEFAULT(UseCLMUL, false);
61bfc8995bb3 7088419: Use x86 Hardware CRC32 Instruction with java.util.zip.CRC32
drchase
parents: 15243
diff changeset
   825
  }
61bfc8995bb3 7088419: Use x86 Hardware CRC32 Instruction with java.util.zip.CRC32
drchase
parents: 15243
diff changeset
   826
25932
15d133edd8f6 8052081: Optimize generated by C2 code for Intel's Atom processor
kvn
parents: 25633
diff changeset
   827
  if (UseCLMUL && (UseSSE > 2)) {
18507
61bfc8995bb3 7088419: Use x86 Hardware CRC32 Instruction with java.util.zip.CRC32
drchase
parents: 15243
diff changeset
   828
    if (FLAG_IS_DEFAULT(UseCRC32Intrinsics)) {
61bfc8995bb3 7088419: Use x86 Hardware CRC32 Instruction with java.util.zip.CRC32
drchase
parents: 15243
diff changeset
   829
      UseCRC32Intrinsics = true;
61bfc8995bb3 7088419: Use x86 Hardware CRC32 Instruction with java.util.zip.CRC32
drchase
parents: 15243
diff changeset
   830
    }
61bfc8995bb3 7088419: Use x86 Hardware CRC32 Instruction with java.util.zip.CRC32
drchase
parents: 15243
diff changeset
   831
  } else if (UseCRC32Intrinsics) {
61bfc8995bb3 7088419: Use x86 Hardware CRC32 Instruction with java.util.zip.CRC32
drchase
parents: 15243
diff changeset
   832
    if (!FLAG_IS_DEFAULT(UseCRC32Intrinsics))
26434
09ad55e5f486 8055494: Add C2 x86 intrinsic for BigInteger::multiplyToLen() method
kvn
parents: 26306
diff changeset
   833
      warning("CRC32 Intrinsics requires CLMUL instructions (not available on this CPU)");
18507
61bfc8995bb3 7088419: Use x86 Hardware CRC32 Instruction with java.util.zip.CRC32
drchase
parents: 15243
diff changeset
   834
    FLAG_SET_DEFAULT(UseCRC32Intrinsics, false);
61bfc8995bb3 7088419: Use x86 Hardware CRC32 Instruction with java.util.zip.CRC32
drchase
parents: 15243
diff changeset
   835
  }
61bfc8995bb3 7088419: Use x86 Hardware CRC32 Instruction with java.util.zip.CRC32
drchase
parents: 15243
diff changeset
   836
44737
d090627aedb8 8178723: Workaround for failure of CRC32C intrinsic on x86 machines without CLMUL support (JDK-8178720)
zmajo
parents: 43936
diff changeset
   837
  if (supports_sse4_2() && supports_clmul()) {
33066
d98eab8215c4 8134553: CRC32C implementations for x86/x64 targets
kvn
parents: 32727
diff changeset
   838
    if (FLAG_IS_DEFAULT(UseCRC32CIntrinsics)) {
d98eab8215c4 8134553: CRC32C implementations for x86/x64 targets
kvn
parents: 32727
diff changeset
   839
      UseCRC32CIntrinsics = true;
d98eab8215c4 8134553: CRC32C implementations for x86/x64 targets
kvn
parents: 32727
diff changeset
   840
    }
44737
d090627aedb8 8178723: Workaround for failure of CRC32C intrinsic on x86 machines without CLMUL support (JDK-8178720)
zmajo
parents: 43936
diff changeset
   841
  } else if (UseCRC32CIntrinsics) {
33066
d98eab8215c4 8134553: CRC32C implementations for x86/x64 targets
kvn
parents: 32727
diff changeset
   842
    if (!FLAG_IS_DEFAULT(UseCRC32CIntrinsics)) {
d98eab8215c4 8134553: CRC32C implementations for x86/x64 targets
kvn
parents: 32727
diff changeset
   843
      warning("CRC32C intrinsics are not available on this CPU");
d98eab8215c4 8134553: CRC32C implementations for x86/x64 targets
kvn
parents: 32727
diff changeset
   844
    }
d98eab8215c4 8134553: CRC32C implementations for x86/x64 targets
kvn
parents: 32727
diff changeset
   845
    FLAG_SET_DEFAULT(UseCRC32CIntrinsics, false);
d98eab8215c4 8134553: CRC32C implementations for x86/x64 targets
kvn
parents: 32727
diff changeset
   846
  }
d98eab8215c4 8134553: CRC32C implementations for x86/x64 targets
kvn
parents: 32727
diff changeset
   847
31404
63e8fcd70bfc 8073108: Use x86 and SPARC CPU instructions for GHASH acceleration
ascarpino
parents: 31129
diff changeset
   848
  // GHASH/GCM intrinsics
63e8fcd70bfc 8073108: Use x86 and SPARC CPU instructions for GHASH acceleration
ascarpino
parents: 31129
diff changeset
   849
  if (UseCLMUL && (UseSSE > 2)) {
63e8fcd70bfc 8073108: Use x86 and SPARC CPU instructions for GHASH acceleration
ascarpino
parents: 31129
diff changeset
   850
    if (FLAG_IS_DEFAULT(UseGHASHIntrinsics)) {
63e8fcd70bfc 8073108: Use x86 and SPARC CPU instructions for GHASH acceleration
ascarpino
parents: 31129
diff changeset
   851
      UseGHASHIntrinsics = true;
63e8fcd70bfc 8073108: Use x86 and SPARC CPU instructions for GHASH acceleration
ascarpino
parents: 31129
diff changeset
   852
    }
63e8fcd70bfc 8073108: Use x86 and SPARC CPU instructions for GHASH acceleration
ascarpino
parents: 31129
diff changeset
   853
  } else if (UseGHASHIntrinsics) {
63e8fcd70bfc 8073108: Use x86 and SPARC CPU instructions for GHASH acceleration
ascarpino
parents: 31129
diff changeset
   854
    if (!FLAG_IS_DEFAULT(UseGHASHIntrinsics))
63e8fcd70bfc 8073108: Use x86 and SPARC CPU instructions for GHASH acceleration
ascarpino
parents: 31129
diff changeset
   855
      warning("GHASH intrinsic requires CLMUL and SSE2 instructions on this CPU");
63e8fcd70bfc 8073108: Use x86 and SPARC CPU instructions for GHASH acceleration
ascarpino
parents: 31129
diff changeset
   856
    FLAG_SET_DEFAULT(UseGHASHIntrinsics, false);
63e8fcd70bfc 8073108: Use x86 and SPARC CPU instructions for GHASH acceleration
ascarpino
parents: 31129
diff changeset
   857
  }
63e8fcd70bfc 8073108: Use x86 and SPARC CPU instructions for GHASH acceleration
ascarpino
parents: 31129
diff changeset
   858
50860
480a96a43b62 8205528: Base64 encoding algorithm using AVX512 instructions
kvn
parents: 50699
diff changeset
   859
  // Base64 Intrinsics (Check the condition for which the intrinsic will be active)
480a96a43b62 8205528: Base64 encoding algorithm using AVX512 instructions
kvn
parents: 50699
diff changeset
   860
  if ((UseAVX > 2) && supports_avx512vl() && supports_avx512bw()) {
480a96a43b62 8205528: Base64 encoding algorithm using AVX512 instructions
kvn
parents: 50699
diff changeset
   861
    if (FLAG_IS_DEFAULT(UseBASE64Intrinsics)) {
480a96a43b62 8205528: Base64 encoding algorithm using AVX512 instructions
kvn
parents: 50699
diff changeset
   862
      UseBASE64Intrinsics = true;
480a96a43b62 8205528: Base64 encoding algorithm using AVX512 instructions
kvn
parents: 50699
diff changeset
   863
    }
480a96a43b62 8205528: Base64 encoding algorithm using AVX512 instructions
kvn
parents: 50699
diff changeset
   864
  } else if (UseBASE64Intrinsics) {
480a96a43b62 8205528: Base64 encoding algorithm using AVX512 instructions
kvn
parents: 50699
diff changeset
   865
     if (!FLAG_IS_DEFAULT(UseBASE64Intrinsics))
480a96a43b62 8205528: Base64 encoding algorithm using AVX512 instructions
kvn
parents: 50699
diff changeset
   866
      warning("Base64 intrinsic requires EVEX instructions on this CPU");
480a96a43b62 8205528: Base64 encoding algorithm using AVX512 instructions
kvn
parents: 50699
diff changeset
   867
    FLAG_SET_DEFAULT(UseBASE64Intrinsics, false);
480a96a43b62 8205528: Base64 encoding algorithm using AVX512 instructions
kvn
parents: 50699
diff changeset
   868
  }
480a96a43b62 8205528: Base64 encoding algorithm using AVX512 instructions
kvn
parents: 50699
diff changeset
   869
46546
4dba7f5446f3 8182114: assert(VM_Version::supports_sse()) failed
kvn
parents: 46528
diff changeset
   870
  if (supports_fma() && UseSSE >= 2) { // Check UseSSE since FMA code uses SSE instructions
41323
ddd5600d4762 8154122: Intrinsify fused mac operations
vdeshpande
parents: 39256
diff changeset
   871
    if (FLAG_IS_DEFAULT(UseFMA)) {
ddd5600d4762 8154122: Intrinsify fused mac operations
vdeshpande
parents: 39256
diff changeset
   872
      UseFMA = true;
ddd5600d4762 8154122: Intrinsify fused mac operations
vdeshpande
parents: 39256
diff changeset
   873
    }
ddd5600d4762 8154122: Intrinsify fused mac operations
vdeshpande
parents: 39256
diff changeset
   874
  } else if (UseFMA) {
ddd5600d4762 8154122: Intrinsify fused mac operations
vdeshpande
parents: 39256
diff changeset
   875
    warning("FMA instructions are not available on this CPU");
ddd5600d4762 8154122: Intrinsify fused mac operations
vdeshpande
parents: 39256
diff changeset
   876
    FLAG_SET_DEFAULT(UseFMA, false);
ddd5600d4762 8154122: Intrinsify fused mac operations
vdeshpande
parents: 39256
diff changeset
   877
  }
ddd5600d4762 8154122: Intrinsify fused mac operations
vdeshpande
parents: 39256
diff changeset
   878
38135
e06e2d071465 8154495: SHA256 AVX2 intrinsic (when no supports_sha() available)
jcivlin
parents: 37430
diff changeset
   879
  if (supports_sha() LP64_ONLY(|| supports_avx2() && supports_bmi2())) {
36555
4f37fd7a5a09 8150767: Enables SHA Extensions on x86
vdeshpande
parents: 35751
diff changeset
   880
    if (FLAG_IS_DEFAULT(UseSHA)) {
4f37fd7a5a09 8150767: Enables SHA Extensions on x86
vdeshpande
parents: 35751
diff changeset
   881
      UseSHA = true;
4f37fd7a5a09 8150767: Enables SHA Extensions on x86
vdeshpande
parents: 35751
diff changeset
   882
    }
4f37fd7a5a09 8150767: Enables SHA Extensions on x86
vdeshpande
parents: 35751
diff changeset
   883
  } else if (UseSHA) {
24953
9680119572be 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 24424
diff changeset
   884
    warning("SHA instructions are not available on this CPU");
9680119572be 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 24424
diff changeset
   885
    FLAG_SET_DEFAULT(UseSHA, false);
9680119572be 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 24424
diff changeset
   886
  }
31588
2a864a4a414c 8130120: Handling of SHA intrinsics inconsistent across platforms
zmajo
parents: 31584
diff changeset
   887
51868
92960b0e6191 8211061: Tests fail with assert(VM_Version::supports_sse4_1()) on ThreadRipper CPU
rkennke
parents: 51857
diff changeset
   888
  if (supports_sha() && supports_sse4_1() && UseSHA) {
36555
4f37fd7a5a09 8150767: Enables SHA Extensions on x86
vdeshpande
parents: 35751
diff changeset
   889
    if (FLAG_IS_DEFAULT(UseSHA1Intrinsics)) {
4f37fd7a5a09 8150767: Enables SHA Extensions on x86
vdeshpande
parents: 35751
diff changeset
   890
      FLAG_SET_DEFAULT(UseSHA1Intrinsics, true);
4f37fd7a5a09 8150767: Enables SHA Extensions on x86
vdeshpande
parents: 35751
diff changeset
   891
    }
4f37fd7a5a09 8150767: Enables SHA Extensions on x86
vdeshpande
parents: 35751
diff changeset
   892
  } else if (UseSHA1Intrinsics) {
31588
2a864a4a414c 8130120: Handling of SHA intrinsics inconsistent across platforms
zmajo
parents: 31584
diff changeset
   893
    warning("Intrinsics for SHA-1 crypto hash functions not available on this CPU.");
24953
9680119572be 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 24424
diff changeset
   894
    FLAG_SET_DEFAULT(UseSHA1Intrinsics, false);
31588
2a864a4a414c 8130120: Handling of SHA intrinsics inconsistent across platforms
zmajo
parents: 31584
diff changeset
   895
  }
2a864a4a414c 8130120: Handling of SHA intrinsics inconsistent across platforms
zmajo
parents: 31584
diff changeset
   896
51868
92960b0e6191 8211061: Tests fail with assert(VM_Version::supports_sse4_1()) on ThreadRipper CPU
rkennke
parents: 51857
diff changeset
   897
  if (supports_sse4_1() && UseSHA) {
36555
4f37fd7a5a09 8150767: Enables SHA Extensions on x86
vdeshpande
parents: 35751
diff changeset
   898
    if (FLAG_IS_DEFAULT(UseSHA256Intrinsics)) {
4f37fd7a5a09 8150767: Enables SHA Extensions on x86
vdeshpande
parents: 35751
diff changeset
   899
      FLAG_SET_DEFAULT(UseSHA256Intrinsics, true);
4f37fd7a5a09 8150767: Enables SHA Extensions on x86
vdeshpande
parents: 35751
diff changeset
   900
    }
4f37fd7a5a09 8150767: Enables SHA Extensions on x86
vdeshpande
parents: 35751
diff changeset
   901
  } else if (UseSHA256Intrinsics) {
31588
2a864a4a414c 8130120: Handling of SHA intrinsics inconsistent across platforms
zmajo
parents: 31584
diff changeset
   902
    warning("Intrinsics for SHA-224 and SHA-256 crypto hash functions not available on this CPU.");
24953
9680119572be 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 24424
diff changeset
   903
    FLAG_SET_DEFAULT(UseSHA256Intrinsics, false);
31588
2a864a4a414c 8130120: Handling of SHA intrinsics inconsistent across platforms
zmajo
parents: 31584
diff changeset
   904
  }
2a864a4a414c 8130120: Handling of SHA intrinsics inconsistent across platforms
zmajo
parents: 31584
diff changeset
   905
48444
a97a26eb896f 8194494: SHA-512 stub uses AVX 2 instructions on non-supporting CPUs
thartmann
parents: 48195
diff changeset
   906
  if (UseSHA && supports_avx2() && supports_bmi2()) {
42039
db627462f2c9 8165381: Update for x86 SHA512 using AVX2
kvn
parents: 41323
diff changeset
   907
    if (FLAG_IS_DEFAULT(UseSHA512Intrinsics)) {
db627462f2c9 8165381: Update for x86 SHA512 using AVX2
kvn
parents: 41323
diff changeset
   908
      FLAG_SET_DEFAULT(UseSHA512Intrinsics, true);
db627462f2c9 8165381: Update for x86 SHA512 using AVX2
kvn
parents: 41323
diff changeset
   909
    }
db627462f2c9 8165381: Update for x86 SHA512 using AVX2
kvn
parents: 41323
diff changeset
   910
  } else if (UseSHA512Intrinsics) {
31588
2a864a4a414c 8130120: Handling of SHA intrinsics inconsistent across platforms
zmajo
parents: 31584
diff changeset
   911
    warning("Intrinsics for SHA-384 and SHA-512 crypto hash functions not available on this CPU.");
24953
9680119572be 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 24424
diff changeset
   912
    FLAG_SET_DEFAULT(UseSHA512Intrinsics, false);
9680119572be 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 24424
diff changeset
   913
  }
9680119572be 8035968: Leverage CPU Instructions to Improve SHA Performance on SPARC
kvn
parents: 24424
diff changeset
   914
36555
4f37fd7a5a09 8150767: Enables SHA Extensions on x86
vdeshpande
parents: 35751
diff changeset
   915
  if (!(UseSHA1Intrinsics || UseSHA256Intrinsics || UseSHA512Intrinsics)) {
4f37fd7a5a09 8150767: Enables SHA Extensions on x86
vdeshpande
parents: 35751
diff changeset
   916
    FLAG_SET_DEFAULT(UseSHA, false);
4f37fd7a5a09 8150767: Enables SHA Extensions on x86
vdeshpande
parents: 35751
diff changeset
   917
  }
4f37fd7a5a09 8150767: Enables SHA Extensions on x86
vdeshpande
parents: 35751
diff changeset
   918
32581
632402f18fe6 8132081: C2 support for Adler32 on SPARC
kvn
parents: 31588
diff changeset
   919
  if (UseAdler32Intrinsics) {
632402f18fe6 8132081: C2 support for Adler32 on SPARC
kvn
parents: 31588
diff changeset
   920
    warning("Adler32Intrinsics not available on this CPU.");
632402f18fe6 8132081: C2 support for Adler32 on SPARC
kvn
parents: 31588
diff changeset
   921
    FLAG_SET_DEFAULT(UseAdler32Intrinsics, false);
632402f18fe6 8132081: C2 support for Adler32 on SPARC
kvn
parents: 31588
diff changeset
   922
  }
632402f18fe6 8132081: C2 support for Adler32 on SPARC
kvn
parents: 31588
diff changeset
   923
23491
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
   924
  if (!supports_rtm() && UseRTMLocking) {
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
   925
    // Can't continue because UseRTMLocking affects UseBiasedLocking flag
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
   926
    // setting during arguments processing. See use_biased_locking().
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
   927
    // VM_Version_init() is executed after UseBiasedLocking is used
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
   928
    // in Thread::allocate().
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
   929
    vm_exit_during_initialization("RTM instructions are not available on this CPU");
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
   930
  }
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
   931
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
   932
#if INCLUDE_RTM_OPT
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
   933
  if (UseRTMLocking) {
43936
093cd5bea2e2 8173679: Disable ProfileTrap code and UseRTMLocking in emulated client Win32
jcm
parents: 42586
diff changeset
   934
    if (is_client_compilation_mode_vm()) {
093cd5bea2e2 8173679: Disable ProfileTrap code and UseRTMLocking in emulated client Win32
jcm
parents: 42586
diff changeset
   935
      // Only C2 does RTM locking optimization.
093cd5bea2e2 8173679: Disable ProfileTrap code and UseRTMLocking in emulated client Win32
jcm
parents: 42586
diff changeset
   936
      // Can't continue because UseRTMLocking affects UseBiasedLocking flag
093cd5bea2e2 8173679: Disable ProfileTrap code and UseRTMLocking in emulated client Win32
jcm
parents: 42586
diff changeset
   937
      // setting during arguments processing. See use_biased_locking().
50261
3fd701692627 8184030: TestUseRTMLockingOptionOnUnsupportedVM - RTM locking optimization not supported is missing
jcm
parents: 49614
diff changeset
   938
      vm_exit_during_initialization("RTM locking optimization is not supported in this VM");
43936
093cd5bea2e2 8173679: Disable ProfileTrap code and UseRTMLocking in emulated client Win32
jcm
parents: 42586
diff changeset
   939
    }
26306
2b4cf8eb3de7 8055069: TSX and RTM should be deprecated more strongly until hardware is corrected
kvn
parents: 25949
diff changeset
   940
    if (is_intel_family_core()) {
2b4cf8eb3de7 8055069: TSX and RTM should be deprecated more strongly until hardware is corrected
kvn
parents: 25949
diff changeset
   941
      if ((_model == CPU_MODEL_HASWELL_E3) ||
2b4cf8eb3de7 8055069: TSX and RTM should be deprecated more strongly until hardware is corrected
kvn
parents: 25949
diff changeset
   942
          (_model == CPU_MODEL_HASWELL_E7 && _stepping < 3) ||
2b4cf8eb3de7 8055069: TSX and RTM should be deprecated more strongly until hardware is corrected
kvn
parents: 25949
diff changeset
   943
          (_model == CPU_MODEL_BROADWELL  && _stepping < 4)) {
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   944
        // currently a collision between SKL and HSW_E3
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   945
        if (!UnlockExperimentalVMOptions && UseAVX < 3) {
46698
fa625dca9270 8184800: Streamline RTM flag validity testing with generic flag testing support
goetz
parents: 46630
diff changeset
   946
          vm_exit_during_initialization("UseRTMLocking is only available as experimental option on this "
fa625dca9270 8184800: Streamline RTM flag validity testing with generic flag testing support
goetz
parents: 46630
diff changeset
   947
                                        "platform. It must be enabled via -XX:+UnlockExperimentalVMOptions flag.");
26306
2b4cf8eb3de7 8055069: TSX and RTM should be deprecated more strongly until hardware is corrected
kvn
parents: 25949
diff changeset
   948
        } else {
2b4cf8eb3de7 8055069: TSX and RTM should be deprecated more strongly until hardware is corrected
kvn
parents: 25949
diff changeset
   949
          warning("UseRTMLocking is only available as experimental option on this platform.");
2b4cf8eb3de7 8055069: TSX and RTM should be deprecated more strongly until hardware is corrected
kvn
parents: 25949
diff changeset
   950
        }
2b4cf8eb3de7 8055069: TSX and RTM should be deprecated more strongly until hardware is corrected
kvn
parents: 25949
diff changeset
   951
      }
2b4cf8eb3de7 8055069: TSX and RTM should be deprecated more strongly until hardware is corrected
kvn
parents: 25949
diff changeset
   952
    }
23491
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
   953
    if (!FLAG_IS_CMDLINE(UseRTMLocking)) {
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
   954
      // RTM locking should be used only for applications with
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
   955
      // high lock contention. For now we do not use it by default.
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
   956
      vm_exit_during_initialization("UseRTMLocking flag should be only set on command line");
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
   957
    }
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
   958
  } else { // !UseRTMLocking
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
   959
    if (UseRTMForStackLocks) {
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
   960
      if (!FLAG_IS_DEFAULT(UseRTMForStackLocks)) {
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
   961
        warning("UseRTMForStackLocks flag should be off when UseRTMLocking flag is off");
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
   962
      }
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
   963
      FLAG_SET_DEFAULT(UseRTMForStackLocks, false);
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
   964
    }
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
   965
    if (UseRTMDeopt) {
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
   966
      FLAG_SET_DEFAULT(UseRTMDeopt, false);
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
   967
    }
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
   968
    if (PrintPreciseRTMLockingStatistics) {
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
   969
      FLAG_SET_DEFAULT(PrintPreciseRTMLockingStatistics, false);
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
   970
    }
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
   971
  }
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
   972
#else
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
   973
  if (UseRTMLocking) {
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
   974
    // Only C2 does RTM locking optimization.
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
   975
    // Can't continue because UseRTMLocking affects UseBiasedLocking flag
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
   976
    // setting during arguments processing. See use_biased_locking().
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
   977
    vm_exit_during_initialization("RTM locking optimization is not supported in this VM");
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
   978
  }
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
   979
#endif
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
   980
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11881
diff changeset
   981
#ifdef COMPILER2
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11881
diff changeset
   982
  if (UseFPUForSpilling) {
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11881
diff changeset
   983
    if (UseSSE < 2) {
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11881
diff changeset
   984
      // Only supported with SSE2+
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11881
diff changeset
   985
      FLAG_SET_DEFAULT(UseFPUForSpilling, false);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11881
diff changeset
   986
    }
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11881
diff changeset
   987
  }
33160
c59f1676d27e 8136421: JEP 243: Java-Level JVM Compiler Interface
twisti
parents: 33066
diff changeset
   988
#endif
47799
1772ebf07d1f 8152470: Add COMPILER2_OR_JVMCI definition
jcm
parents: 47765
diff changeset
   989
#if COMPILER2_OR_JVMCI
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11881
diff changeset
   990
  if (MaxVectorSize > 0) {
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11881
diff changeset
   991
    if (!is_power_of_2(MaxVectorSize)) {
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11881
diff changeset
   992
      warning("MaxVectorSize must be a power of 2");
30624
2e1803c8a26d 8076276: Add support for AVX512
kvn
parents: 30227
diff changeset
   993
      FLAG_SET_DEFAULT(MaxVectorSize, 64);
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11881
diff changeset
   994
    }
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11881
diff changeset
   995
    if (UseSSE < 2) {
23487
0f7e268cd9e3 8037226: compiler/7196199/Test7196199.java fails on 32-bit linux with MaxVectorSize > 16
kvn
parents: 23220
diff changeset
   996
      // Vectors (in XMM) are only supported with SSE2+
46440
61025eecb743 8178811: Minimize the AVX <-> SSE transition penalty through generation of vzeroupper instruction on x86
vdeshpande
parents: 43936
diff changeset
   997
      if (MaxVectorSize > 0) {
61025eecb743 8178811: Minimize the AVX <-> SSE transition penalty through generation of vzeroupper instruction on x86
vdeshpande
parents: 43936
diff changeset
   998
        if (!FLAG_IS_DEFAULT(MaxVectorSize))
61025eecb743 8178811: Minimize the AVX <-> SSE transition penalty through generation of vzeroupper instruction on x86
vdeshpande
parents: 43936
diff changeset
   999
          warning("MaxVectorSize must be 0");
61025eecb743 8178811: Minimize the AVX <-> SSE transition penalty through generation of vzeroupper instruction on x86
vdeshpande
parents: 43936
diff changeset
  1000
        FLAG_SET_DEFAULT(MaxVectorSize, 0);
61025eecb743 8178811: Minimize the AVX <-> SSE transition penalty through generation of vzeroupper instruction on x86
vdeshpande
parents: 43936
diff changeset
  1001
      }
61025eecb743 8178811: Minimize the AVX <-> SSE transition penalty through generation of vzeroupper instruction on x86
vdeshpande
parents: 43936
diff changeset
  1002
    }
61025eecb743 8178811: Minimize the AVX <-> SSE transition penalty through generation of vzeroupper instruction on x86
vdeshpande
parents: 43936
diff changeset
  1003
    else if (UseAVX == 0 || !os_supports_avx_vectors()) {
61025eecb743 8178811: Minimize the AVX <-> SSE transition penalty through generation of vzeroupper instruction on x86
vdeshpande
parents: 43936
diff changeset
  1004
      // 32 bytes vectors (in YMM) are only supported with AVX+
61025eecb743 8178811: Minimize the AVX <-> SSE transition penalty through generation of vzeroupper instruction on x86
vdeshpande
parents: 43936
diff changeset
  1005
      if (MaxVectorSize > 16) {
61025eecb743 8178811: Minimize the AVX <-> SSE transition penalty through generation of vzeroupper instruction on x86
vdeshpande
parents: 43936
diff changeset
  1006
        if (!FLAG_IS_DEFAULT(MaxVectorSize))
61025eecb743 8178811: Minimize the AVX <-> SSE transition penalty through generation of vzeroupper instruction on x86
vdeshpande
parents: 43936
diff changeset
  1007
          warning("MaxVectorSize must be <= 16");
61025eecb743 8178811: Minimize the AVX <-> SSE transition penalty through generation of vzeroupper instruction on x86
vdeshpande
parents: 43936
diff changeset
  1008
        FLAG_SET_DEFAULT(MaxVectorSize, 16);
61025eecb743 8178811: Minimize the AVX <-> SSE transition penalty through generation of vzeroupper instruction on x86
vdeshpande
parents: 43936
diff changeset
  1009
      }
61025eecb743 8178811: Minimize the AVX <-> SSE transition penalty through generation of vzeroupper instruction on x86
vdeshpande
parents: 43936
diff changeset
  1010
    }
61025eecb743 8178811: Minimize the AVX <-> SSE transition penalty through generation of vzeroupper instruction on x86
vdeshpande
parents: 43936
diff changeset
  1011
    else if (UseAVX == 1 || UseAVX == 2) {
61025eecb743 8178811: Minimize the AVX <-> SSE transition penalty through generation of vzeroupper instruction on x86
vdeshpande
parents: 43936
diff changeset
  1012
      // 64 bytes vectors (in ZMM) are only supported with AVX 3
61025eecb743 8178811: Minimize the AVX <-> SSE transition penalty through generation of vzeroupper instruction on x86
vdeshpande
parents: 43936
diff changeset
  1013
      if (MaxVectorSize > 32) {
61025eecb743 8178811: Minimize the AVX <-> SSE transition penalty through generation of vzeroupper instruction on x86
vdeshpande
parents: 43936
diff changeset
  1014
        if (!FLAG_IS_DEFAULT(MaxVectorSize))
61025eecb743 8178811: Minimize the AVX <-> SSE transition penalty through generation of vzeroupper instruction on x86
vdeshpande
parents: 43936
diff changeset
  1015
          warning("MaxVectorSize must be <= 32");
61025eecb743 8178811: Minimize the AVX <-> SSE transition penalty through generation of vzeroupper instruction on x86
vdeshpande
parents: 43936
diff changeset
  1016
        FLAG_SET_DEFAULT(MaxVectorSize, 32);
61025eecb743 8178811: Minimize the AVX <-> SSE transition penalty through generation of vzeroupper instruction on x86
vdeshpande
parents: 43936
diff changeset
  1017
      }
61025eecb743 8178811: Minimize the AVX <-> SSE transition penalty through generation of vzeroupper instruction on x86
vdeshpande
parents: 43936
diff changeset
  1018
    }
61025eecb743 8178811: Minimize the AVX <-> SSE transition penalty through generation of vzeroupper instruction on x86
vdeshpande
parents: 43936
diff changeset
  1019
    else if (UseAVX > 2 ) {
61025eecb743 8178811: Minimize the AVX <-> SSE transition penalty through generation of vzeroupper instruction on x86
vdeshpande
parents: 43936
diff changeset
  1020
      if (MaxVectorSize > 64) {
61025eecb743 8178811: Minimize the AVX <-> SSE transition penalty through generation of vzeroupper instruction on x86
vdeshpande
parents: 43936
diff changeset
  1021
        if (!FLAG_IS_DEFAULT(MaxVectorSize))
61025eecb743 8178811: Minimize the AVX <-> SSE transition penalty through generation of vzeroupper instruction on x86
vdeshpande
parents: 43936
diff changeset
  1022
          warning("MaxVectorSize must be <= 64");
61025eecb743 8178811: Minimize the AVX <-> SSE transition penalty through generation of vzeroupper instruction on x86
vdeshpande
parents: 43936
diff changeset
  1023
        FLAG_SET_DEFAULT(MaxVectorSize, 64);
61025eecb743 8178811: Minimize the AVX <-> SSE transition penalty through generation of vzeroupper instruction on x86
vdeshpande
parents: 43936
diff changeset
  1024
      }
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11881
diff changeset
  1025
    }
33160
c59f1676d27e 8136421: JEP 243: Java-Level JVM Compiler Interface
twisti
parents: 33066
diff changeset
  1026
#if defined(COMPILER2) && defined(ASSERT)
23487
0f7e268cd9e3 8037226: compiler/7196199/Test7196199.java fails on 32-bit linux with MaxVectorSize > 16
kvn
parents: 23220
diff changeset
  1027
    if (supports_avx() && PrintMiscellaneous && Verbose && TraceNewVectors) {
0f7e268cd9e3 8037226: compiler/7196199/Test7196199.java fails on 32-bit linux with MaxVectorSize > 16
kvn
parents: 23220
diff changeset
  1028
      tty->print_cr("State of YMM registers after signal handle:");
0f7e268cd9e3 8037226: compiler/7196199/Test7196199.java fails on 32-bit linux with MaxVectorSize > 16
kvn
parents: 23220
diff changeset
  1029
      int nreg = 2 LP64_ONLY(+2);
0f7e268cd9e3 8037226: compiler/7196199/Test7196199.java fails on 32-bit linux with MaxVectorSize > 16
kvn
parents: 23220
diff changeset
  1030
      const char* ymm_name[4] = {"0", "7", "8", "15"};
0f7e268cd9e3 8037226: compiler/7196199/Test7196199.java fails on 32-bit linux with MaxVectorSize > 16
kvn
parents: 23220
diff changeset
  1031
      for (int i = 0; i < nreg; i++) {
0f7e268cd9e3 8037226: compiler/7196199/Test7196199.java fails on 32-bit linux with MaxVectorSize > 16
kvn
parents: 23220
diff changeset
  1032
        tty->print("YMM%s:", ymm_name[i]);
0f7e268cd9e3 8037226: compiler/7196199/Test7196199.java fails on 32-bit linux with MaxVectorSize > 16
kvn
parents: 23220
diff changeset
  1033
        for (int j = 7; j >=0; j--) {
0f7e268cd9e3 8037226: compiler/7196199/Test7196199.java fails on 32-bit linux with MaxVectorSize > 16
kvn
parents: 23220
diff changeset
  1034
          tty->print(" %x", _cpuid_info.ymm_save[i*8 + j]);
0f7e268cd9e3 8037226: compiler/7196199/Test7196199.java fails on 32-bit linux with MaxVectorSize > 16
kvn
parents: 23220
diff changeset
  1035
        }
0f7e268cd9e3 8037226: compiler/7196199/Test7196199.java fails on 32-bit linux with MaxVectorSize > 16
kvn
parents: 23220
diff changeset
  1036
        tty->cr();
0f7e268cd9e3 8037226: compiler/7196199/Test7196199.java fails on 32-bit linux with MaxVectorSize > 16
kvn
parents: 23220
diff changeset
  1037
      }
0f7e268cd9e3 8037226: compiler/7196199/Test7196199.java fails on 32-bit linux with MaxVectorSize > 16
kvn
parents: 23220
diff changeset
  1038
    }
33160
c59f1676d27e 8136421: JEP 243: Java-Level JVM Compiler Interface
twisti
parents: 33066
diff changeset
  1039
#endif // COMPILER2 && ASSERT
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11881
diff changeset
  1040
  }
47799
1772ebf07d1f 8152470: Add COMPILER2_OR_JVMCI definition
jcm
parents: 47765
diff changeset
  1041
#endif // COMPILER2_OR_JVMCI
26434
09ad55e5f486 8055494: Add C2 x86 intrinsic for BigInteger::multiplyToLen() method
kvn
parents: 26306
diff changeset
  1042
33160
c59f1676d27e 8136421: JEP 243: Java-Level JVM Compiler Interface
twisti
parents: 33066
diff changeset
  1043
#ifdef COMPILER2
26434
09ad55e5f486 8055494: Add C2 x86 intrinsic for BigInteger::multiplyToLen() method
kvn
parents: 26306
diff changeset
  1044
#ifdef _LP64
09ad55e5f486 8055494: Add C2 x86 intrinsic for BigInteger::multiplyToLen() method
kvn
parents: 26306
diff changeset
  1045
  if (FLAG_IS_DEFAULT(UseMultiplyToLenIntrinsic)) {
09ad55e5f486 8055494: Add C2 x86 intrinsic for BigInteger::multiplyToLen() method
kvn
parents: 26306
diff changeset
  1046
    UseMultiplyToLenIntrinsic = true;
09ad55e5f486 8055494: Add C2 x86 intrinsic for BigInteger::multiplyToLen() method
kvn
parents: 26306
diff changeset
  1047
  }
31129
02ee7609f0e1 8081778: Use Intel x64 CPU instructions for RSA acceleration
kvn
parents: 30624
diff changeset
  1048
  if (FLAG_IS_DEFAULT(UseSquareToLenIntrinsic)) {
02ee7609f0e1 8081778: Use Intel x64 CPU instructions for RSA acceleration
kvn
parents: 30624
diff changeset
  1049
    UseSquareToLenIntrinsic = true;
02ee7609f0e1 8081778: Use Intel x64 CPU instructions for RSA acceleration
kvn
parents: 30624
diff changeset
  1050
  }
02ee7609f0e1 8081778: Use Intel x64 CPU instructions for RSA acceleration
kvn
parents: 30624
diff changeset
  1051
  if (FLAG_IS_DEFAULT(UseMulAddIntrinsic)) {
02ee7609f0e1 8081778: Use Intel x64 CPU instructions for RSA acceleration
kvn
parents: 30624
diff changeset
  1052
    UseMulAddIntrinsic = true;
02ee7609f0e1 8081778: Use Intel x64 CPU instructions for RSA acceleration
kvn
parents: 30624
diff changeset
  1053
  }
31583
eb5bea7b4835 8130150: Implement BigInteger.montgomeryMultiply intrinsic
aph
parents: 31129
diff changeset
  1054
  if (FLAG_IS_DEFAULT(UseMontgomeryMultiplyIntrinsic)) {
eb5bea7b4835 8130150: Implement BigInteger.montgomeryMultiply intrinsic
aph
parents: 31129
diff changeset
  1055
    UseMontgomeryMultiplyIntrinsic = true;
eb5bea7b4835 8130150: Implement BigInteger.montgomeryMultiply intrinsic
aph
parents: 31129
diff changeset
  1056
  }
eb5bea7b4835 8130150: Implement BigInteger.montgomeryMultiply intrinsic
aph
parents: 31129
diff changeset
  1057
  if (FLAG_IS_DEFAULT(UseMontgomerySquareIntrinsic)) {
eb5bea7b4835 8130150: Implement BigInteger.montgomeryMultiply intrinsic
aph
parents: 31129
diff changeset
  1058
    UseMontgomerySquareIntrinsic = true;
eb5bea7b4835 8130150: Implement BigInteger.montgomeryMultiply intrinsic
aph
parents: 31129
diff changeset
  1059
  }
26434
09ad55e5f486 8055494: Add C2 x86 intrinsic for BigInteger::multiplyToLen() method
kvn
parents: 26306
diff changeset
  1060
#else
09ad55e5f486 8055494: Add C2 x86 intrinsic for BigInteger::multiplyToLen() method
kvn
parents: 26306
diff changeset
  1061
  if (UseMultiplyToLenIntrinsic) {
09ad55e5f486 8055494: Add C2 x86 intrinsic for BigInteger::multiplyToLen() method
kvn
parents: 26306
diff changeset
  1062
    if (!FLAG_IS_DEFAULT(UseMultiplyToLenIntrinsic)) {
09ad55e5f486 8055494: Add C2 x86 intrinsic for BigInteger::multiplyToLen() method
kvn
parents: 26306
diff changeset
  1063
      warning("multiplyToLen intrinsic is not available in 32-bit VM");
09ad55e5f486 8055494: Add C2 x86 intrinsic for BigInteger::multiplyToLen() method
kvn
parents: 26306
diff changeset
  1064
    }
09ad55e5f486 8055494: Add C2 x86 intrinsic for BigInteger::multiplyToLen() method
kvn
parents: 26306
diff changeset
  1065
    FLAG_SET_DEFAULT(UseMultiplyToLenIntrinsic, false);
09ad55e5f486 8055494: Add C2 x86 intrinsic for BigInteger::multiplyToLen() method
kvn
parents: 26306
diff changeset
  1066
  }
31583
eb5bea7b4835 8130150: Implement BigInteger.montgomeryMultiply intrinsic
aph
parents: 31129
diff changeset
  1067
  if (UseMontgomeryMultiplyIntrinsic) {
eb5bea7b4835 8130150: Implement BigInteger.montgomeryMultiply intrinsic
aph
parents: 31129
diff changeset
  1068
    if (!FLAG_IS_DEFAULT(UseMontgomeryMultiplyIntrinsic)) {
eb5bea7b4835 8130150: Implement BigInteger.montgomeryMultiply intrinsic
aph
parents: 31129
diff changeset
  1069
      warning("montgomeryMultiply intrinsic is not available in 32-bit VM");
eb5bea7b4835 8130150: Implement BigInteger.montgomeryMultiply intrinsic
aph
parents: 31129
diff changeset
  1070
    }
eb5bea7b4835 8130150: Implement BigInteger.montgomeryMultiply intrinsic
aph
parents: 31129
diff changeset
  1071
    FLAG_SET_DEFAULT(UseMontgomeryMultiplyIntrinsic, false);
eb5bea7b4835 8130150: Implement BigInteger.montgomeryMultiply intrinsic
aph
parents: 31129
diff changeset
  1072
  }
eb5bea7b4835 8130150: Implement BigInteger.montgomeryMultiply intrinsic
aph
parents: 31129
diff changeset
  1073
  if (UseMontgomerySquareIntrinsic) {
eb5bea7b4835 8130150: Implement BigInteger.montgomeryMultiply intrinsic
aph
parents: 31129
diff changeset
  1074
    if (!FLAG_IS_DEFAULT(UseMontgomerySquareIntrinsic)) {
eb5bea7b4835 8130150: Implement BigInteger.montgomeryMultiply intrinsic
aph
parents: 31129
diff changeset
  1075
      warning("montgomerySquare intrinsic is not available in 32-bit VM");
eb5bea7b4835 8130150: Implement BigInteger.montgomeryMultiply intrinsic
aph
parents: 31129
diff changeset
  1076
    }
eb5bea7b4835 8130150: Implement BigInteger.montgomeryMultiply intrinsic
aph
parents: 31129
diff changeset
  1077
    FLAG_SET_DEFAULT(UseMontgomerySquareIntrinsic, false);
eb5bea7b4835 8130150: Implement BigInteger.montgomeryMultiply intrinsic
aph
parents: 31129
diff changeset
  1078
  }
31129
02ee7609f0e1 8081778: Use Intel x64 CPU instructions for RSA acceleration
kvn
parents: 30624
diff changeset
  1079
  if (UseSquareToLenIntrinsic) {
02ee7609f0e1 8081778: Use Intel x64 CPU instructions for RSA acceleration
kvn
parents: 30624
diff changeset
  1080
    if (!FLAG_IS_DEFAULT(UseSquareToLenIntrinsic)) {
02ee7609f0e1 8081778: Use Intel x64 CPU instructions for RSA acceleration
kvn
parents: 30624
diff changeset
  1081
      warning("squareToLen intrinsic is not available in 32-bit VM");
02ee7609f0e1 8081778: Use Intel x64 CPU instructions for RSA acceleration
kvn
parents: 30624
diff changeset
  1082
    }
02ee7609f0e1 8081778: Use Intel x64 CPU instructions for RSA acceleration
kvn
parents: 30624
diff changeset
  1083
    FLAG_SET_DEFAULT(UseSquareToLenIntrinsic, false);
02ee7609f0e1 8081778: Use Intel x64 CPU instructions for RSA acceleration
kvn
parents: 30624
diff changeset
  1084
  }
02ee7609f0e1 8081778: Use Intel x64 CPU instructions for RSA acceleration
kvn
parents: 30624
diff changeset
  1085
  if (UseMulAddIntrinsic) {
02ee7609f0e1 8081778: Use Intel x64 CPU instructions for RSA acceleration
kvn
parents: 30624
diff changeset
  1086
    if (!FLAG_IS_DEFAULT(UseMulAddIntrinsic)) {
02ee7609f0e1 8081778: Use Intel x64 CPU instructions for RSA acceleration
kvn
parents: 30624
diff changeset
  1087
      warning("mulAdd intrinsic is not available in 32-bit VM");
02ee7609f0e1 8081778: Use Intel x64 CPU instructions for RSA acceleration
kvn
parents: 30624
diff changeset
  1088
    }
02ee7609f0e1 8081778: Use Intel x64 CPU instructions for RSA acceleration
kvn
parents: 30624
diff changeset
  1089
    FLAG_SET_DEFAULT(UseMulAddIntrinsic, false);
02ee7609f0e1 8081778: Use Intel x64 CPU instructions for RSA acceleration
kvn
parents: 30624
diff changeset
  1090
  }
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11881
diff changeset
  1091
#endif
26434
09ad55e5f486 8055494: Add C2 x86 intrinsic for BigInteger::multiplyToLen() method
kvn
parents: 26306
diff changeset
  1092
#endif // COMPILER2
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11881
diff changeset
  1093
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1094
  // On new cpus instructions which update whole XMM register should be used
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1095
  // to prevent partial register stall due to dependencies on high half.
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1096
  //
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1097
  // UseXmmLoadAndClearUpper == true  --> movsd(xmm, mem)
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1098
  // UseXmmLoadAndClearUpper == false --> movlpd(xmm, mem)
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1099
  // UseXmmRegToRegMoveAll == true  --> movaps(xmm, xmm), movapd(xmm, xmm).
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1100
  // UseXmmRegToRegMoveAll == false --> movss(xmm, xmm),  movsd(xmm, xmm).
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1101
48489
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1102
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1103
  if (is_zx()) { // ZX cpus specific settings
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1104
    if (FLAG_IS_DEFAULT(UseStoreImmI16)) {
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1105
      UseStoreImmI16 = false; // don't use it on ZX cpus
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1106
    }
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1107
    if ((cpu_family() == 6) || (cpu_family() == 7)) {
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1108
      if (FLAG_IS_DEFAULT(UseAddressNop)) {
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1109
        // Use it on all ZX cpus
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1110
        UseAddressNop = true;
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1111
      }
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1112
    }
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1113
    if (FLAG_IS_DEFAULT(UseXmmLoadAndClearUpper)) {
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1114
      UseXmmLoadAndClearUpper = true; // use movsd on all ZX cpus
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1115
    }
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1116
    if (FLAG_IS_DEFAULT(UseXmmRegToRegMoveAll)) {
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1117
      if (supports_sse3()) {
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1118
        UseXmmRegToRegMoveAll = true; // use movaps, movapd on new ZX cpus
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1119
      } else {
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1120
        UseXmmRegToRegMoveAll = false;
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1121
      }
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1122
    }
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1123
    if (((cpu_family() == 6) || (cpu_family() == 7)) && supports_sse3()) { // new ZX cpus
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1124
#ifdef COMPILER2
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1125
      if (FLAG_IS_DEFAULT(MaxLoopPad)) {
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1126
        // For new ZX cpus do the next optimization:
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1127
        // don't align the beginning of a loop if there are enough instructions
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1128
        // left (NumberOfLoopInstrToAlign defined in c2_globals.hpp)
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1129
        // in current fetch line (OptoLoopAlignment) or the padding
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1130
        // is big (> MaxLoopPad).
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1131
        // Set MaxLoopPad to 11 for new ZX cpus to reduce number of
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1132
        // generated NOP instructions. 11 is the largest size of one
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1133
        // address NOP instruction '0F 1F' (see Assembler::nop(i)).
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1134
        MaxLoopPad = 11;
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1135
      }
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1136
#endif // COMPILER2
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1137
      if (FLAG_IS_DEFAULT(UseXMMForArrayCopy)) {
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1138
        UseXMMForArrayCopy = true; // use SSE2 movq on new ZX cpus
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1139
      }
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1140
      if (supports_sse4_2()) { // new ZX cpus
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1141
        if (FLAG_IS_DEFAULT(UseUnalignedLoadStores)) {
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1142
          UseUnalignedLoadStores = true; // use movdqu on newest ZX cpus
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1143
        }
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1144
      }
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1145
      if (supports_sse4_2()) {
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1146
        if (FLAG_IS_DEFAULT(UseSSE42Intrinsics)) {
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1147
          FLAG_SET_DEFAULT(UseSSE42Intrinsics, true);
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1148
        }
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1149
      } else {
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1150
        if (UseSSE42Intrinsics && !FLAG_IS_DEFAULT(UseAESIntrinsics)) {
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1151
          warning("SSE4.2 intrinsics require SSE4.2 instructions or higher. Intrinsics will be disabled.");
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1152
        }
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1153
        FLAG_SET_DEFAULT(UseSSE42Intrinsics, false);
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1154
      }
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1155
    }
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1156
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1157
    if (FLAG_IS_DEFAULT(AllocatePrefetchInstr) && supports_3dnow_prefetch()) {
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1158
      FLAG_SET_DEFAULT(AllocatePrefetchInstr, 3);
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1159
    }
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1160
  }
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1161
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1162
  if( is_amd() ) { // AMD cpus specific settings
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1163
    if( supports_sse2() && FLAG_IS_DEFAULT(UseAddressNop) ) {
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1164
      // Use it on new AMD cpus starting from Opteron.
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1165
      UseAddressNop = true;
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1166
    }
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1167
    if( supports_sse2() && FLAG_IS_DEFAULT(UseNewLongLShift) ) {
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1168
      // Use it on new AMD cpus starting from Opteron.
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1169
      UseNewLongLShift = true;
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1170
    }
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1171
    if( FLAG_IS_DEFAULT(UseXmmLoadAndClearUpper) ) {
34162
16b54851eaf6 8140779: Code generation fixes for avx512
iveresov
parents: 33163
diff changeset
  1172
      if (supports_sse4a()) {
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1173
        UseXmmLoadAndClearUpper = true; // use movsd only on '10h' Opteron
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1174
      } else {
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1175
        UseXmmLoadAndClearUpper = false;
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1176
      }
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1177
    }
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1178
    if( FLAG_IS_DEFAULT(UseXmmRegToRegMoveAll) ) {
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1179
      if( supports_sse4a() ) {
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1180
        UseXmmRegToRegMoveAll = true; // use movaps, movapd only on '10h'
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1181
      } else {
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1182
        UseXmmRegToRegMoveAll = false;
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1183
      }
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1184
    }
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1185
    if( FLAG_IS_DEFAULT(UseXmmI2F) ) {
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1186
      if( supports_sse4a() ) {
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1187
        UseXmmI2F = true;
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1188
      } else {
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1189
        UseXmmI2F = false;
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1190
      }
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1191
    }
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1192
    if( FLAG_IS_DEFAULT(UseXmmI2D) ) {
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1193
      if( supports_sse4a() ) {
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1194
        UseXmmI2D = true;
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1195
      } else {
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1196
        UseXmmI2D = false;
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1197
      }
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1198
    }
39256
ac12f57c6d9c 8158214: Crash with "assert(VM_Version::supports_sse4_1()) failed" if UseSSE < 4 is set
thartmann
parents: 38135
diff changeset
  1199
    if (supports_sse4_2()) {
34207
a5f1c458b56e 8143208: compiler/c1/6855215/Test6855215.java supports_sse2() failed
zmajo
parents: 34176
diff changeset
  1200
      if (FLAG_IS_DEFAULT(UseSSE42Intrinsics)) {
a5f1c458b56e 8143208: compiler/c1/6855215/Test6855215.java supports_sse2() failed
zmajo
parents: 34176
diff changeset
  1201
        FLAG_SET_DEFAULT(UseSSE42Intrinsics, true);
8873
d3031147b912 7032133: Enable sse4.2 for new AMD processors
kvn
parents: 8677
diff changeset
  1202
      }
34207
a5f1c458b56e 8143208: compiler/c1/6855215/Test6855215.java supports_sse2() failed
zmajo
parents: 34176
diff changeset
  1203
    } else {
a5f1c458b56e 8143208: compiler/c1/6855215/Test6855215.java supports_sse2() failed
zmajo
parents: 34176
diff changeset
  1204
      if (UseSSE42Intrinsics && !FLAG_IS_DEFAULT(UseAESIntrinsics)) {
a5f1c458b56e 8143208: compiler/c1/6855215/Test6855215.java supports_sse2() failed
zmajo
parents: 34176
diff changeset
  1205
        warning("SSE4.2 intrinsics require SSE4.2 instructions or higher. Intrinsics will be disabled.");
a5f1c458b56e 8143208: compiler/c1/6855215/Test6855215.java supports_sse2() failed
zmajo
parents: 34176
diff changeset
  1206
      }
a5f1c458b56e 8143208: compiler/c1/6855215/Test6855215.java supports_sse2() failed
zmajo
parents: 34176
diff changeset
  1207
      FLAG_SET_DEFAULT(UseSSE42Intrinsics, false);
8873
d3031147b912 7032133: Enable sse4.2 for new AMD processors
kvn
parents: 8677
diff changeset
  1208
    }
2862
fad636edf18f 6823354: Add intrinsics for {Integer,Long}.{numberOfLeadingZeros,numberOfTrailingZeros}()
twisti
parents: 2348
diff changeset
  1209
9325
2b95b2b2b60f 7037812: few more defaults changes for new AMD processors
kvn
parents: 9135
diff changeset
  1210
    // some defaults for AMD family 15h
2b95b2b2b60f 7037812: few more defaults changes for new AMD processors
kvn
parents: 9135
diff changeset
  1211
    if ( cpu_family() == 0x15 ) {
2b95b2b2b60f 7037812: few more defaults changes for new AMD processors
kvn
parents: 9135
diff changeset
  1212
      // On family 15h processors default is no sw prefetch
8677
45d01baba334 7028394: Newer AMD Processor Prefetch Defaults
kvn
parents: 7397
diff changeset
  1213
      if (FLAG_IS_DEFAULT(AllocatePrefetchStyle)) {
46547
e1b926a0b23f 8016470: AllocatePrefetchDistance is not changed by command line
rraghavan
parents: 46546
diff changeset
  1214
        FLAG_SET_DEFAULT(AllocatePrefetchStyle, 0);
8677
45d01baba334 7028394: Newer AMD Processor Prefetch Defaults
kvn
parents: 7397
diff changeset
  1215
      }
9325
2b95b2b2b60f 7037812: few more defaults changes for new AMD processors
kvn
parents: 9135
diff changeset
  1216
      // Also, if some other prefetch style is specified, default instruction type is PREFETCHW
2b95b2b2b60f 7037812: few more defaults changes for new AMD processors
kvn
parents: 9135
diff changeset
  1217
      if (FLAG_IS_DEFAULT(AllocatePrefetchInstr)) {
46547
e1b926a0b23f 8016470: AllocatePrefetchDistance is not changed by command line
rraghavan
parents: 46546
diff changeset
  1218
        FLAG_SET_DEFAULT(AllocatePrefetchInstr, 3);
9325
2b95b2b2b60f 7037812: few more defaults changes for new AMD processors
kvn
parents: 9135
diff changeset
  1219
      }
2b95b2b2b60f 7037812: few more defaults changes for new AMD processors
kvn
parents: 9135
diff changeset
  1220
      // On family 15h processors use XMM and UnalignedLoadStores for Array Copy
13885
6b056026ecad 7199010: incorrect vector alignment
kvn
parents: 13294
diff changeset
  1221
      if (supports_sse2() && FLAG_IS_DEFAULT(UseXMMForArrayCopy)) {
46547
e1b926a0b23f 8016470: AllocatePrefetchDistance is not changed by command line
rraghavan
parents: 46546
diff changeset
  1222
        FLAG_SET_DEFAULT(UseXMMForArrayCopy, true);
9325
2b95b2b2b60f 7037812: few more defaults changes for new AMD processors
kvn
parents: 9135
diff changeset
  1223
      }
13885
6b056026ecad 7199010: incorrect vector alignment
kvn
parents: 13294
diff changeset
  1224
      if (supports_sse2() && FLAG_IS_DEFAULT(UseUnalignedLoadStores)) {
46547
e1b926a0b23f 8016470: AllocatePrefetchDistance is not changed by command line
rraghavan
parents: 46546
diff changeset
  1225
        FLAG_SET_DEFAULT(UseUnalignedLoadStores, true);
9325
2b95b2b2b60f 7037812: few more defaults changes for new AMD processors
kvn
parents: 9135
diff changeset
  1226
      }
8677
45d01baba334 7028394: Newer AMD Processor Prefetch Defaults
kvn
parents: 7397
diff changeset
  1227
    }
9325
2b95b2b2b60f 7037812: few more defaults changes for new AMD processors
kvn
parents: 9135
diff changeset
  1228
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11881
diff changeset
  1229
#ifdef COMPILER2
47582
fde01e0fccb4 8187219: Newer AMD 17h (EPYC) Processor family defaults
kvn
parents: 47216
diff changeset
  1230
    if (cpu_family() < 0x17 && MaxVectorSize > 16) {
fde01e0fccb4 8187219: Newer AMD 17h (EPYC) Processor family defaults
kvn
parents: 47216
diff changeset
  1231
      // Limit vectors size to 16 bytes on AMD cpus < 17h.
13104
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11881
diff changeset
  1232
      FLAG_SET_DEFAULT(MaxVectorSize, 16);
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11881
diff changeset
  1233
    }
657b387034fb 7119644: Increase superword's vector size up to 256 bits
kvn
parents: 11881
diff changeset
  1234
#endif // COMPILER2
47582
fde01e0fccb4 8187219: Newer AMD 17h (EPYC) Processor family defaults
kvn
parents: 47216
diff changeset
  1235
fde01e0fccb4 8187219: Newer AMD 17h (EPYC) Processor family defaults
kvn
parents: 47216
diff changeset
  1236
    // Some defaults for AMD family 17h
fde01e0fccb4 8187219: Newer AMD 17h (EPYC) Processor family defaults
kvn
parents: 47216
diff changeset
  1237
    if ( cpu_family() == 0x17 ) {
fde01e0fccb4 8187219: Newer AMD 17h (EPYC) Processor family defaults
kvn
parents: 47216
diff changeset
  1238
      // On family 17h processors use XMM and UnalignedLoadStores for Array Copy
fde01e0fccb4 8187219: Newer AMD 17h (EPYC) Processor family defaults
kvn
parents: 47216
diff changeset
  1239
      if (supports_sse2() && FLAG_IS_DEFAULT(UseXMMForArrayCopy)) {
fde01e0fccb4 8187219: Newer AMD 17h (EPYC) Processor family defaults
kvn
parents: 47216
diff changeset
  1240
        FLAG_SET_DEFAULT(UseXMMForArrayCopy, true);
fde01e0fccb4 8187219: Newer AMD 17h (EPYC) Processor family defaults
kvn
parents: 47216
diff changeset
  1241
      }
fde01e0fccb4 8187219: Newer AMD 17h (EPYC) Processor family defaults
kvn
parents: 47216
diff changeset
  1242
      if (supports_sse2() && FLAG_IS_DEFAULT(UseUnalignedLoadStores)) {
fde01e0fccb4 8187219: Newer AMD 17h (EPYC) Processor family defaults
kvn
parents: 47216
diff changeset
  1243
        FLAG_SET_DEFAULT(UseUnalignedLoadStores, true);
fde01e0fccb4 8187219: Newer AMD 17h (EPYC) Processor family defaults
kvn
parents: 47216
diff changeset
  1244
      }
fde01e0fccb4 8187219: Newer AMD 17h (EPYC) Processor family defaults
kvn
parents: 47216
diff changeset
  1245
#ifdef COMPILER2
fde01e0fccb4 8187219: Newer AMD 17h (EPYC) Processor family defaults
kvn
parents: 47216
diff changeset
  1246
      if (supports_sse4_2() && FLAG_IS_DEFAULT(UseFPUForSpilling)) {
fde01e0fccb4 8187219: Newer AMD 17h (EPYC) Processor family defaults
kvn
parents: 47216
diff changeset
  1247
        FLAG_SET_DEFAULT(UseFPUForSpilling, true);
fde01e0fccb4 8187219: Newer AMD 17h (EPYC) Processor family defaults
kvn
parents: 47216
diff changeset
  1248
      }
fde01e0fccb4 8187219: Newer AMD 17h (EPYC) Processor family defaults
kvn
parents: 47216
diff changeset
  1249
#endif
fde01e0fccb4 8187219: Newer AMD 17h (EPYC) Processor family defaults
kvn
parents: 47216
diff changeset
  1250
    }
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1251
  }
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1252
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1253
  if( is_intel() ) { // Intel cpus specific settings
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1254
    if( FLAG_IS_DEFAULT(UseStoreImmI16) ) {
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1255
      UseStoreImmI16 = false; // don't use it on Intel cpus
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1256
    }
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1257
    if( cpu_family() == 6 || cpu_family() == 15 ) {
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1258
      if( FLAG_IS_DEFAULT(UseAddressNop) ) {
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1259
        // Use it on all Intel cpus starting from PentiumPro
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1260
        UseAddressNop = true;
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1261
      }
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1262
    }
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1263
    if( FLAG_IS_DEFAULT(UseXmmLoadAndClearUpper) ) {
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1264
      UseXmmLoadAndClearUpper = true; // use movsd on all Intel cpus
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1265
    }
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1266
    if( FLAG_IS_DEFAULT(UseXmmRegToRegMoveAll) ) {
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1267
      if( supports_sse3() ) {
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1268
        UseXmmRegToRegMoveAll = true; // use movaps, movapd on new Intel cpus
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1269
      } else {
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1270
        UseXmmRegToRegMoveAll = false;
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1271
      }
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1272
    }
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1273
    if( cpu_family() == 6 && supports_sse3() ) { // New Intel cpus
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1274
#ifdef COMPILER2
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1275
      if( FLAG_IS_DEFAULT(MaxLoopPad) ) {
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1276
        // For new Intel cpus do the next optimization:
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1277
        // don't align the beginning of a loop if there are enough instructions
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1278
        // left (NumberOfLoopInstrToAlign defined in c2_globals.hpp)
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1279
        // in current fetch line (OptoLoopAlignment) or the padding
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1280
        // is big (> MaxLoopPad).
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1281
        // Set MaxLoopPad to 11 for new Intel cpus to reduce number of
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1282
        // generated NOP instructions. 11 is the largest size of one
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1283
        // address NOP instruction '0F 1F' (see Assembler::nop(i)).
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1284
        MaxLoopPad = 11;
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1285
      }
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1286
#endif // COMPILER2
13885
6b056026ecad 7199010: incorrect vector alignment
kvn
parents: 13294
diff changeset
  1287
      if (FLAG_IS_DEFAULT(UseXMMForArrayCopy)) {
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1288
        UseXMMForArrayCopy = true; // use SSE2 movq on new Intel cpus
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1289
      }
13885
6b056026ecad 7199010: incorrect vector alignment
kvn
parents: 13294
diff changeset
  1290
      if (supports_sse4_2() && supports_ht()) { // Newest Intel cpus
6b056026ecad 7199010: incorrect vector alignment
kvn
parents: 13294
diff changeset
  1291
        if (FLAG_IS_DEFAULT(UseUnalignedLoadStores)) {
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1292
          UseUnalignedLoadStores = true; // use movdqu on newest Intel cpus
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1293
        }
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1294
      }
39256
ac12f57c6d9c 8158214: Crash with "assert(VM_Version::supports_sse4_1()) failed" if UseSSE < 4 is set
thartmann
parents: 38135
diff changeset
  1295
      if (supports_sse4_2()) {
13885
6b056026ecad 7199010: incorrect vector alignment
kvn
parents: 13294
diff changeset
  1296
        if (FLAG_IS_DEFAULT(UseSSE42Intrinsics)) {
34207
a5f1c458b56e 8143208: compiler/c1/6855215/Test6855215.java supports_sse2() failed
zmajo
parents: 34176
diff changeset
  1297
          FLAG_SET_DEFAULT(UseSSE42Intrinsics, true);
2348
4e71ed4c2709 6761600: Use sse 4.2 in intrinsics
cfang
parents: 2255
diff changeset
  1298
        }
34207
a5f1c458b56e 8143208: compiler/c1/6855215/Test6855215.java supports_sse2() failed
zmajo
parents: 34176
diff changeset
  1299
      } else {
a5f1c458b56e 8143208: compiler/c1/6855215/Test6855215.java supports_sse2() failed
zmajo
parents: 34176
diff changeset
  1300
        if (UseSSE42Intrinsics && !FLAG_IS_DEFAULT(UseAESIntrinsics)) {
a5f1c458b56e 8143208: compiler/c1/6855215/Test6855215.java supports_sse2() failed
zmajo
parents: 34176
diff changeset
  1301
          warning("SSE4.2 intrinsics require SSE4.2 instructions or higher. Intrinsics will be disabled.");
a5f1c458b56e 8143208: compiler/c1/6855215/Test6855215.java supports_sse2() failed
zmajo
parents: 34176
diff changeset
  1302
        }
a5f1c458b56e 8143208: compiler/c1/6855215/Test6855215.java supports_sse2() failed
zmajo
parents: 34176
diff changeset
  1303
        FLAG_SET_DEFAULT(UseSSE42Intrinsics, false);
2348
4e71ed4c2709 6761600: Use sse 4.2 in intrinsics
cfang
parents: 2255
diff changeset
  1304
      }
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1305
    }
46563
cfca8fbb4051 8182138: Disable generating INC and DEC instructions on Xeon Phi and ATOM CPUs
kvn
parents: 46560
diff changeset
  1306
    if (is_atom_family() || is_knights_family()) {
25932
15d133edd8f6 8052081: Optimize generated by C2 code for Intel's Atom processor
kvn
parents: 25633
diff changeset
  1307
#ifdef COMPILER2
15d133edd8f6 8052081: Optimize generated by C2 code for Intel's Atom processor
kvn
parents: 25633
diff changeset
  1308
      if (FLAG_IS_DEFAULT(OptoScheduling)) {
15d133edd8f6 8052081: Optimize generated by C2 code for Intel's Atom processor
kvn
parents: 25633
diff changeset
  1309
        OptoScheduling = true;
15d133edd8f6 8052081: Optimize generated by C2 code for Intel's Atom processor
kvn
parents: 25633
diff changeset
  1310
      }
15d133edd8f6 8052081: Optimize generated by C2 code for Intel's Atom processor
kvn
parents: 25633
diff changeset
  1311
#endif
15d133edd8f6 8052081: Optimize generated by C2 code for Intel's Atom processor
kvn
parents: 25633
diff changeset
  1312
      if (supports_sse4_2()) { // Silvermont
15d133edd8f6 8052081: Optimize generated by C2 code for Intel's Atom processor
kvn
parents: 25633
diff changeset
  1313
        if (FLAG_IS_DEFAULT(UseUnalignedLoadStores)) {
15d133edd8f6 8052081: Optimize generated by C2 code for Intel's Atom processor
kvn
parents: 25633
diff changeset
  1314
          UseUnalignedLoadStores = true; // use movdqu on newest Intel cpus
15d133edd8f6 8052081: Optimize generated by C2 code for Intel's Atom processor
kvn
parents: 25633
diff changeset
  1315
        }
15d133edd8f6 8052081: Optimize generated by C2 code for Intel's Atom processor
kvn
parents: 25633
diff changeset
  1316
      }
46563
cfca8fbb4051 8182138: Disable generating INC and DEC instructions on Xeon Phi and ATOM CPUs
kvn
parents: 46560
diff changeset
  1317
      if (FLAG_IS_DEFAULT(UseIncDec)) {
cfca8fbb4051 8182138: Disable generating INC and DEC instructions on Xeon Phi and ATOM CPUs
kvn
parents: 46560
diff changeset
  1318
        FLAG_SET_DEFAULT(UseIncDec, false);
cfca8fbb4051 8182138: Disable generating INC and DEC instructions on Xeon Phi and ATOM CPUs
kvn
parents: 46560
diff changeset
  1319
      }
25932
15d133edd8f6 8052081: Optimize generated by C2 code for Intel's Atom processor
kvn
parents: 25633
diff changeset
  1320
    }
26434
09ad55e5f486 8055494: Add C2 x86 intrinsic for BigInteger::multiplyToLen() method
kvn
parents: 26306
diff changeset
  1321
    if(FLAG_IS_DEFAULT(AllocatePrefetchInstr) && supports_3dnow_prefetch()) {
46547
e1b926a0b23f 8016470: AllocatePrefetchDistance is not changed by command line
rraghavan
parents: 46546
diff changeset
  1322
      FLAG_SET_DEFAULT(AllocatePrefetchInstr, 3);
26434
09ad55e5f486 8055494: Add C2 x86 intrinsic for BigInteger::multiplyToLen() method
kvn
parents: 26306
diff changeset
  1323
    }
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1324
  }
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1325
35110
f19bcdf40799 8143355: Update for addition of vectorizedMismatch intrinsic for x86
kvn
parents: 34207
diff changeset
  1326
#ifdef _LP64
f19bcdf40799 8143355: Update for addition of vectorizedMismatch intrinsic for x86
kvn
parents: 34207
diff changeset
  1327
  if (UseSSE42Intrinsics) {
f19bcdf40799 8143355: Update for addition of vectorizedMismatch intrinsic for x86
kvn
parents: 34207
diff changeset
  1328
    if (FLAG_IS_DEFAULT(UseVectorizedMismatchIntrinsic)) {
f19bcdf40799 8143355: Update for addition of vectorizedMismatch intrinsic for x86
kvn
parents: 34207
diff changeset
  1329
      UseVectorizedMismatchIntrinsic = true;
f19bcdf40799 8143355: Update for addition of vectorizedMismatch intrinsic for x86
kvn
parents: 34207
diff changeset
  1330
    }
f19bcdf40799 8143355: Update for addition of vectorizedMismatch intrinsic for x86
kvn
parents: 34207
diff changeset
  1331
  } else if (UseVectorizedMismatchIntrinsic) {
f19bcdf40799 8143355: Update for addition of vectorizedMismatch intrinsic for x86
kvn
parents: 34207
diff changeset
  1332
    if (!FLAG_IS_DEFAULT(UseVectorizedMismatchIntrinsic))
f19bcdf40799 8143355: Update for addition of vectorizedMismatch intrinsic for x86
kvn
parents: 34207
diff changeset
  1333
      warning("vectorizedMismatch intrinsics are not available on this CPU");
f19bcdf40799 8143355: Update for addition of vectorizedMismatch intrinsic for x86
kvn
parents: 34207
diff changeset
  1334
    FLAG_SET_DEFAULT(UseVectorizedMismatchIntrinsic, false);
f19bcdf40799 8143355: Update for addition of vectorizedMismatch intrinsic for x86
kvn
parents: 34207
diff changeset
  1335
  }
f19bcdf40799 8143355: Update for addition of vectorizedMismatch intrinsic for x86
kvn
parents: 34207
diff changeset
  1336
#else
f19bcdf40799 8143355: Update for addition of vectorizedMismatch intrinsic for x86
kvn
parents: 34207
diff changeset
  1337
  if (UseVectorizedMismatchIntrinsic) {
f19bcdf40799 8143355: Update for addition of vectorizedMismatch intrinsic for x86
kvn
parents: 34207
diff changeset
  1338
    if (!FLAG_IS_DEFAULT(UseVectorizedMismatchIntrinsic)) {
f19bcdf40799 8143355: Update for addition of vectorizedMismatch intrinsic for x86
kvn
parents: 34207
diff changeset
  1339
      warning("vectorizedMismatch intrinsic is not available in 32-bit VM");
f19bcdf40799 8143355: Update for addition of vectorizedMismatch intrinsic for x86
kvn
parents: 34207
diff changeset
  1340
    }
f19bcdf40799 8143355: Update for addition of vectorizedMismatch intrinsic for x86
kvn
parents: 34207
diff changeset
  1341
    FLAG_SET_DEFAULT(UseVectorizedMismatchIntrinsic, false);
f19bcdf40799 8143355: Update for addition of vectorizedMismatch intrinsic for x86
kvn
parents: 34207
diff changeset
  1342
  }
f19bcdf40799 8143355: Update for addition of vectorizedMismatch intrinsic for x86
kvn
parents: 34207
diff changeset
  1343
#endif // _LP64
f19bcdf40799 8143355: Update for addition of vectorizedMismatch intrinsic for x86
kvn
parents: 34207
diff changeset
  1344
23220
fc827339dc37 8031321: Support Intel bit manipulation instructions
iveresov
parents: 18507
diff changeset
  1345
  // Use count leading zeros count instruction if available.
fc827339dc37 8031321: Support Intel bit manipulation instructions
iveresov
parents: 18507
diff changeset
  1346
  if (supports_lzcnt()) {
fc827339dc37 8031321: Support Intel bit manipulation instructions
iveresov
parents: 18507
diff changeset
  1347
    if (FLAG_IS_DEFAULT(UseCountLeadingZerosInstruction)) {
fc827339dc37 8031321: Support Intel bit manipulation instructions
iveresov
parents: 18507
diff changeset
  1348
      UseCountLeadingZerosInstruction = true;
fc827339dc37 8031321: Support Intel bit manipulation instructions
iveresov
parents: 18507
diff changeset
  1349
    }
fc827339dc37 8031321: Support Intel bit manipulation instructions
iveresov
parents: 18507
diff changeset
  1350
   } else if (UseCountLeadingZerosInstruction) {
fc827339dc37 8031321: Support Intel bit manipulation instructions
iveresov
parents: 18507
diff changeset
  1351
    warning("lzcnt instruction is not available on this CPU");
fc827339dc37 8031321: Support Intel bit manipulation instructions
iveresov
parents: 18507
diff changeset
  1352
    FLAG_SET_DEFAULT(UseCountLeadingZerosInstruction, false);
fc827339dc37 8031321: Support Intel bit manipulation instructions
iveresov
parents: 18507
diff changeset
  1353
  }
fc827339dc37 8031321: Support Intel bit manipulation instructions
iveresov
parents: 18507
diff changeset
  1354
26434
09ad55e5f486 8055494: Add C2 x86 intrinsic for BigInteger::multiplyToLen() method
kvn
parents: 26306
diff changeset
  1355
  // Use count trailing zeros instruction if available
23220
fc827339dc37 8031321: Support Intel bit manipulation instructions
iveresov
parents: 18507
diff changeset
  1356
  if (supports_bmi1()) {
26434
09ad55e5f486 8055494: Add C2 x86 intrinsic for BigInteger::multiplyToLen() method
kvn
parents: 26306
diff changeset
  1357
    // tzcnt does not require VEX prefix
09ad55e5f486 8055494: Add C2 x86 intrinsic for BigInteger::multiplyToLen() method
kvn
parents: 26306
diff changeset
  1358
    if (FLAG_IS_DEFAULT(UseCountTrailingZerosInstruction)) {
27414
39d976b80fb4 8059139: It should be possible to explicitly disable usage of TZCNT instr w/ -XX:-UseBMI1Instructions
kvn
parents: 26434
diff changeset
  1359
      if (!UseBMI1Instructions && !FLAG_IS_DEFAULT(UseBMI1Instructions)) {
39d976b80fb4 8059139: It should be possible to explicitly disable usage of TZCNT instr w/ -XX:-UseBMI1Instructions
kvn
parents: 26434
diff changeset
  1360
        // Don't use tzcnt if BMI1 is switched off on command line.
39d976b80fb4 8059139: It should be possible to explicitly disable usage of TZCNT instr w/ -XX:-UseBMI1Instructions
kvn
parents: 26434
diff changeset
  1361
        UseCountTrailingZerosInstruction = false;
39d976b80fb4 8059139: It should be possible to explicitly disable usage of TZCNT instr w/ -XX:-UseBMI1Instructions
kvn
parents: 26434
diff changeset
  1362
      } else {
39d976b80fb4 8059139: It should be possible to explicitly disable usage of TZCNT instr w/ -XX:-UseBMI1Instructions
kvn
parents: 26434
diff changeset
  1363
        UseCountTrailingZerosInstruction = true;
39d976b80fb4 8059139: It should be possible to explicitly disable usage of TZCNT instr w/ -XX:-UseBMI1Instructions
kvn
parents: 26434
diff changeset
  1364
      }
26434
09ad55e5f486 8055494: Add C2 x86 intrinsic for BigInteger::multiplyToLen() method
kvn
parents: 26306
diff changeset
  1365
    }
09ad55e5f486 8055494: Add C2 x86 intrinsic for BigInteger::multiplyToLen() method
kvn
parents: 26306
diff changeset
  1366
  } else if (UseCountTrailingZerosInstruction) {
09ad55e5f486 8055494: Add C2 x86 intrinsic for BigInteger::multiplyToLen() method
kvn
parents: 26306
diff changeset
  1367
    warning("tzcnt instruction is not available on this CPU");
09ad55e5f486 8055494: Add C2 x86 intrinsic for BigInteger::multiplyToLen() method
kvn
parents: 26306
diff changeset
  1368
    FLAG_SET_DEFAULT(UseCountTrailingZerosInstruction, false);
09ad55e5f486 8055494: Add C2 x86 intrinsic for BigInteger::multiplyToLen() method
kvn
parents: 26306
diff changeset
  1369
  }
09ad55e5f486 8055494: Add C2 x86 intrinsic for BigInteger::multiplyToLen() method
kvn
parents: 26306
diff changeset
  1370
27414
39d976b80fb4 8059139: It should be possible to explicitly disable usage of TZCNT instr w/ -XX:-UseBMI1Instructions
kvn
parents: 26434
diff changeset
  1371
  // BMI instructions (except tzcnt) use an encoding with VEX prefix.
26434
09ad55e5f486 8055494: Add C2 x86 intrinsic for BigInteger::multiplyToLen() method
kvn
parents: 26306
diff changeset
  1372
  // VEX prefix is generated only when AVX > 0.
09ad55e5f486 8055494: Add C2 x86 intrinsic for BigInteger::multiplyToLen() method
kvn
parents: 26306
diff changeset
  1373
  if (supports_bmi1() && supports_avx()) {
23220
fc827339dc37 8031321: Support Intel bit manipulation instructions
iveresov
parents: 18507
diff changeset
  1374
    if (FLAG_IS_DEFAULT(UseBMI1Instructions)) {
fc827339dc37 8031321: Support Intel bit manipulation instructions
iveresov
parents: 18507
diff changeset
  1375
      UseBMI1Instructions = true;
fc827339dc37 8031321: Support Intel bit manipulation instructions
iveresov
parents: 18507
diff changeset
  1376
    }
fc827339dc37 8031321: Support Intel bit manipulation instructions
iveresov
parents: 18507
diff changeset
  1377
  } else if (UseBMI1Instructions) {
26434
09ad55e5f486 8055494: Add C2 x86 intrinsic for BigInteger::multiplyToLen() method
kvn
parents: 26306
diff changeset
  1378
    warning("BMI1 instructions are not available on this CPU (AVX is also required)");
23220
fc827339dc37 8031321: Support Intel bit manipulation instructions
iveresov
parents: 18507
diff changeset
  1379
    FLAG_SET_DEFAULT(UseBMI1Instructions, false);
fc827339dc37 8031321: Support Intel bit manipulation instructions
iveresov
parents: 18507
diff changeset
  1380
  }
fc827339dc37 8031321: Support Intel bit manipulation instructions
iveresov
parents: 18507
diff changeset
  1381
26434
09ad55e5f486 8055494: Add C2 x86 intrinsic for BigInteger::multiplyToLen() method
kvn
parents: 26306
diff changeset
  1382
  if (supports_bmi2() && supports_avx()) {
09ad55e5f486 8055494: Add C2 x86 intrinsic for BigInteger::multiplyToLen() method
kvn
parents: 26306
diff changeset
  1383
    if (FLAG_IS_DEFAULT(UseBMI2Instructions)) {
09ad55e5f486 8055494: Add C2 x86 intrinsic for BigInteger::multiplyToLen() method
kvn
parents: 26306
diff changeset
  1384
      UseBMI2Instructions = true;
23220
fc827339dc37 8031321: Support Intel bit manipulation instructions
iveresov
parents: 18507
diff changeset
  1385
    }
26434
09ad55e5f486 8055494: Add C2 x86 intrinsic for BigInteger::multiplyToLen() method
kvn
parents: 26306
diff changeset
  1386
  } else if (UseBMI2Instructions) {
09ad55e5f486 8055494: Add C2 x86 intrinsic for BigInteger::multiplyToLen() method
kvn
parents: 26306
diff changeset
  1387
    warning("BMI2 instructions are not available on this CPU (AVX is also required)");
09ad55e5f486 8055494: Add C2 x86 intrinsic for BigInteger::multiplyToLen() method
kvn
parents: 26306
diff changeset
  1388
    FLAG_SET_DEFAULT(UseBMI2Instructions, false);
23220
fc827339dc37 8031321: Support Intel bit manipulation instructions
iveresov
parents: 18507
diff changeset
  1389
  }
fc827339dc37 8031321: Support Intel bit manipulation instructions
iveresov
parents: 18507
diff changeset
  1390
2255
54abdf3e1055 6378821: bitCount() should use POPC on SPARC processors and AMD+10h
twisti
parents: 2111
diff changeset
  1391
  // Use population count instruction if available.
54abdf3e1055 6378821: bitCount() should use POPC on SPARC processors and AMD+10h
twisti
parents: 2111
diff changeset
  1392
  if (supports_popcnt()) {
54abdf3e1055 6378821: bitCount() should use POPC on SPARC processors and AMD+10h
twisti
parents: 2111
diff changeset
  1393
    if (FLAG_IS_DEFAULT(UsePopCountInstruction)) {
54abdf3e1055 6378821: bitCount() should use POPC on SPARC processors and AMD+10h
twisti
parents: 2111
diff changeset
  1394
      UsePopCountInstruction = true;
54abdf3e1055 6378821: bitCount() should use POPC on SPARC processors and AMD+10h
twisti
parents: 2111
diff changeset
  1395
    }
11427
bf248009cbbe 7116452: Add support for AVX instructions
kvn
parents: 10565
diff changeset
  1396
  } else if (UsePopCountInstruction) {
bf248009cbbe 7116452: Add support for AVX instructions
kvn
parents: 10565
diff changeset
  1397
    warning("POPCNT instruction is not available on this CPU");
bf248009cbbe 7116452: Add support for AVX instructions
kvn
parents: 10565
diff changeset
  1398
    FLAG_SET_DEFAULT(UsePopCountInstruction, false);
2255
54abdf3e1055 6378821: bitCount() should use POPC on SPARC processors and AMD+10h
twisti
parents: 2111
diff changeset
  1399
  }
54abdf3e1055 6378821: bitCount() should use POPC on SPARC processors and AMD+10h
twisti
parents: 2111
diff changeset
  1400
15114
4074553c678b 8005522: use fast-string instructions on x86 for zeroing
kvn
parents: 14834
diff changeset
  1401
  // Use fast-string operations if available.
4074553c678b 8005522: use fast-string instructions on x86 for zeroing
kvn
parents: 14834
diff changeset
  1402
  if (supports_erms()) {
4074553c678b 8005522: use fast-string instructions on x86 for zeroing
kvn
parents: 14834
diff changeset
  1403
    if (FLAG_IS_DEFAULT(UseFastStosb)) {
4074553c678b 8005522: use fast-string instructions on x86 for zeroing
kvn
parents: 14834
diff changeset
  1404
      UseFastStosb = true;
4074553c678b 8005522: use fast-string instructions on x86 for zeroing
kvn
parents: 14834
diff changeset
  1405
    }
4074553c678b 8005522: use fast-string instructions on x86 for zeroing
kvn
parents: 14834
diff changeset
  1406
  } else if (UseFastStosb) {
4074553c678b 8005522: use fast-string instructions on x86 for zeroing
kvn
parents: 14834
diff changeset
  1407
    warning("fast-string operations are not available on this CPU");
4074553c678b 8005522: use fast-string instructions on x86 for zeroing
kvn
parents: 14834
diff changeset
  1408
    FLAG_SET_DEFAULT(UseFastStosb, false);
4074553c678b 8005522: use fast-string instructions on x86 for zeroing
kvn
parents: 14834
diff changeset
  1409
  }
4074553c678b 8005522: use fast-string instructions on x86 for zeroing
kvn
parents: 14834
diff changeset
  1410
50534
a6a44177f99c 8201193: Use XMM/YMM for objects initialization
kvn
parents: 50261
diff changeset
  1411
  // Use XMM/YMM MOVDQU instruction for Object Initialization
a6a44177f99c 8201193: Use XMM/YMM for objects initialization
kvn
parents: 50261
diff changeset
  1412
  if (!UseFastStosb && UseSSE >= 2 && UseUnalignedLoadStores) {
a6a44177f99c 8201193: Use XMM/YMM for objects initialization
kvn
parents: 50261
diff changeset
  1413
    if (FLAG_IS_DEFAULT(UseXMMForObjInit)) {
a6a44177f99c 8201193: Use XMM/YMM for objects initialization
kvn
parents: 50261
diff changeset
  1414
      UseXMMForObjInit = true;
a6a44177f99c 8201193: Use XMM/YMM for objects initialization
kvn
parents: 50261
diff changeset
  1415
    }
a6a44177f99c 8201193: Use XMM/YMM for objects initialization
kvn
parents: 50261
diff changeset
  1416
  } else if (UseXMMForObjInit) {
a6a44177f99c 8201193: Use XMM/YMM for objects initialization
kvn
parents: 50261
diff changeset
  1417
    warning("UseXMMForObjInit requires SSE2 and unaligned load/stores. Feature is switched off.");
a6a44177f99c 8201193: Use XMM/YMM for objects initialization
kvn
parents: 50261
diff changeset
  1418
    FLAG_SET_DEFAULT(UseXMMForObjInit, false);
a6a44177f99c 8201193: Use XMM/YMM for objects initialization
kvn
parents: 50261
diff changeset
  1419
  }
a6a44177f99c 8201193: Use XMM/YMM for objects initialization
kvn
parents: 50261
diff changeset
  1420
13885
6b056026ecad 7199010: incorrect vector alignment
kvn
parents: 13294
diff changeset
  1421
#ifdef COMPILER2
6b056026ecad 7199010: incorrect vector alignment
kvn
parents: 13294
diff changeset
  1422
  if (FLAG_IS_DEFAULT(AlignVector)) {
6b056026ecad 7199010: incorrect vector alignment
kvn
parents: 13294
diff changeset
  1423
    // Modern processors allow misaligned memory operations for vectors.
6b056026ecad 7199010: incorrect vector alignment
kvn
parents: 13294
diff changeset
  1424
    AlignVector = !UseUnalignedLoadStores;
6b056026ecad 7199010: incorrect vector alignment
kvn
parents: 13294
diff changeset
  1425
  }
6b056026ecad 7199010: incorrect vector alignment
kvn
parents: 13294
diff changeset
  1426
#endif // COMPILER2
6b056026ecad 7199010: incorrect vector alignment
kvn
parents: 13294
diff changeset
  1427
46547
e1b926a0b23f 8016470: AllocatePrefetchDistance is not changed by command line
rraghavan
parents: 46546
diff changeset
  1428
  if (FLAG_IS_DEFAULT(AllocatePrefetchInstr)) {
e1b926a0b23f 8016470: AllocatePrefetchDistance is not changed by command line
rraghavan
parents: 46546
diff changeset
  1429
    if (AllocatePrefetchInstr == 3 && !supports_3dnow_prefetch()) {
e1b926a0b23f 8016470: AllocatePrefetchDistance is not changed by command line
rraghavan
parents: 46546
diff changeset
  1430
      FLAG_SET_DEFAULT(AllocatePrefetchInstr, 0);
e1b926a0b23f 8016470: AllocatePrefetchDistance is not changed by command line
rraghavan
parents: 46546
diff changeset
  1431
    } else if (!supports_sse() && supports_3dnow_prefetch()) {
e1b926a0b23f 8016470: AllocatePrefetchDistance is not changed by command line
rraghavan
parents: 46546
diff changeset
  1432
      FLAG_SET_DEFAULT(AllocatePrefetchInstr, 3);
e1b926a0b23f 8016470: AllocatePrefetchDistance is not changed by command line
rraghavan
parents: 46546
diff changeset
  1433
    }
e1b926a0b23f 8016470: AllocatePrefetchDistance is not changed by command line
rraghavan
parents: 46546
diff changeset
  1434
  }
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1435
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1436
  // Allocation prefetch settings
10267
8bdeec886dc4 7079329: Adjust allocation prefetching for T4
kvn
parents: 10010
diff changeset
  1437
  intx cache_line_size = prefetch_data_size();
46547
e1b926a0b23f 8016470: AllocatePrefetchDistance is not changed by command line
rraghavan
parents: 46546
diff changeset
  1438
  if (FLAG_IS_DEFAULT(AllocatePrefetchStepSize) &&
e1b926a0b23f 8016470: AllocatePrefetchDistance is not changed by command line
rraghavan
parents: 46546
diff changeset
  1439
      (cache_line_size > AllocatePrefetchStepSize)) {
e1b926a0b23f 8016470: AllocatePrefetchDistance is not changed by command line
rraghavan
parents: 46546
diff changeset
  1440
    FLAG_SET_DEFAULT(AllocatePrefetchStepSize, cache_line_size);
e1b926a0b23f 8016470: AllocatePrefetchDistance is not changed by command line
rraghavan
parents: 46546
diff changeset
  1441
  }
10267
8bdeec886dc4 7079329: Adjust allocation prefetching for T4
kvn
parents: 10010
diff changeset
  1442
46547
e1b926a0b23f 8016470: AllocatePrefetchDistance is not changed by command line
rraghavan
parents: 46546
diff changeset
  1443
  if ((AllocatePrefetchDistance == 0) && (AllocatePrefetchStyle != 0)) {
e1b926a0b23f 8016470: AllocatePrefetchDistance is not changed by command line
rraghavan
parents: 46546
diff changeset
  1444
    assert(!FLAG_IS_DEFAULT(AllocatePrefetchDistance), "default value should not be 0");
e1b926a0b23f 8016470: AllocatePrefetchDistance is not changed by command line
rraghavan
parents: 46546
diff changeset
  1445
    if (!FLAG_IS_DEFAULT(AllocatePrefetchStyle)) {
e1b926a0b23f 8016470: AllocatePrefetchDistance is not changed by command line
rraghavan
parents: 46546
diff changeset
  1446
      warning("AllocatePrefetchDistance is set to 0 which disable prefetching. Ignoring AllocatePrefetchStyle flag.");
e1b926a0b23f 8016470: AllocatePrefetchDistance is not changed by command line
rraghavan
parents: 46546
diff changeset
  1447
    }
e1b926a0b23f 8016470: AllocatePrefetchDistance is not changed by command line
rraghavan
parents: 46546
diff changeset
  1448
    FLAG_SET_DEFAULT(AllocatePrefetchStyle, 0);
e1b926a0b23f 8016470: AllocatePrefetchDistance is not changed by command line
rraghavan
parents: 46546
diff changeset
  1449
  }
e1b926a0b23f 8016470: AllocatePrefetchDistance is not changed by command line
rraghavan
parents: 46546
diff changeset
  1450
e1b926a0b23f 8016470: AllocatePrefetchDistance is not changed by command line
rraghavan
parents: 46546
diff changeset
  1451
  if (FLAG_IS_DEFAULT(AllocatePrefetchDistance)) {
e1b926a0b23f 8016470: AllocatePrefetchDistance is not changed by command line
rraghavan
parents: 46546
diff changeset
  1452
    bool use_watermark_prefetch = (AllocatePrefetchStyle == 2);
e1b926a0b23f 8016470: AllocatePrefetchDistance is not changed by command line
rraghavan
parents: 46546
diff changeset
  1453
    FLAG_SET_DEFAULT(AllocatePrefetchDistance, allocate_prefetch_distance(use_watermark_prefetch));
e1b926a0b23f 8016470: AllocatePrefetchDistance is not changed by command line
rraghavan
parents: 46546
diff changeset
  1454
  }
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1455
25932
15d133edd8f6 8052081: Optimize generated by C2 code for Intel's Atom processor
kvn
parents: 25633
diff changeset
  1456
  if (is_intel() && cpu_family() == 6 && supports_sse3()) {
46547
e1b926a0b23f 8016470: AllocatePrefetchDistance is not changed by command line
rraghavan
parents: 46546
diff changeset
  1457
    if (FLAG_IS_DEFAULT(AllocatePrefetchLines) &&
e1b926a0b23f 8016470: AllocatePrefetchDistance is not changed by command line
rraghavan
parents: 46546
diff changeset
  1458
        supports_sse4_2() && supports_ht()) { // Nehalem based cpus
e1b926a0b23f 8016470: AllocatePrefetchDistance is not changed by command line
rraghavan
parents: 46546
diff changeset
  1459
      FLAG_SET_DEFAULT(AllocatePrefetchLines, 4);
25932
15d133edd8f6 8052081: Optimize generated by C2 code for Intel's Atom processor
kvn
parents: 25633
diff changeset
  1460
    }
6272
94a20ad0e9de 6978249: spill between cpu and fpu registers when those moves are fast
never
parents: 5902
diff changeset
  1461
#ifdef COMPILER2
46547
e1b926a0b23f 8016470: AllocatePrefetchDistance is not changed by command line
rraghavan
parents: 46546
diff changeset
  1462
    if (FLAG_IS_DEFAULT(UseFPUForSpilling) && supports_sse4_2()) {
e1b926a0b23f 8016470: AllocatePrefetchDistance is not changed by command line
rraghavan
parents: 46546
diff changeset
  1463
      FLAG_SET_DEFAULT(UseFPUForSpilling, true);
25932
15d133edd8f6 8052081: Optimize generated by C2 code for Intel's Atom processor
kvn
parents: 25633
diff changeset
  1464
    }
6272
94a20ad0e9de 6978249: spill between cpu and fpu registers when those moves are fast
never
parents: 5902
diff changeset
  1465
#endif
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1466
  }
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1467
48489
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1468
  if (is_zx() && ((cpu_family() == 6) || (cpu_family() == 7)) && supports_sse4_2()) {
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1469
#ifdef COMPILER2
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1470
    if (FLAG_IS_DEFAULT(UseFPUForSpilling)) {
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1471
      FLAG_SET_DEFAULT(UseFPUForSpilling, true);
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1472
    }
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1473
#endif
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1474
  }
a5548cf24286 8194279: support zhaoxin x86 cpu vendor ids CentaurHauls and Shanghai
dholmes
parents: 48195
diff changeset
  1475
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1476
#ifdef _LP64
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1477
  // Prefetch settings
46547
e1b926a0b23f 8016470: AllocatePrefetchDistance is not changed by command line
rraghavan
parents: 46546
diff changeset
  1478
e1b926a0b23f 8016470: AllocatePrefetchDistance is not changed by command line
rraghavan
parents: 46546
diff changeset
  1479
  // Prefetch interval for gc copy/scan == 9 dcache lines.  Derived from
e1b926a0b23f 8016470: AllocatePrefetchDistance is not changed by command line
rraghavan
parents: 46546
diff changeset
  1480
  // 50-warehouse specjbb runs on a 2-way 1.8ghz opteron using a 4gb heap.
e1b926a0b23f 8016470: AllocatePrefetchDistance is not changed by command line
rraghavan
parents: 46546
diff changeset
  1481
  // Tested intervals from 128 to 2048 in increments of 64 == one cache line.
e1b926a0b23f 8016470: AllocatePrefetchDistance is not changed by command line
rraghavan
parents: 46546
diff changeset
  1482
  // 256 bytes (4 dcache lines) was the nearest runner-up to 576.
e1b926a0b23f 8016470: AllocatePrefetchDistance is not changed by command line
rraghavan
parents: 46546
diff changeset
  1483
e1b926a0b23f 8016470: AllocatePrefetchDistance is not changed by command line
rraghavan
parents: 46546
diff changeset
  1484
  // gc copy/scan is disabled if prefetchw isn't supported, because
e1b926a0b23f 8016470: AllocatePrefetchDistance is not changed by command line
rraghavan
parents: 46546
diff changeset
  1485
  // Prefetch::write emits an inlined prefetchw on Linux.
e1b926a0b23f 8016470: AllocatePrefetchDistance is not changed by command line
rraghavan
parents: 46546
diff changeset
  1486
  // Do not use the 3dnow prefetchw instruction.  It isn't supported on em64t.
e1b926a0b23f 8016470: AllocatePrefetchDistance is not changed by command line
rraghavan
parents: 46546
diff changeset
  1487
  // The used prefetcht0 instruction works for both amd64 and em64t.
e1b926a0b23f 8016470: AllocatePrefetchDistance is not changed by command line
rraghavan
parents: 46546
diff changeset
  1488
e1b926a0b23f 8016470: AllocatePrefetchDistance is not changed by command line
rraghavan
parents: 46546
diff changeset
  1489
  if (FLAG_IS_DEFAULT(PrefetchCopyIntervalInBytes)) {
e1b926a0b23f 8016470: AllocatePrefetchDistance is not changed by command line
rraghavan
parents: 46546
diff changeset
  1490
    FLAG_SET_DEFAULT(PrefetchCopyIntervalInBytes, 576);
e1b926a0b23f 8016470: AllocatePrefetchDistance is not changed by command line
rraghavan
parents: 46546
diff changeset
  1491
  }
e1b926a0b23f 8016470: AllocatePrefetchDistance is not changed by command line
rraghavan
parents: 46546
diff changeset
  1492
  if (FLAG_IS_DEFAULT(PrefetchScanIntervalInBytes)) {
e1b926a0b23f 8016470: AllocatePrefetchDistance is not changed by command line
rraghavan
parents: 46546
diff changeset
  1493
    FLAG_SET_DEFAULT(PrefetchScanIntervalInBytes, 576);
e1b926a0b23f 8016470: AllocatePrefetchDistance is not changed by command line
rraghavan
parents: 46546
diff changeset
  1494
  }
e1b926a0b23f 8016470: AllocatePrefetchDistance is not changed by command line
rraghavan
parents: 46546
diff changeset
  1495
  if (FLAG_IS_DEFAULT(PrefetchFieldsAhead)) {
e1b926a0b23f 8016470: AllocatePrefetchDistance is not changed by command line
rraghavan
parents: 46546
diff changeset
  1496
    FLAG_SET_DEFAULT(PrefetchFieldsAhead, 1);
e1b926a0b23f 8016470: AllocatePrefetchDistance is not changed by command line
rraghavan
parents: 46546
diff changeset
  1497
  }
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1498
#endif
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1499
15193
8e6b5694267f 8003985: Support @Contended Annotation - JEP 142
jwilhelm
parents: 14834
diff changeset
  1500
  if (FLAG_IS_DEFAULT(ContendedPaddingWidth) &&
8e6b5694267f 8003985: Support @Contended Annotation - JEP 142
jwilhelm
parents: 14834
diff changeset
  1501
     (cache_line_size > ContendedPaddingWidth))
8e6b5694267f 8003985: Support @Contended Annotation - JEP 142
jwilhelm
parents: 14834
diff changeset
  1502
     ContendedPaddingWidth = cache_line_size;
8e6b5694267f 8003985: Support @Contended Annotation - JEP 142
jwilhelm
parents: 14834
diff changeset
  1503
30209
8ea30dc99369 8026049: (bf) Intrinsify ByteBuffer.put{Int, Double, Float, ...} methods
aph
parents: 28954
diff changeset
  1504
  // This machine allows unaligned memory accesses
8ea30dc99369 8026049: (bf) Intrinsify ByteBuffer.put{Int, Double, Float, ...} methods
aph
parents: 28954
diff changeset
  1505
  if (FLAG_IS_DEFAULT(UseUnalignedAccesses)) {
8ea30dc99369 8026049: (bf) Intrinsify ByteBuffer.put{Int, Double, Float, ...} methods
aph
parents: 28954
diff changeset
  1506
    FLAG_SET_DEFAULT(UseUnalignedAccesses, true);
8ea30dc99369 8026049: (bf) Intrinsify ByteBuffer.put{Int, Double, Float, ...} methods
aph
parents: 28954
diff changeset
  1507
  }
8ea30dc99369 8026049: (bf) Intrinsify ByteBuffer.put{Int, Double, Float, ...} methods
aph
parents: 28954
diff changeset
  1508
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1509
#ifndef PRODUCT
37430
fd743dadef12 8151939: VM_Version_init() print buffer is too small
coleenp
parents: 36561
diff changeset
  1510
  if (log_is_enabled(Info, os, cpu)) {
46701
f559541c0daa 8181917: Refactor UL LogStreams to avoid using resource area
stuefe
parents: 46698
diff changeset
  1511
    LogStream ls(Log(os, cpu)::info());
f559541c0daa 8181917: Refactor UL LogStreams to avoid using resource area
stuefe
parents: 46698
diff changeset
  1512
    outputStream* log = &ls;
37430
fd743dadef12 8151939: VM_Version_init() print buffer is too small
coleenp
parents: 36561
diff changeset
  1513
    log->print_cr("Logical CPUs per core: %u",
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1514
                  logical_processors_per_package());
37430
fd743dadef12 8151939: VM_Version_init() print buffer is too small
coleenp
parents: 36561
diff changeset
  1515
    log->print_cr("L1 data cache line size: %u", L1_data_cache_line_size());
fd743dadef12 8151939: VM_Version_init() print buffer is too small
coleenp
parents: 36561
diff changeset
  1516
    log->print("UseSSE=%d", (int) UseSSE);
11427
bf248009cbbe 7116452: Add support for AVX instructions
kvn
parents: 10565
diff changeset
  1517
    if (UseAVX > 0) {
37430
fd743dadef12 8151939: VM_Version_init() print buffer is too small
coleenp
parents: 36561
diff changeset
  1518
      log->print("  UseAVX=%d", (int) UseAVX);
11427
bf248009cbbe 7116452: Add support for AVX instructions
kvn
parents: 10565
diff changeset
  1519
    }
14132
3c1437abcefd 7184394: add intrinsics to use AES instructions
kvn
parents: 13886
diff changeset
  1520
    if (UseAES) {
37430
fd743dadef12 8151939: VM_Version_init() print buffer is too small
coleenp
parents: 36561
diff changeset
  1521
      log->print("  UseAES=1");
14132
3c1437abcefd 7184394: add intrinsics to use AES instructions
kvn
parents: 13886
diff changeset
  1522
    }
23487
0f7e268cd9e3 8037226: compiler/7196199/Test7196199.java fails on 32-bit linux with MaxVectorSize > 16
kvn
parents: 23220
diff changeset
  1523
#ifdef COMPILER2
0f7e268cd9e3 8037226: compiler/7196199/Test7196199.java fails on 32-bit linux with MaxVectorSize > 16
kvn
parents: 23220
diff changeset
  1524
    if (MaxVectorSize > 0) {
37430
fd743dadef12 8151939: VM_Version_init() print buffer is too small
coleenp
parents: 36561
diff changeset
  1525
      log->print("  MaxVectorSize=%d", (int) MaxVectorSize);
23487
0f7e268cd9e3 8037226: compiler/7196199/Test7196199.java fails on 32-bit linux with MaxVectorSize > 16
kvn
parents: 23220
diff changeset
  1526
    }
0f7e268cd9e3 8037226: compiler/7196199/Test7196199.java fails on 32-bit linux with MaxVectorSize > 16
kvn
parents: 23220
diff changeset
  1527
#endif
37430
fd743dadef12 8151939: VM_Version_init() print buffer is too small
coleenp
parents: 36561
diff changeset
  1528
    log->cr();
fd743dadef12 8151939: VM_Version_init() print buffer is too small
coleenp
parents: 36561
diff changeset
  1529
    log->print("Allocation");
46630
75aa3e39d02c 8182299: Enable disabled clang warnings, build on OSX 10 + Xcode 8
jwilhelm
parents: 46563
diff changeset
  1530
    if (AllocatePrefetchStyle <= 0 || (UseSSE == 0 && !supports_3dnow_prefetch())) {
37430
fd743dadef12 8151939: VM_Version_init() print buffer is too small
coleenp
parents: 36561
diff changeset
  1531
      log->print_cr(": no prefetching");
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1532
    } else {
37430
fd743dadef12 8151939: VM_Version_init() print buffer is too small
coleenp
parents: 36561
diff changeset
  1533
      log->print(" prefetching: ");
9135
f76543993e9d 7035713: 3DNow Prefetch Instruction Support
kvn
parents: 8921
diff changeset
  1534
      if (UseSSE == 0 && supports_3dnow_prefetch()) {
37430
fd743dadef12 8151939: VM_Version_init() print buffer is too small
coleenp
parents: 36561
diff changeset
  1535
        log->print("PREFETCHW");
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1536
      } else if (UseSSE >= 1) {
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1537
        if (AllocatePrefetchInstr == 0) {
37430
fd743dadef12 8151939: VM_Version_init() print buffer is too small
coleenp
parents: 36561
diff changeset
  1538
          log->print("PREFETCHNTA");
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1539
        } else if (AllocatePrefetchInstr == 1) {
37430
fd743dadef12 8151939: VM_Version_init() print buffer is too small
coleenp
parents: 36561
diff changeset
  1540
          log->print("PREFETCHT0");
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1541
        } else if (AllocatePrefetchInstr == 2) {
37430
fd743dadef12 8151939: VM_Version_init() print buffer is too small
coleenp
parents: 36561
diff changeset
  1542
          log->print("PREFETCHT2");
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1543
        } else if (AllocatePrefetchInstr == 3) {
37430
fd743dadef12 8151939: VM_Version_init() print buffer is too small
coleenp
parents: 36561
diff changeset
  1544
          log->print("PREFETCHW");
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1545
        }
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1546
      }
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1547
      if (AllocatePrefetchLines > 1) {
37430
fd743dadef12 8151939: VM_Version_init() print buffer is too small
coleenp
parents: 36561
diff changeset
  1548
        log->print_cr(" at distance %d, %d lines of %d bytes", (int) AllocatePrefetchDistance, (int) AllocatePrefetchLines, (int) AllocatePrefetchStepSize);
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1549
      } else {
37430
fd743dadef12 8151939: VM_Version_init() print buffer is too small
coleenp
parents: 36561
diff changeset
  1550
        log->print_cr(" at distance %d, one line of %d bytes", (int) AllocatePrefetchDistance, (int) AllocatePrefetchStepSize);
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1551
      }
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1552
    }
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1553
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1554
    if (PrefetchCopyIntervalInBytes > 0) {
37430
fd743dadef12 8151939: VM_Version_init() print buffer is too small
coleenp
parents: 36561
diff changeset
  1555
      log->print_cr("PrefetchCopyIntervalInBytes %d", (int) PrefetchCopyIntervalInBytes);
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1556
    }
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1557
    if (PrefetchScanIntervalInBytes > 0) {
37430
fd743dadef12 8151939: VM_Version_init() print buffer is too small
coleenp
parents: 36561
diff changeset
  1558
      log->print_cr("PrefetchScanIntervalInBytes %d", (int) PrefetchScanIntervalInBytes);
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1559
    }
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1560
    if (PrefetchFieldsAhead > 0) {
37430
fd743dadef12 8151939: VM_Version_init() print buffer is too small
coleenp
parents: 36561
diff changeset
  1561
      log->print_cr("PrefetchFieldsAhead %d", (int) PrefetchFieldsAhead);
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1562
    }
15193
8e6b5694267f 8003985: Support @Contended Annotation - JEP 142
jwilhelm
parents: 14834
diff changeset
  1563
    if (ContendedPaddingWidth > 0) {
37430
fd743dadef12 8151939: VM_Version_init() print buffer is too small
coleenp
parents: 36561
diff changeset
  1564
      log->print_cr("ContendedPaddingWidth %d", (int) ContendedPaddingWidth);
15193
8e6b5694267f 8003985: Support @Contended Annotation - JEP 142
jwilhelm
parents: 14834
diff changeset
  1565
    }
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1566
  }
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1567
#endif // !PRODUCT
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1568
}
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1569
23491
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
  1570
bool VM_Version::use_biased_locking() {
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
  1571
#if INCLUDE_RTM_OPT
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
  1572
  // RTM locking is most useful when there is high lock contention and
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
  1573
  // low data contention.  With high lock contention the lock is usually
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
  1574
  // inflated and biased locking is not suitable for that case.
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
  1575
  // RTM locking code requires that biased locking is off.
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
  1576
  // Note: we can't switch off UseBiasedLocking in get_processor_features()
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
  1577
  // because it is used by Thread::allocate() which is called before
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
  1578
  // VM_Version::initialize().
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
  1579
  if (UseRTMLocking && UseBiasedLocking) {
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
  1580
    if (FLAG_IS_DEFAULT(UseBiasedLocking)) {
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
  1581
      FLAG_SET_DEFAULT(UseBiasedLocking, false);
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
  1582
    } else {
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
  1583
      warning("Biased locking is not supported with RTM locking; ignoring UseBiasedLocking flag." );
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
  1584
      UseBiasedLocking = false;
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
  1585
    }
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
  1586
  }
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
  1587
#endif
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
  1588
  return UseBiasedLocking;
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
  1589
}
f690330b10b9 8031320: Use Intel RTM instructions for locks
kvn
parents: 23487
diff changeset
  1590
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1591
void VM_Version::initialize() {
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1592
  ResourceMark rm;
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1593
  // Making this stub must be FIRST use of assembler
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1594
23527
397b6816032d 8038633: crash in VM_Version::get_processor_features() on startup
kvn
parents: 23491
diff changeset
  1595
  stub_blob = BufferBlob::create("get_cpu_info_stub", stub_size);
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1596
  if (stub_blob == NULL) {
23527
397b6816032d 8038633: crash in VM_Version::get_processor_features() on startup
kvn
parents: 23491
diff changeset
  1597
    vm_exit_during_initialization("Unable to allocate get_cpu_info_stub");
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1598
  }
6418
6671edbd230e 6978355: renaming for 6961697
twisti
parents: 6272
diff changeset
  1599
  CodeBuffer c(stub_blob);
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1600
  VM_Version_StubGenerator g(&c);
23527
397b6816032d 8038633: crash in VM_Version::get_processor_features() on startup
kvn
parents: 23491
diff changeset
  1601
  get_cpu_info_stub = CAST_TO_FN_PTR(get_cpu_info_stub_t,
397b6816032d 8038633: crash in VM_Version::get_processor_features() on startup
kvn
parents: 23491
diff changeset
  1602
                                     g.generate_get_cpu_info());
2111
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1603
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1604
  get_processor_features();
dab8a43dd738 6808589: Merge vm_version_x86_{32,64}.{cpp,hpp}
twisti
parents:
diff changeset
  1605
}